{"step": 1, "loss": 6.748, "grad_norm": "2.778e+02", "learning_rate": "0.000e+00", "dlm_loss": "5.125e+00", "anc_loss": "1.562e+01", "dlm_acc": "0.000e+00", "anc_acc": "1.421e-03", "epoch": 2e-06} {"step": 5, "loss": 8.2075, "grad_norm": "2.796e+02", "learning_rate": "8.000e-07", "dlm_loss": "5.453e+00", "anc_loss": "1.448e+01", "dlm_acc": "3.704e-04", "anc_acc": "2.054e-03", "epoch": 1e-05} {"step": 10, "loss": 7.5373, "grad_norm": "1.739e+02", "learning_rate": "1.800e-06", "dlm_loss": "6.381e+00", "anc_loss": "1.668e+01", "dlm_acc": "5.119e-04", "anc_acc": "2.737e-04", "epoch": 2e-05} {"step": 15, "loss": 6.7762, "grad_norm": "9.971e+01", "learning_rate": "2.800e-06", "dlm_loss": "5.403e+00", "anc_loss": "1.371e+01", "dlm_acc": "3.914e-02", "anc_acc": "3.633e-03", "epoch": 3e-05} {"step": 20, "loss": 5.9598, "grad_norm": "1.247e+02", "learning_rate": "3.800e-06", "dlm_loss": "4.678e+00", "anc_loss": "1.012e+01", "dlm_acc": "1.243e-02", "anc_acc": "2.365e-02", "epoch": 4e-05} {"step": 25, "loss": 4.7693, "grad_norm": "5.227e+01", "learning_rate": "4.800e-06", "dlm_loss": "2.930e+00", "anc_loss": "7.019e+00", "dlm_acc": "9.700e-02", "anc_acc": "5.707e-02", "epoch": 5e-05} {"step": 30, "loss": 4.6264, "grad_norm": "3.370e+01", "learning_rate": "5.800e-06", "dlm_loss": "1.997e+00", "anc_loss": "5.022e+00", "dlm_acc": "1.633e-01", "anc_acc": "1.092e-01", "epoch": 6e-05} {"step": 35, "loss": 4.6063, "grad_norm": "2.970e+01", "learning_rate": "6.800e-06", "dlm_loss": "3.938e+00", "anc_loss": "7.612e+00", "dlm_acc": "1.196e-01", "anc_acc": "1.433e-01", "epoch": 7e-05} {"step": 40, "loss": 4.6929, "grad_norm": "2.035e+01", "learning_rate": "7.800e-06", "dlm_loss": "4.144e+00", "anc_loss": "7.662e+00", "dlm_acc": "6.167e-02", "anc_acc": "7.607e-02", "epoch": 8e-05} {"step": 45, "loss": 4.1705, "grad_norm": "2.116e+01", "learning_rate": "8.800e-06", "dlm_loss": "4.341e+00", "anc_loss": "6.900e+00", "dlm_acc": "2.535e-02", "anc_acc": "7.241e-02", "epoch": 9e-05} {"step": 50, "loss": 4.0354, "grad_norm": "1.008e+01", "learning_rate": "9.800e-06", "dlm_loss": "2.844e+00", "anc_loss": "4.159e+00", "dlm_acc": "1.006e-01", "anc_acc": "1.904e-01", "epoch": 0.0001} {"step": 55, "loss": 4.0526, "grad_norm": "1.556e+01", "learning_rate": "1.080e-05", "dlm_loss": "2.752e+00", "anc_loss": "3.622e+00", "dlm_acc": "1.773e-01", "anc_acc": "2.151e-01", "epoch": 0.00011} {"step": 60, "loss": 3.8849, "grad_norm": "8.974e+00", "learning_rate": "1.180e-05", "dlm_loss": "3.178e+00", "anc_loss": "4.050e+00", "dlm_acc": "8.027e-02", "anc_acc": "1.085e-01", "epoch": 0.00012} {"step": 65, "loss": 3.6017, "grad_norm": "7.899e+00", "learning_rate": "1.280e-05", "dlm_loss": "2.833e+00", "anc_loss": "3.487e+00", "dlm_acc": "9.805e-02", "anc_acc": "1.193e-01", "epoch": 0.00013} {"step": 70, "loss": 2.8929, "grad_norm": "7.062e+00", "learning_rate": "1.380e-05", "dlm_loss": "2.859e+00", "anc_loss": "3.447e+00", "dlm_acc": "1.158e-01", "anc_acc": "1.538e-01", "epoch": 0.00014} {"step": 75, "loss": 3.0119, "grad_norm": "5.400e+00", "learning_rate": "1.480e-05", "dlm_loss": "2.021e+00", "anc_loss": "2.346e+00", "dlm_acc": "2.872e-01", "anc_acc": "3.156e-01", "epoch": 0.00015} {"step": 80, "loss": 2.1308, "grad_norm": "1.033e+01", "learning_rate": "1.580e-05", "dlm_loss": "1.702e+00", "anc_loss": "2.036e+00", "dlm_acc": "3.126e-01", "anc_acc": "3.188e-01", "epoch": 0.00016} {"step": 85, "loss": 2.1919, "grad_norm": "5.982e+00", "learning_rate": "1.680e-05", "dlm_loss": "1.712e+00", "anc_loss": "2.072e+00", "dlm_acc": "3.135e-01", "anc_acc": "3.067e-01", "epoch": 0.00017} {"step": 90, "loss": 2.8741, "grad_norm": "4.344e+00", "learning_rate": "1.780e-05", "dlm_loss": "2.763e+00", "anc_loss": "3.269e+00", "dlm_acc": "1.929e-01", "anc_acc": "2.065e-01", "epoch": 0.00018} {"step": 95, "loss": 2.7445, "grad_norm": "5.089e+00", "learning_rate": "1.880e-05", "dlm_loss": "2.452e+00", "anc_loss": "2.780e+00", "dlm_acc": "2.422e-01", "anc_acc": "2.605e-01", "epoch": 0.00019} {"step": 100, "loss": 2.8585, "grad_norm": "6.366e+00", "learning_rate": "1.980e-05", "dlm_loss": "2.163e+00", "anc_loss": "2.438e+00", "dlm_acc": "2.404e-01", "anc_acc": "2.585e-01", "epoch": 0.0002} {"step": 105, "loss": 2.8183, "grad_norm": "4.183e+00", "learning_rate": "2.080e-05", "dlm_loss": "2.644e+00", "anc_loss": "3.034e+00", "dlm_acc": "2.019e-01", "anc_acc": "2.051e-01", "epoch": 0.00021} {"step": 110, "loss": 2.286, "grad_norm": "3.924e+00", "learning_rate": "2.180e-05", "dlm_loss": "2.862e+00", "anc_loss": "3.241e+00", "dlm_acc": "2.098e-01", "anc_acc": "2.174e-01", "epoch": 0.00022} {"step": 115, "loss": 2.1827, "grad_norm": "7.572e+00", "learning_rate": "2.280e-05", "dlm_loss": "1.214e+00", "anc_loss": "1.401e+00", "dlm_acc": "3.281e-01", "anc_acc": "3.308e-01", "epoch": 0.00023} {"step": 120, "loss": 1.8003, "grad_norm": "2.881e+00", "learning_rate": "2.380e-05", "dlm_loss": "1.304e+00", "anc_loss": "1.458e+00", "dlm_acc": "3.556e-01", "anc_acc": "3.624e-01", "epoch": 0.00024} {"step": 125, "loss": 1.7177, "grad_norm": "4.071e+00", "learning_rate": "2.480e-05", "dlm_loss": "9.070e-01", "anc_loss": "1.012e+00", "dlm_acc": "3.755e-01", "anc_acc": "3.739e-01", "epoch": 0.00025} {"step": 130, "loss": 1.6392, "grad_norm": "7.596e+00", "learning_rate": "2.580e-05", "dlm_loss": "8.063e-01", "anc_loss": "9.148e-01", "dlm_acc": "4.525e-01", "anc_acc": "4.465e-01", "epoch": 0.00026} {"step": 135, "loss": 2.2424, "grad_norm": "5.033e+00", "learning_rate": "2.680e-05", "dlm_loss": "1.744e+00", "anc_loss": "1.945e+00", "dlm_acc": "3.008e-01", "anc_acc": "3.056e-01", "epoch": 0.00027} {"step": 140, "loss": 2.0034, "grad_norm": "5.298e+00", "learning_rate": "2.780e-05", "dlm_loss": "2.316e+00", "anc_loss": "2.573e+00", "dlm_acc": "2.694e-01", "anc_acc": "2.738e-01", "epoch": 0.00028} {"step": 145, "loss": 1.8367, "grad_norm": "4.400e+00", "learning_rate": "2.880e-05", "dlm_loss": "1.682e+00", "anc_loss": "1.897e+00", "dlm_acc": "4.331e-01", "anc_acc": "4.389e-01", "epoch": 0.00029} {"step": 150, "loss": 1.9913, "grad_norm": "4.373e+00", "learning_rate": "2.980e-05", "dlm_loss": "7.082e-01", "anc_loss": "7.523e-01", "dlm_acc": "5.299e-01", "anc_acc": "5.286e-01", "epoch": 0.0003} {"step": 155, "loss": 2.1308, "grad_norm": "4.955e+00", "learning_rate": "3.080e-05", "dlm_loss": "6.535e-01", "anc_loss": "7.070e-01", "dlm_acc": "5.843e-01", "anc_acc": "5.811e-01", "epoch": 0.00031} {"step": 160, "loss": 1.6695, "grad_norm": "4.391e+00", "learning_rate": "3.180e-05", "dlm_loss": "5.262e-01", "anc_loss": "5.680e-01", "dlm_acc": "6.436e-01", "anc_acc": "6.425e-01", "epoch": 0.00032} {"step": 165, "loss": 1.8265, "grad_norm": "5.808e+00", "learning_rate": "3.280e-05", "dlm_loss": "6.867e-01", "anc_loss": "7.336e-01", "dlm_acc": "5.964e-01", "anc_acc": "5.926e-01", "epoch": 0.00033} {"step": 170, "loss": 1.497, "grad_norm": "4.559e+00", "learning_rate": "3.380e-05", "dlm_loss": "4.914e-01", "anc_loss": "5.145e-01", "dlm_acc": "6.666e-01", "anc_acc": "6.661e-01", "epoch": 0.00034} {"step": 175, "loss": 1.2901, "grad_norm": "2.505e+00", "learning_rate": "3.480e-05", "dlm_loss": "5.918e-01", "anc_loss": "6.301e-01", "dlm_acc": "5.979e-01", "anc_acc": "5.969e-01", "epoch": 0.00035} {"step": 180, "loss": 1.0904, "grad_norm": "3.134e+00", "learning_rate": "3.580e-05", "dlm_loss": "5.164e-01", "anc_loss": "5.555e-01", "dlm_acc": "5.931e-01", "anc_acc": "5.908e-01", "epoch": 0.00036} {"step": 185, "loss": 1.753, "grad_norm": "3.424e+00", "learning_rate": "3.680e-05", "dlm_loss": "1.632e+00", "anc_loss": "1.759e+00", "dlm_acc": "3.676e-01", "anc_acc": "3.725e-01", "epoch": 0.00037} {"step": 190, "loss": 2.0564, "grad_norm": "3.737e+00", "learning_rate": "3.780e-05", "dlm_loss": "8.273e-01", "anc_loss": "8.633e-01", "dlm_acc": "4.646e-01", "anc_acc": "4.656e-01", "epoch": 0.00038} {"step": 195, "loss": 1.811, "grad_norm": "2.498e+00", "learning_rate": "3.880e-05", "dlm_loss": "6.961e-01", "anc_loss": "7.109e-01", "dlm_acc": "5.270e-01", "anc_acc": "5.322e-01", "epoch": 0.00039} {"step": 200, "loss": 1.833, "grad_norm": "2.522e+00", "learning_rate": "3.980e-05", "dlm_loss": "6.570e-01", "anc_loss": "6.859e-01", "dlm_acc": "5.597e-01", "anc_acc": "5.592e-01", "epoch": 0.0004} {"step": 205, "loss": 1.0257, "grad_norm": "2.814e+00", "learning_rate": "4.080e-05", "dlm_loss": "5.891e-01", "anc_loss": "6.082e-01", "dlm_acc": "5.454e-01", "anc_acc": "5.459e-01", "epoch": 0.00041} {"step": 210, "loss": 1.6625, "grad_norm": "3.394e+00", "learning_rate": "4.180e-05", "dlm_loss": "1.452e+00", "anc_loss": "1.578e+00", "dlm_acc": "3.809e-01", "anc_acc": "3.824e-01", "epoch": 0.00042} {"step": 215, "loss": 1.6146, "grad_norm": "1.903e+00", "learning_rate": "4.280e-05", "dlm_loss": "7.414e-01", "anc_loss": "7.625e-01", "dlm_acc": "4.872e-01", "anc_acc": "4.882e-01", "epoch": 0.00043} {"step": 220, "loss": 1.5846, "grad_norm": "2.389e+00", "learning_rate": "4.380e-05", "dlm_loss": "7.375e-01", "anc_loss": "7.602e-01", "dlm_acc": "4.885e-01", "anc_acc": "4.868e-01", "epoch": 0.00044} {"step": 225, "loss": 1.4142, "grad_norm": "2.633e+00", "learning_rate": "4.480e-05", "dlm_loss": "7.773e-01", "anc_loss": "8.039e-01", "dlm_acc": "4.869e-01", "anc_acc": "4.889e-01", "epoch": 0.00045} {"step": 230, "loss": 1.0505, "grad_norm": "2.716e+00", "learning_rate": "4.580e-05", "dlm_loss": "5.832e-01", "anc_loss": "5.984e-01", "dlm_acc": "5.179e-01", "anc_acc": "5.205e-01", "epoch": 0.00046} {"step": 235, "loss": 1.3013, "grad_norm": "2.690e+00", "learning_rate": "4.680e-05", "dlm_loss": "8.797e-01", "anc_loss": "8.992e-01", "dlm_acc": "4.711e-01", "anc_acc": "4.722e-01", "epoch": 0.00047} {"step": 240, "loss": 1.8134, "grad_norm": "2.621e+00", "learning_rate": "4.780e-05", "dlm_loss": "1.955e+00", "anc_loss": "2.050e+00", "dlm_acc": "3.306e-01", "anc_acc": "3.312e-01", "epoch": 0.00048} {"step": 245, "loss": 1.2751, "grad_norm": "5.705e+00", "learning_rate": "4.880e-05", "dlm_loss": "1.413e+00", "anc_loss": "1.477e+00", "dlm_acc": "4.735e-01", "anc_acc": "4.727e-01", "epoch": 0.00049} {"step": 250, "loss": 1.2917, "grad_norm": "1.779e+00", "learning_rate": "4.980e-05", "dlm_loss": "5.195e-01", "anc_loss": "5.328e-01", "dlm_acc": "6.402e-01", "anc_acc": "6.420e-01", "epoch": 0.0005} {"step": 255, "loss": 1.2395, "grad_norm": "1.938e+00", "learning_rate": "5.080e-05", "dlm_loss": "4.555e-01", "anc_loss": "4.715e-01", "dlm_acc": "6.704e-01", "anc_acc": "6.711e-01", "epoch": 0.00051} {"step": 260, "loss": 1.5366, "grad_norm": "1.336e+00", "learning_rate": "5.180e-05", "dlm_loss": "1.191e+00", "anc_loss": "1.258e+00", "dlm_acc": "5.341e-01", "anc_acc": "5.317e-01", "epoch": 0.00052} {"step": 265, "loss": 1.5696, "grad_norm": "1.391e+00", "learning_rate": "5.280e-05", "dlm_loss": "1.925e+00", "anc_loss": "2.036e+00", "dlm_acc": "3.503e-01", "anc_acc": "3.519e-01", "epoch": 0.00053} {"step": 270, "loss": 1.9119, "grad_norm": "2.736e+00", "learning_rate": "5.380e-05", "dlm_loss": "1.991e+00", "anc_loss": "2.078e+00", "dlm_acc": "2.952e-01", "anc_acc": "2.948e-01", "epoch": 0.00054} {"step": 275, "loss": 1.882, "grad_norm": "4.641e+00", "learning_rate": "5.480e-05", "dlm_loss": "2.042e+00", "anc_loss": "2.159e+00", "dlm_acc": "3.549e-01", "anc_acc": "3.524e-01", "epoch": 0.00055} {"step": 280, "loss": 2.3671, "grad_norm": "3.717e+00", "learning_rate": "5.580e-05", "dlm_loss": "2.663e+00", "anc_loss": "2.769e+00", "dlm_acc": "2.827e-01", "anc_acc": "2.830e-01", "epoch": 0.00056} {"step": 285, "loss": 2.1447, "grad_norm": "4.438e+00", "learning_rate": "5.680e-05", "dlm_loss": "2.331e+00", "anc_loss": "2.445e+00", "dlm_acc": "3.280e-01", "anc_acc": "3.273e-01", "epoch": 0.00057} {"step": 290, "loss": 1.5994, "grad_norm": "5.270e+00", "learning_rate": "5.780e-05", "dlm_loss": "1.877e+00", "anc_loss": "1.909e+00", "dlm_acc": "3.160e-01", "anc_acc": "3.308e-01", "epoch": 0.00058} {"step": 295, "loss": 1.6759, "grad_norm": "4.114e+00", "learning_rate": "5.880e-05", "dlm_loss": "1.719e+00", "anc_loss": "1.819e+00", "dlm_acc": "4.268e-01", "anc_acc": "4.246e-01", "epoch": 0.00059} {"step": 300, "loss": 1.541, "grad_norm": "3.829e+00", "learning_rate": "5.980e-05", "dlm_loss": "1.680e+00", "anc_loss": "1.778e+00", "dlm_acc": "3.892e-01", "anc_acc": "3.877e-01", "epoch": 0.0006} {"step": 305, "loss": 1.328, "grad_norm": "4.707e+00", "learning_rate": "6.080e-05", "dlm_loss": "1.856e+00", "anc_loss": "1.942e+00", "dlm_acc": "3.799e-01", "anc_acc": "3.739e-01", "epoch": 0.00061} {"step": 310, "loss": 1.3922, "grad_norm": "1.093e+00", "learning_rate": "6.180e-05", "dlm_loss": "1.028e+00", "anc_loss": "1.098e+00", "dlm_acc": "5.617e-01", "anc_acc": "5.598e-01", "epoch": 0.00062} {"step": 315, "loss": 1.9144, "grad_norm": "2.727e+00", "learning_rate": "6.280e-05", "dlm_loss": "2.266e+00", "anc_loss": "2.367e+00", "dlm_acc": "3.492e-01", "anc_acc": "3.489e-01", "epoch": 0.00063} {"step": 320, "loss": 2.1842, "grad_norm": "2.061e+00", "learning_rate": "6.380e-05", "dlm_loss": "2.531e+00", "anc_loss": "2.650e+00", "dlm_acc": "2.837e-01", "anc_acc": "2.801e-01", "epoch": 0.00064} {"step": 325, "loss": 1.5908, "grad_norm": "1.667e+00", "learning_rate": "6.480e-05", "dlm_loss": "1.996e+00", "anc_loss": "2.084e+00", "dlm_acc": "3.838e-01", "anc_acc": "3.813e-01", "epoch": 0.00065} {"step": 330, "loss": 1.7833, "grad_norm": "4.941e+00", "learning_rate": "6.580e-05", "dlm_loss": "2.136e+00", "anc_loss": "2.252e+00", "dlm_acc": "3.558e-01", "anc_acc": "3.523e-01", "epoch": 0.00066} {"step": 335, "loss": 1.3164, "grad_norm": "2.808e+00", "learning_rate": "6.680e-05", "dlm_loss": "2.025e+00", "anc_loss": "2.125e+00", "dlm_acc": "3.627e-01", "anc_acc": "3.602e-01", "epoch": 0.00067} {"step": 340, "loss": 1.8352, "grad_norm": "2.100e+00", "learning_rate": "6.780e-05", "dlm_loss": "1.883e+00", "anc_loss": "1.965e+00", "dlm_acc": "3.944e-01", "anc_acc": "3.925e-01", "epoch": 0.00068} {"step": 345, "loss": 1.7194, "grad_norm": "1.285e+00", "learning_rate": "6.880e-05", "dlm_loss": "1.881e+00", "anc_loss": "1.977e+00", "dlm_acc": "3.622e-01", "anc_acc": "3.626e-01", "epoch": 0.00069} {"step": 350, "loss": 1.4778, "grad_norm": "3.038e+00", "learning_rate": "6.980e-05", "dlm_loss": "1.408e+00", "anc_loss": "1.454e+00", "dlm_acc": "3.538e-01", "anc_acc": "3.545e-01", "epoch": 0.0007} {"step": 355, "loss": 2.3491, "grad_norm": "1.441e+00", "learning_rate": "7.080e-05", "dlm_loss": "2.475e+00", "anc_loss": "2.572e+00", "dlm_acc": "2.877e-01", "anc_acc": "2.867e-01", "epoch": 0.00071} {"step": 360, "loss": 1.6639, "grad_norm": "1.809e+00", "learning_rate": "7.180e-05", "dlm_loss": "1.798e+00", "anc_loss": "1.881e+00", "dlm_acc": "3.574e-01", "anc_acc": "3.596e-01", "epoch": 0.00072} {"step": 365, "loss": 1.5497, "grad_norm": "3.772e+00", "learning_rate": "7.280e-05", "dlm_loss": "1.900e+00", "anc_loss": "1.959e+00", "dlm_acc": "3.222e-01", "anc_acc": "3.336e-01", "epoch": 0.00073} {"step": 370, "loss": 1.7059, "grad_norm": "5.035e+00", "learning_rate": "7.380e-05", "dlm_loss": "1.710e+00", "anc_loss": "1.785e+00", "dlm_acc": "3.843e-01", "anc_acc": "3.856e-01", "epoch": 0.00074} {"step": 375, "loss": 1.9277, "grad_norm": "2.990e+00", "learning_rate": "7.480e-05", "dlm_loss": "1.997e+00", "anc_loss": "2.094e+00", "dlm_acc": "3.079e-01", "anc_acc": "3.064e-01", "epoch": 0.00075} {"step": 380, "loss": 2.0333, "grad_norm": "2.154e+00", "learning_rate": "7.580e-05", "dlm_loss": "1.905e+00", "anc_loss": "2.003e+00", "dlm_acc": "3.646e-01", "anc_acc": "3.538e-01", "epoch": 0.00076} {"step": 385, "loss": 1.8943, "grad_norm": "2.277e+00", "learning_rate": "7.680e-05", "dlm_loss": "1.678e+00", "anc_loss": "1.758e+00", "dlm_acc": "3.374e-01", "anc_acc": "3.394e-01", "epoch": 0.00077} {"step": 390, "loss": 2.0417, "grad_norm": "1.315e+00", "learning_rate": "7.780e-05", "dlm_loss": "1.898e+00", "anc_loss": "1.992e+00", "dlm_acc": "3.830e-01", "anc_acc": "3.812e-01", "epoch": 0.00078} {"step": 395, "loss": 2.3782, "grad_norm": "2.221e+00", "learning_rate": "7.880e-05", "dlm_loss": "2.139e+00", "anc_loss": "2.219e+00", "dlm_acc": "3.269e-01", "anc_acc": "3.269e-01", "epoch": 0.00079} {"step": 400, "loss": 1.366, "grad_norm": "2.191e+00", "learning_rate": "7.980e-05", "dlm_loss": "1.080e+00", "anc_loss": "1.131e+00", "dlm_acc": "4.812e-01", "anc_acc": "4.837e-01", "epoch": 0.0008} {"step": 405, "loss": 1.665, "grad_norm": "2.266e+00", "learning_rate": "8.080e-05", "dlm_loss": "1.568e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.482e-01", "anc_acc": "4.482e-01", "epoch": 0.00081} {"step": 410, "loss": 1.9757, "grad_norm": "1.998e+00", "learning_rate": "8.180e-05", "dlm_loss": "1.870e+00", "anc_loss": "1.972e+00", "dlm_acc": "4.313e-01", "anc_acc": "4.284e-01", "epoch": 0.00082} {"step": 415, "loss": 1.7123, "grad_norm": "1.356e+00", "learning_rate": "8.280e-05", "dlm_loss": "1.931e+00", "anc_loss": "2.062e+00", "dlm_acc": "3.683e-01", "anc_acc": "3.676e-01", "epoch": 0.00083} {"step": 420, "loss": 1.9249, "grad_norm": "1.630e+00", "learning_rate": "8.380e-05", "dlm_loss": "2.323e+00", "anc_loss": "2.377e+00", "dlm_acc": "1.298e-01", "anc_acc": "1.272e-01", "epoch": 0.00084} {"step": 425, "loss": 2.6002, "grad_norm": "1.852e+00", "learning_rate": "8.480e-05", "dlm_loss": "3.031e+00", "anc_loss": "3.081e+00", "dlm_acc": "2.555e-02", "anc_acc": "2.348e-02", "epoch": 0.00085} {"step": 430, "loss": 2.368, "grad_norm": "1.977e+00", "learning_rate": "8.580e-05", "dlm_loss": "2.962e+00", "anc_loss": "3.009e+00", "dlm_acc": "2.498e-02", "anc_acc": "2.159e-02", "epoch": 0.00086} {"step": 435, "loss": 2.3416, "grad_norm": "1.580e+00", "learning_rate": "8.680e-05", "dlm_loss": "2.866e+00", "anc_loss": "2.903e+00", "dlm_acc": "2.572e-02", "anc_acc": "2.296e-02", "epoch": 0.00087} {"step": 440, "loss": 2.1791, "grad_norm": "2.438e+00", "learning_rate": "8.780e-05", "dlm_loss": "2.191e+00", "anc_loss": "2.225e+00", "dlm_acc": "1.775e-01", "anc_acc": "1.766e-01", "epoch": 0.00088} {"step": 445, "loss": 2.3901, "grad_norm": "2.402e+00", "learning_rate": "8.880e-05", "dlm_loss": "2.173e+00", "anc_loss": "2.245e+00", "dlm_acc": "3.518e-01", "anc_acc": "3.508e-01", "epoch": 0.00089} {"step": 450, "loss": 1.7727, "grad_norm": "2.547e+00", "learning_rate": "8.980e-05", "dlm_loss": "1.581e+00", "anc_loss": "1.659e+00", "dlm_acc": "4.442e-01", "anc_acc": "4.413e-01", "epoch": 0.0009} {"step": 455, "loss": 1.913, "grad_norm": "8.336e-01", "learning_rate": "9.080e-05", "dlm_loss": "1.614e+00", "anc_loss": "1.695e+00", "dlm_acc": "4.257e-01", "anc_acc": "4.223e-01", "epoch": 0.00091} {"step": 460, "loss": 1.9914, "grad_norm": "1.270e+00", "learning_rate": "9.180e-05", "dlm_loss": "1.880e+00", "anc_loss": "1.947e+00", "dlm_acc": "3.804e-01", "anc_acc": "3.761e-01", "epoch": 0.00092} {"step": 465, "loss": 2.0089, "grad_norm": "2.950e+00", "learning_rate": "9.280e-05", "dlm_loss": "1.008e+00", "anc_loss": "1.031e+00", "dlm_acc": "5.064e-01", "anc_acc": "5.079e-01", "epoch": 0.00093} {"step": 470, "loss": 1.7042, "grad_norm": "1.898e+00", "learning_rate": "9.380e-05", "dlm_loss": "1.653e+00", "anc_loss": "1.727e+00", "dlm_acc": "4.666e-01", "anc_acc": "4.631e-01", "epoch": 0.00094} {"step": 475, "loss": 1.4318, "grad_norm": "2.230e+00", "learning_rate": "9.480e-05", "dlm_loss": "9.754e-01", "anc_loss": "9.362e-01", "dlm_acc": "6.483e-01", "anc_acc": "6.500e-01", "epoch": 0.00095} {"step": 480, "loss": 1.7378, "grad_norm": "3.002e+00", "learning_rate": "9.580e-05", "dlm_loss": "8.922e-01", "anc_loss": "9.445e-01", "dlm_acc": "6.742e-01", "anc_acc": "6.762e-01", "epoch": 0.00096} {"step": 485, "loss": 2.2595, "grad_norm": "2.672e+00", "learning_rate": "9.680e-05", "dlm_loss": "1.345e+00", "anc_loss": "1.418e+00", "dlm_acc": "5.580e-01", "anc_acc": "5.608e-01", "epoch": 0.00097} {"step": 490, "loss": 2.0863, "grad_norm": "2.265e+00", "learning_rate": "9.780e-05", "dlm_loss": "1.752e+00", "anc_loss": "1.809e+00", "dlm_acc": "4.039e-01", "anc_acc": "4.026e-01", "epoch": 0.00098} {"step": 495, "loss": 1.8137, "grad_norm": "2.973e+00", "learning_rate": "9.880e-05", "dlm_loss": "1.470e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.039e-01", "anc_acc": "5.014e-01", "epoch": 0.00099} {"step": 500, "loss": 1.6267, "grad_norm": "2.519e+00", "learning_rate": "9.980e-05", "dlm_loss": "1.777e+00", "anc_loss": "1.863e+00", "dlm_acc": "4.183e-01", "anc_acc": "4.185e-01", "epoch": 0.001} {"step": 505, "loss": 1.3922, "grad_norm": "2.065e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.213e+00", "anc_loss": "1.257e+00", "dlm_acc": "5.348e-01", "anc_acc": "5.391e-01", "epoch": 0.00101} {"step": 510, "loss": 2.1319, "grad_norm": "1.855e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.637e+00", "anc_loss": "1.678e+00", "dlm_acc": "3.554e-01", "anc_acc": "3.536e-01", "epoch": 0.00102} {"step": 515, "loss": 2.3858, "grad_norm": "2.234e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.897e+00", "anc_loss": "1.970e+00", "dlm_acc": "3.643e-01", "anc_acc": "3.628e-01", "epoch": 0.00103} {"step": 520, "loss": 1.9642, "grad_norm": "1.622e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.680e+00", "dlm_acc": "3.880e-01", "anc_acc": "3.817e-01", "epoch": 0.00104} {"step": 525, "loss": 1.6761, "grad_norm": "1.196e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.317e+00", "anc_loss": "1.377e+00", "dlm_acc": "4.382e-01", "anc_acc": "4.333e-01", "epoch": 0.00105} {"step": 530, "loss": 1.9357, "grad_norm": "9.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.730e+00", "anc_loss": "1.784e+00", "dlm_acc": "3.293e-01", "anc_acc": "3.249e-01", "epoch": 0.00106} {"step": 535, "loss": 2.0269, "grad_norm": "1.317e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.714e+00", "anc_loss": "1.789e+00", "dlm_acc": "4.017e-01", "anc_acc": "3.967e-01", "epoch": 0.00107} {"step": 540, "loss": 1.9689, "grad_norm": "1.541e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.895e+00", "anc_loss": "1.961e+00", "dlm_acc": "3.760e-01", "anc_acc": "3.719e-01", "epoch": 0.00108} {"step": 545, "loss": 2.0041, "grad_norm": "1.229e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.780e+00", "anc_loss": "1.836e+00", "dlm_acc": "3.755e-01", "anc_acc": "3.727e-01", "epoch": 0.00109} {"step": 550, "loss": 2.2539, "grad_norm": "1.911e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.798e+00", "anc_loss": "1.868e+00", "dlm_acc": "4.286e-01", "anc_acc": "4.264e-01", "epoch": 0.0011} {"step": 555, "loss": 1.9403, "grad_norm": "1.520e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.138e+00", "dlm_acc": "6.048e-01", "anc_acc": "6.026e-01", "epoch": 0.00111} {"step": 560, "loss": 1.974, "grad_norm": "1.408e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.734e+00", "anc_loss": "1.798e+00", "dlm_acc": "4.505e-01", "anc_acc": "4.469e-01", "epoch": 0.00112} {"step": 565, "loss": 1.5866, "grad_norm": "2.190e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.334e-01", "anc_loss": "9.611e-01", "dlm_acc": "6.567e-01", "anc_acc": "6.575e-01", "epoch": 0.00113} {"step": 570, "loss": 1.6934, "grad_norm": "7.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.712e-01", "epoch": 0.00114} {"step": 575, "loss": 1.9215, "grad_norm": "1.499e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.412e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.317e-01", "anc_acc": "5.306e-01", "epoch": 0.00115} {"step": 580, "loss": 2.1899, "grad_norm": "1.883e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.704e+00", "anc_loss": "1.759e+00", "dlm_acc": "4.758e-01", "anc_acc": "4.740e-01", "epoch": 0.00116} {"step": 585, "loss": 1.9951, "grad_norm": "1.441e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.539e+00", "anc_loss": "1.578e+00", "dlm_acc": "4.687e-01", "anc_acc": "4.695e-01", "epoch": 0.00117} {"step": 590, "loss": 1.1513, "grad_norm": "1.592e+00", "learning_rate": "1.000e-04", "dlm_loss": "3.535e-01", "anc_loss": "3.656e-01", "dlm_acc": "8.424e-01", "anc_acc": "8.422e-01", "epoch": 0.00118} {"step": 595, "loss": 1.0492, "grad_norm": "1.650e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.848e-02", "anc_loss": "9.019e-02", "dlm_acc": "9.358e-01", "anc_acc": "9.364e-01", "epoch": 0.00119} {"step": 600, "loss": 0.7498, "grad_norm": "1.944e+00", "learning_rate": "1.000e-04", "dlm_loss": "4.514e-02", "anc_loss": "4.734e-02", "dlm_acc": "9.726e-01", "anc_acc": "9.723e-01", "epoch": 0.0012} {"step": 605, "loss": 1.5819, "grad_norm": "1.487e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.470e-02", "anc_loss": "6.791e-02", "dlm_acc": "9.570e-01", "anc_acc": "9.555e-01", "epoch": 0.00121} {"step": 610, "loss": 1.5259, "grad_norm": "1.806e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.080e-02", "anc_loss": "9.302e-02", "dlm_acc": "9.485e-01", "anc_acc": "9.500e-01", "epoch": 0.00122} {"step": 615, "loss": 2.1094, "grad_norm": "1.014e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.991e+00", "anc_loss": "2.070e+00", "dlm_acc": "4.051e-01", "anc_acc": "4.009e-01", "epoch": 0.00123} {"step": 620, "loss": 1.4129, "grad_norm": "5.369e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.106e+00", "dlm_acc": "5.381e-01", "anc_acc": "5.385e-01", "epoch": 0.00124} {"step": 625, "loss": 1.9639, "grad_norm": "1.826e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.998e+00", "anc_loss": "2.055e+00", "dlm_acc": "3.856e-01", "anc_acc": "3.843e-01", "epoch": 0.00125} {"step": 630, "loss": 1.5906, "grad_norm": "7.662e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.243e+00", "dlm_acc": "3.819e-01", "anc_acc": "3.810e-01", "epoch": 0.00126} {"step": 635, "loss": 1.9948, "grad_norm": "2.321e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.820e+00", "anc_loss": "1.853e+00", "dlm_acc": "4.290e-01", "anc_acc": "4.276e-01", "epoch": 0.00127} {"step": 640, "loss": 1.5556, "grad_norm": "2.121e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.107e+00", "dlm_acc": "6.190e-01", "anc_acc": "6.227e-01", "epoch": 0.00128} {"step": 645, "loss": 2.2068, "grad_norm": "3.989e+01", "learning_rate": "1.000e-04", "dlm_loss": "2.017e+00", "anc_loss": "1.923e+00", "dlm_acc": "4.518e-01", "anc_acc": "4.576e-01", "epoch": 0.00129} {"step": 650, "loss": 1.2513, "grad_norm": "1.313e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.543e-01", "anc_loss": "9.973e-01", "dlm_acc": "6.242e-01", "anc_acc": "6.227e-01", "epoch": 0.0013} {"step": 655, "loss": 1.745, "grad_norm": "1.750e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.730e-01", "anc_loss": "1.001e+00", "dlm_acc": "5.304e-01", "anc_acc": "5.306e-01", "epoch": 0.00131} {"step": 660, "loss": 1.691, "grad_norm": "1.034e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.113e-01", "anc_loss": "8.406e-01", "dlm_acc": "6.683e-01", "anc_acc": "6.671e-01", "epoch": 0.00132} {"step": 665, "loss": 1.5535, "grad_norm": "8.874e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.404e+00", "dlm_acc": "4.747e-01", "anc_acc": "4.722e-01", "epoch": 0.00133} {"step": 670, "loss": 1.3478, "grad_norm": "1.026e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.536e+00", "anc_loss": "1.590e+00", "dlm_acc": "4.944e-01", "anc_acc": "4.926e-01", "epoch": 0.00134} {"step": 675, "loss": 1.3147, "grad_norm": "1.065e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.577e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.309e-01", "anc_acc": "4.294e-01", "epoch": 0.00135} {"step": 680, "loss": 1.1447, "grad_norm": "8.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.073e+00", "dlm_acc": "6.053e-01", "anc_acc": "6.063e-01", "epoch": 0.00136} {"step": 685, "loss": 1.2481, "grad_norm": "1.849e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.258e+00", "dlm_acc": "5.127e-01", "anc_acc": "5.106e-01", "epoch": 0.00137} {"step": 690, "loss": 1.6533, "grad_norm": "6.252e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.768e+00", "anc_loss": "1.825e+00", "dlm_acc": "4.743e-01", "anc_acc": "4.700e-01", "epoch": 0.00138} {"step": 695, "loss": 1.6888, "grad_norm": "1.049e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.675e+00", "anc_loss": "1.727e+00", "dlm_acc": "4.886e-01", "anc_acc": "4.852e-01", "epoch": 0.00139} {"step": 700, "loss": 1.5604, "grad_norm": "1.633e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.417e-01", "epoch": 0.0014} {"step": 705, "loss": 1.8408, "grad_norm": "1.368e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.430e+00", "dlm_acc": "4.933e-01", "anc_acc": "4.960e-01", "epoch": 0.00141} {"step": 710, "loss": 1.1962, "grad_norm": "9.960e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.242e-01", "anc_loss": "5.312e-01", "dlm_acc": "6.873e-01", "anc_acc": "6.851e-01", "epoch": 0.00142} {"step": 715, "loss": 1.6398, "grad_norm": "7.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.273e+00", "dlm_acc": "5.532e-01", "anc_acc": "5.519e-01", "epoch": 0.00143} {"step": 720, "loss": 1.4972, "grad_norm": "1.047e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.257e+00", "dlm_acc": "5.778e-01", "anc_acc": "5.780e-01", "epoch": 0.00144} {"step": 725, "loss": 1.9919, "grad_norm": "6.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.338e+00", "anc_loss": "1.360e+00", "dlm_acc": "2.800e-01", "anc_acc": "2.781e-01", "epoch": 0.00145} {"step": 730, "loss": 1.8404, "grad_norm": "2.088e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.137e+00", "dlm_acc": "3.042e-01", "anc_acc": "3.014e-01", "epoch": 0.00146} {"step": 735, "loss": 1.8464, "grad_norm": "1.546e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.217e+00", "dlm_acc": "3.123e-01", "anc_acc": "3.108e-01", "epoch": 0.00147} {"step": 740, "loss": 1.7105, "grad_norm": "7.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.378e+00", "anc_loss": "1.424e+00", "dlm_acc": "4.489e-01", "anc_acc": "4.469e-01", "epoch": 0.00148} {"step": 745, "loss": 2.0832, "grad_norm": "1.188e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.820e+00", "anc_loss": "1.880e+00", "dlm_acc": "4.337e-01", "anc_acc": "4.297e-01", "epoch": 0.00149} {"step": 750, "loss": 1.8637, "grad_norm": "1.067e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.368e-01", "anc_acc": "5.369e-01", "epoch": 0.0015} {"step": 755, "loss": 1.8456, "grad_norm": "1.191e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.209e+00", "anc_loss": "2.278e+00", "dlm_acc": "3.782e-01", "anc_acc": "3.767e-01", "epoch": 0.00151} {"step": 760, "loss": 1.5348, "grad_norm": "2.018e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.438e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.236e-01", "anc_acc": "5.174e-01", "epoch": 0.00152} {"step": 765, "loss": 1.8248, "grad_norm": "1.010e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.583e+00", "anc_loss": "1.641e+00", "dlm_acc": "4.785e-01", "anc_acc": "4.744e-01", "epoch": 0.00153} {"step": 770, "loss": 2.2573, "grad_norm": "1.027e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.064e+00", "anc_loss": "2.127e+00", "dlm_acc": "3.767e-01", "anc_acc": "3.737e-01", "epoch": 0.00154} {"step": 775, "loss": 1.7805, "grad_norm": "1.164e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.581e+00", "dlm_acc": "4.695e-01", "anc_acc": "4.645e-01", "epoch": 0.00155} {"step": 780, "loss": 1.68, "grad_norm": "3.231e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.714e+00", "anc_loss": "1.759e+00", "dlm_acc": "4.449e-01", "anc_acc": "4.410e-01", "epoch": 0.00156} {"step": 785, "loss": 1.6275, "grad_norm": "9.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.625e+00", "anc_loss": "1.691e+00", "dlm_acc": "4.853e-01", "anc_acc": "4.799e-01", "epoch": 0.00157} {"step": 790, "loss": 1.8112, "grad_norm": "1.025e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.686e+00", "anc_loss": "1.745e+00", "dlm_acc": "4.403e-01", "anc_acc": "4.348e-01", "epoch": 0.00158} {"step": 795, "loss": 1.8391, "grad_norm": "1.145e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.820e+00", "anc_loss": "1.879e+00", "dlm_acc": "4.171e-01", "anc_acc": "4.137e-01", "epoch": 0.00159} {"step": 800, "loss": 1.9928, "grad_norm": "1.409e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.872e+00", "anc_loss": "1.936e+00", "dlm_acc": "4.422e-01", "anc_acc": "4.376e-01", "epoch": 0.0016} {"step": 805, "loss": 1.6495, "grad_norm": "6.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.669e+00", "anc_loss": "1.720e+00", "dlm_acc": "4.394e-01", "anc_acc": "4.338e-01", "epoch": 0.00161} {"step": 810, "loss": 1.3165, "grad_norm": "9.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.505e+00", "dlm_acc": "4.658e-01", "anc_acc": "4.620e-01", "epoch": 0.00162} {"step": 815, "loss": 1.6328, "grad_norm": "8.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.811e+00", "anc_loss": "1.858e+00", "dlm_acc": "4.032e-01", "anc_acc": "3.991e-01", "epoch": 0.00163} {"step": 820, "loss": 1.397, "grad_norm": "9.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.600e+00", "anc_loss": "1.658e+00", "dlm_acc": "4.597e-01", "anc_acc": "4.563e-01", "epoch": 0.00164} {"step": 825, "loss": 1.4737, "grad_norm": "1.208e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.150e+00", "anc_loss": "2.214e+00", "dlm_acc": "3.688e-01", "anc_acc": "3.650e-01", "epoch": 0.00165} {"step": 830, "loss": 1.1172, "grad_norm": "1.290e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.449e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.030e-01", "anc_acc": "4.995e-01", "epoch": 0.00166} {"step": 835, "loss": 1.4709, "grad_norm": "8.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.943e-01", "anc_loss": "1.037e+00", "dlm_acc": "6.226e-01", "anc_acc": "6.189e-01", "epoch": 0.00167} {"step": 840, "loss": 2.0202, "grad_norm": "8.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.983e+00", "anc_loss": "2.044e+00", "dlm_acc": "4.074e-01", "anc_acc": "4.012e-01", "epoch": 0.00168} {"step": 845, "loss": 1.8692, "grad_norm": "8.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.808e+00", "anc_loss": "1.866e+00", "dlm_acc": "4.131e-01", "anc_acc": "4.084e-01", "epoch": 0.00169} {"step": 850, "loss": 2.2503, "grad_norm": "1.528e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.887e+00", "anc_loss": "1.942e+00", "dlm_acc": "4.568e-01", "anc_acc": "4.542e-01", "epoch": 0.0017} {"step": 855, "loss": 1.5567, "grad_norm": "9.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.463e+00", "dlm_acc": "5.051e-01", "anc_acc": "5.012e-01", "epoch": 0.00171} {"step": 860, "loss": 1.4192, "grad_norm": "7.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.322e+00", "dlm_acc": "5.021e-01", "anc_acc": "4.965e-01", "epoch": 0.00172} {"step": 865, "loss": 1.4132, "grad_norm": "7.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.201e+00", "dlm_acc": "5.190e-01", "anc_acc": "5.140e-01", "epoch": 0.00173} {"step": 870, "loss": 1.293, "grad_norm": "1.637e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.343e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.049e-01", "anc_acc": "5.000e-01", "epoch": 0.00174} {"step": 875, "loss": 1.9695, "grad_norm": "1.284e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.939e+00", "anc_loss": "1.991e+00", "dlm_acc": "4.054e-01", "anc_acc": "4.025e-01", "epoch": 0.00175} {"step": 880, "loss": 1.3078, "grad_norm": "7.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.311e+00", "dlm_acc": "5.188e-01", "anc_acc": "5.129e-01", "epoch": 0.00176} {"step": 885, "loss": 1.436, "grad_norm": "9.131e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.018e-01", "anc_acc": "4.954e-01", "epoch": 0.00177} {"step": 890, "loss": 1.8453, "grad_norm": "1.076e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.664e+00", "anc_loss": "1.717e+00", "dlm_acc": "4.593e-01", "anc_acc": "4.535e-01", "epoch": 0.00178} {"step": 895, "loss": 1.5139, "grad_norm": "1.026e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.085e-01", "anc_acc": "5.040e-01", "epoch": 0.00179} {"step": 900, "loss": 1.5708, "grad_norm": "8.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.595e+00", "dlm_acc": "4.652e-01", "anc_acc": "4.601e-01", "epoch": 0.0018} {"step": 905, "loss": 1.6487, "grad_norm": "1.088e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.953e+00", "anc_loss": "2.009e+00", "dlm_acc": "4.119e-01", "anc_acc": "4.072e-01", "epoch": 0.00181} {"step": 910, "loss": 1.4469, "grad_norm": "7.951e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.313e-01", "anc_acc": "5.268e-01", "epoch": 0.00182} {"step": 915, "loss": 1.4444, "grad_norm": "4.267e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.435e+00", "anc_loss": "1.483e+00", "dlm_acc": "4.783e-01", "anc_acc": "4.729e-01", "epoch": 0.00183} {"step": 920, "loss": 1.5594, "grad_norm": "7.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.648e+00", "anc_loss": "1.703e+00", "dlm_acc": "4.591e-01", "anc_acc": "4.541e-01", "epoch": 0.00184} {"step": 925, "loss": 1.5455, "grad_norm": "9.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.568e+00", "anc_loss": "1.620e+00", "dlm_acc": "4.523e-01", "anc_acc": "4.485e-01", "epoch": 0.00185} {"step": 930, "loss": 1.3229, "grad_norm": "1.103e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.590e-01", "anc_acc": "5.548e-01", "epoch": 0.00186} {"step": 935, "loss": 1.5363, "grad_norm": "8.639e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.673e+00", "anc_loss": "1.731e+00", "dlm_acc": "4.872e-01", "anc_acc": "4.836e-01", "epoch": 0.00187} {"step": 940, "loss": 1.5766, "grad_norm": "7.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.406e-01", "anc_acc": "5.363e-01", "epoch": 0.00188} {"step": 945, "loss": 1.6183, "grad_norm": "1.045e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.616e+00", "dlm_acc": "4.746e-01", "anc_acc": "4.682e-01", "epoch": 0.00189} {"step": 950, "loss": 1.3261, "grad_norm": "5.485e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.276e+00", "anc_loss": "1.318e+00", "dlm_acc": "5.330e-01", "anc_acc": "5.294e-01", "epoch": 0.0019} {"step": 955, "loss": 2.0677, "grad_norm": "9.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.169e+00", "anc_loss": "2.222e+00", "dlm_acc": "4.234e-01", "anc_acc": "4.181e-01", "epoch": 0.00191} {"step": 960, "loss": 1.8467, "grad_norm": "7.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.609e+00", "anc_loss": "1.648e+00", "dlm_acc": "4.300e-01", "anc_acc": "4.252e-01", "epoch": 0.00192} {"step": 965, "loss": 1.4678, "grad_norm": "8.263e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.577e+00", "dlm_acc": "4.052e-01", "anc_acc": "4.041e-01", "epoch": 0.00193} {"step": 970, "loss": 2.1063, "grad_norm": "1.189e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.417e+00", "anc_loss": "2.450e+00", "dlm_acc": "2.241e-01", "anc_acc": "2.240e-01", "epoch": 0.00194} {"step": 975, "loss": 1.5256, "grad_norm": "1.253e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.836e+00", "anc_loss": "1.883e+00", "dlm_acc": "4.156e-01", "anc_acc": "4.162e-01", "epoch": 0.00195} {"step": 980, "loss": 1.729, "grad_norm": "1.063e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.667e+00", "anc_loss": "1.709e+00", "dlm_acc": "4.075e-01", "anc_acc": "4.031e-01", "epoch": 0.00196} {"step": 985, "loss": 1.3246, "grad_norm": "1.004e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.516e-01", "anc_loss": "9.766e-01", "dlm_acc": "4.903e-01", "anc_acc": "4.868e-01", "epoch": 0.00197} {"step": 990, "loss": 1.9325, "grad_norm": "9.873e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.695e+00", "anc_loss": "1.736e+00", "dlm_acc": "3.818e-01", "anc_acc": "3.778e-01", "epoch": 0.00198} {"step": 995, "loss": 1.6963, "grad_norm": "8.227e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.412e+00", "anc_loss": "1.456e+00", "dlm_acc": "5.080e-01", "anc_acc": "5.042e-01", "epoch": 0.00199} {"step": 1000, "loss": 1.116, "grad_norm": "6.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e-01", "anc_loss": "1.533e-01", "dlm_acc": "9.146e-01", "anc_acc": "9.285e-01", "epoch": 0.002} {"step": 1005, "loss": 1.6513, "grad_norm": "6.161e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.495e+00", "dlm_acc": "4.839e-01", "anc_acc": "4.809e-01", "epoch": 0.00201} {"step": 1010, "loss": 1.1105, "grad_norm": "6.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.066e-01", "anc_acc": "5.053e-01", "epoch": 0.00202} {"step": 1015, "loss": 1.9702, "grad_norm": "1.374e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.539e+00", "dlm_acc": "4.633e-01", "anc_acc": "4.583e-01", "epoch": 0.00203} {"step": 1020, "loss": 1.5813, "grad_norm": "1.019e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.258e-01", "anc_acc": "5.225e-01", "epoch": 0.00204} {"step": 1025, "loss": 1.5826, "grad_norm": "1.131e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.492e+00", "anc_loss": "1.556e+00", "dlm_acc": "4.241e-01", "anc_acc": "4.135e-01", "epoch": 0.00205} {"step": 1030, "loss": 1.3324, "grad_norm": "8.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.411e+00", "dlm_acc": "4.637e-01", "anc_acc": "4.522e-01", "epoch": 0.00206} {"step": 1035, "loss": 1.4674, "grad_norm": "6.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.218e-01", "anc_acc": "5.152e-01", "epoch": 0.00207} {"step": 1040, "loss": 1.804, "grad_norm": "9.347e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.183e+00", "anc_loss": "2.231e+00", "dlm_acc": "3.166e-01", "anc_acc": "3.155e-01", "epoch": 0.00208} {"step": 1045, "loss": 1.6006, "grad_norm": "1.147e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.549e+00", "anc_loss": "1.585e+00", "dlm_acc": "4.548e-01", "anc_acc": "4.536e-01", "epoch": 0.00209} {"step": 1050, "loss": 1.493, "grad_norm": "1.009e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.455e+00", "dlm_acc": "4.775e-01", "anc_acc": "4.757e-01", "epoch": 0.0021} {"step": 1055, "loss": 1.6802, "grad_norm": "8.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.887e+00", "anc_loss": "1.941e+00", "dlm_acc": "3.799e-01", "anc_acc": "3.763e-01", "epoch": 0.00211} {"step": 1060, "loss": 1.8553, "grad_norm": "5.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.989e+00", "anc_loss": "2.036e+00", "dlm_acc": "3.840e-01", "anc_acc": "3.814e-01", "epoch": 0.00212} {"step": 1065, "loss": 2.2348, "grad_norm": "1.078e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.334e+00", "anc_loss": "2.392e+00", "dlm_acc": "3.463e-01", "anc_acc": "3.432e-01", "epoch": 0.00213} {"step": 1070, "loss": 1.214, "grad_norm": "3.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.208e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.431e-01", "epoch": 0.00214} {"step": 1075, "loss": 1.3294, "grad_norm": "7.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.398e+00", "dlm_acc": "4.152e-01", "anc_acc": "4.125e-01", "epoch": 0.00215} {"step": 1080, "loss": 1.2669, "grad_norm": "6.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.324e-01", "anc_loss": "7.766e-01", "dlm_acc": "6.974e-01", "anc_acc": "6.894e-01", "epoch": 0.00216} {"step": 1085, "loss": 1.4141, "grad_norm": "1.209e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.484e-01", "anc_acc": "5.423e-01", "epoch": 0.00217} {"step": 1090, "loss": 1.0441, "grad_norm": "6.616e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.133e-01", "anc_loss": "9.539e-01", "dlm_acc": "6.129e-01", "anc_acc": "6.089e-01", "epoch": 0.00218} {"step": 1095, "loss": 1.4063, "grad_norm": "8.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.459e+00", "dlm_acc": "4.941e-01", "anc_acc": "4.904e-01", "epoch": 0.00219} {"step": 1100, "loss": 1.4551, "grad_norm": "9.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.470e+00", "dlm_acc": "4.637e-01", "anc_acc": "4.584e-01", "epoch": 0.0022} {"step": 1105, "loss": 1.3136, "grad_norm": "8.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.678e+00", "anc_loss": "1.730e+00", "dlm_acc": "4.415e-01", "anc_acc": "4.390e-01", "epoch": 0.00221} {"step": 1110, "loss": 1.5814, "grad_norm": "1.060e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.257e+00", "dlm_acc": "5.166e-01", "anc_acc": "5.135e-01", "epoch": 0.00222} {"step": 1115, "loss": 1.321, "grad_norm": "5.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.324e+00", "dlm_acc": "4.873e-01", "anc_acc": "4.822e-01", "epoch": 0.00223} {"step": 1120, "loss": 1.273, "grad_norm": "5.234e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.949e-01", "anc_loss": "9.285e-01", "dlm_acc": "6.351e-01", "anc_acc": "6.314e-01", "epoch": 0.00224} {"step": 1125, "loss": 0.9576, "grad_norm": "4.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.732e-01", "anc_loss": "4.980e-01", "dlm_acc": "7.329e-01", "anc_acc": "7.291e-01", "epoch": 0.00225} {"step": 1130, "loss": 1.4665, "grad_norm": "5.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.703e-01", "anc_loss": "9.688e-01", "dlm_acc": "5.823e-01", "anc_acc": "5.831e-01", "epoch": 0.00226} {"step": 1135, "loss": 1.8438, "grad_norm": "7.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.482e+00", "anc_loss": "1.520e+00", "dlm_acc": "4.527e-01", "anc_acc": "4.493e-01", "epoch": 0.00227} {"step": 1140, "loss": 1.4904, "grad_norm": "1.123e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.068e+00", "anc_loss": "1.086e+00", "dlm_acc": "4.252e-01", "anc_acc": "4.193e-01", "epoch": 0.00228} {"step": 1145, "loss": 1.418, "grad_norm": "5.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.229e+00", "dlm_acc": "4.603e-01", "anc_acc": "4.553e-01", "epoch": 0.00229} {"step": 1150, "loss": 2.1647, "grad_norm": "1.499e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.309e+00", "anc_loss": "2.345e+00", "dlm_acc": "3.265e-01", "anc_acc": "3.227e-01", "epoch": 0.0023} {"step": 1155, "loss": 1.5516, "grad_norm": "9.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.837e+00", "anc_loss": "1.887e+00", "dlm_acc": "4.139e-01", "anc_acc": "4.097e-01", "epoch": 0.00231} {"step": 1160, "loss": 1.2828, "grad_norm": "7.328e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.411e+00", "dlm_acc": "4.967e-01", "anc_acc": "4.960e-01", "epoch": 0.00232} {"step": 1165, "loss": 1.713, "grad_norm": "4.969e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.730e+00", "anc_loss": "1.772e+00", "dlm_acc": "4.347e-01", "anc_acc": "4.308e-01", "epoch": 0.00233} {"step": 1170, "loss": 1.5038, "grad_norm": "8.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.299e+00", "anc_loss": "1.368e+00", "dlm_acc": "4.544e-01", "anc_acc": "4.469e-01", "epoch": 0.00234} {"step": 1175, "loss": 2.1723, "grad_norm": "1.050e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.971e+00", "anc_loss": "2.023e+00", "dlm_acc": "4.232e-01", "anc_acc": "4.259e-01", "epoch": 0.00235} {"step": 1180, "loss": 1.7406, "grad_norm": "4.603e+01", "learning_rate": "1.000e-04", "dlm_loss": "1.719e+00", "anc_loss": "1.722e+00", "dlm_acc": "4.478e-01", "anc_acc": "4.440e-01", "epoch": 0.00236} {"step": 1185, "loss": 1.0494, "grad_norm": "1.180e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.156e+00", "dlm_acc": "5.469e-01", "anc_acc": "5.412e-01", "epoch": 0.00237} {"step": 1190, "loss": 1.6408, "grad_norm": "2.721e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.114e+00", "anc_loss": "2.159e+00", "dlm_acc": "3.926e-01", "anc_acc": "3.903e-01", "epoch": 0.00238} {"step": 1195, "loss": 1.1834, "grad_norm": "5.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.559e+00", "anc_loss": "1.608e+00", "dlm_acc": "4.550e-01", "anc_acc": "4.514e-01", "epoch": 0.00239} {"step": 1200, "loss": 1.2166, "grad_norm": "6.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.349e+00", "anc_loss": "1.394e+00", "dlm_acc": "4.848e-01", "anc_acc": "4.814e-01", "epoch": 0.0024} {"step": 1205, "loss": 1.7315, "grad_norm": "8.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.431e+00", "dlm_acc": "5.057e-01", "anc_acc": "5.019e-01", "epoch": 0.00241} {"step": 1210, "loss": 2.0215, "grad_norm": "1.111e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.002e+00", "anc_loss": "2.056e+00", "dlm_acc": "4.249e-01", "anc_acc": "4.207e-01", "epoch": 0.00242} {"step": 1215, "loss": 1.9067, "grad_norm": "1.515e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.686e+00", "anc_loss": "1.723e+00", "dlm_acc": "4.418e-01", "anc_acc": "4.379e-01", "epoch": 0.00243} {"step": 1220, "loss": 2.0239, "grad_norm": "1.187e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.695e+00", "anc_loss": "1.748e+00", "dlm_acc": "4.647e-01", "anc_acc": "4.612e-01", "epoch": 0.00244} {"step": 1225, "loss": 1.5452, "grad_norm": "1.038e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.556e+00", "dlm_acc": "4.868e-01", "anc_acc": "4.810e-01", "epoch": 0.00245} {"step": 1230, "loss": 1.8112, "grad_norm": "1.010e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.952e+00", "anc_loss": "2.004e+00", "dlm_acc": "4.047e-01", "anc_acc": "4.020e-01", "epoch": 0.00246} {"step": 1235, "loss": 1.5348, "grad_norm": "7.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.784e+00", "anc_loss": "1.831e+00", "dlm_acc": "4.166e-01", "anc_acc": "4.132e-01", "epoch": 0.00247} {"step": 1240, "loss": 1.4456, "grad_norm": "6.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.177e+00", "dlm_acc": "5.846e-01", "anc_acc": "5.808e-01", "epoch": 0.00248} {"step": 1245, "loss": 1.8153, "grad_norm": "5.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.418e+00", "anc_loss": "1.467e+00", "dlm_acc": "5.432e-01", "anc_acc": "5.401e-01", "epoch": 0.00249} {"step": 1250, "loss": 1.3981, "grad_norm": "1.307e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.472e+00", "anc_loss": "1.516e+00", "dlm_acc": "4.513e-01", "anc_acc": "4.468e-01", "epoch": 0.0025} {"step": 1255, "loss": 1.6157, "grad_norm": "9.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.516e+00", "dlm_acc": "4.973e-01", "anc_acc": "4.928e-01", "epoch": 0.00251} {"step": 1260, "loss": 1.6554, "grad_norm": "5.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.798e+00", "anc_loss": "1.847e+00", "dlm_acc": "4.258e-01", "anc_acc": "4.202e-01", "epoch": 0.00252} {"step": 1265, "loss": 1.7604, "grad_norm": "6.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.546e+00", "dlm_acc": "5.237e-01", "anc_acc": "5.195e-01", "epoch": 0.00253} {"step": 1270, "loss": 1.6807, "grad_norm": "1.323e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.415e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.224e-01", "anc_acc": "5.195e-01", "epoch": 0.00254} {"step": 1275, "loss": 1.8033, "grad_norm": "4.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.951e+00", "anc_loss": "2.006e+00", "dlm_acc": "3.954e-01", "anc_acc": "3.911e-01", "epoch": 0.00255} {"step": 1280, "loss": 1.4712, "grad_norm": "6.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.565e+00", "anc_loss": "1.617e+00", "dlm_acc": "5.034e-01", "anc_acc": "4.998e-01", "epoch": 0.00256} {"step": 1285, "loss": 1.3663, "grad_norm": "7.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.341e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.350e-01", "anc_acc": "5.293e-01", "epoch": 0.00257} {"step": 1290, "loss": 1.3932, "grad_norm": "4.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.538e-01", "anc_acc": "5.532e-01", "epoch": 0.00258} {"step": 1295, "loss": 1.5504, "grad_norm": "7.690e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.648e-01", "anc_acc": "5.602e-01", "epoch": 0.00259} {"step": 1300, "loss": 1.892, "grad_norm": "7.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.895e+00", "anc_loss": "1.960e+00", "dlm_acc": "4.394e-01", "anc_acc": "4.342e-01", "epoch": 0.0026} {"step": 1305, "loss": 1.5711, "grad_norm": "4.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.624e-01", "anc_acc": "5.580e-01", "epoch": 0.00261} {"step": 1310, "loss": 1.0888, "grad_norm": "4.185e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.267e+00", "dlm_acc": "5.419e-01", "anc_acc": "5.367e-01", "epoch": 0.00262} {"step": 1315, "loss": 1.6924, "grad_norm": "5.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.803e+00", "anc_loss": "1.863e+00", "dlm_acc": "4.553e-01", "anc_acc": "4.508e-01", "epoch": 0.00263} {"step": 1320, "loss": 1.7936, "grad_norm": "6.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.822e+00", "anc_loss": "1.867e+00", "dlm_acc": "4.233e-01", "anc_acc": "4.210e-01", "epoch": 0.00264} {"step": 1325, "loss": 1.5985, "grad_norm": "6.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.625e+00", "anc_loss": "1.667e+00", "dlm_acc": "4.813e-01", "anc_acc": "4.757e-01", "epoch": 0.00265} {"step": 1330, "loss": 1.0518, "grad_norm": "1.618e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.010e-01", "anc_acc": "4.976e-01", "epoch": 0.00266} {"step": 1335, "loss": 1.176, "grad_norm": "8.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.409e+00", "dlm_acc": "4.963e-01", "anc_acc": "4.926e-01", "epoch": 0.00267} {"step": 1340, "loss": 1.2548, "grad_norm": "5.234e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.536e+00", "anc_loss": "1.581e+00", "dlm_acc": "3.803e-01", "anc_acc": "3.748e-01", "epoch": 0.00268} {"step": 1345, "loss": 0.9756, "grad_norm": "1.735e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.369e+00", "anc_loss": "1.388e+00", "dlm_acc": "4.614e-01", "anc_acc": "4.555e-01", "epoch": 0.00269} {"step": 1350, "loss": 1.6054, "grad_norm": "5.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.248e+00", "anc_loss": "2.297e+00", "dlm_acc": "2.819e-01", "anc_acc": "2.786e-01", "epoch": 0.0027} {"step": 1355, "loss": 1.6765, "grad_norm": "8.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.514e+00", "anc_loss": "1.549e+00", "dlm_acc": "4.463e-01", "anc_acc": "4.445e-01", "epoch": 0.00271} {"step": 1360, "loss": 1.6818, "grad_norm": "1.013e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.410e+00", "dlm_acc": "5.110e-01", "anc_acc": "5.030e-01", "epoch": 0.00272} {"step": 1365, "loss": 1.565, "grad_norm": "8.157e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.167e+00", "anc_loss": "1.211e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.478e-01", "epoch": 0.00273} {"step": 1370, "loss": 1.7722, "grad_norm": "8.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.449e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.043e-01", "anc_acc": "5.006e-01", "epoch": 0.00274} {"step": 1375, "loss": 1.5258, "grad_norm": "1.029e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.466e+00", "dlm_acc": "4.753e-01", "anc_acc": "4.696e-01", "epoch": 0.00275} {"step": 1380, "loss": 1.5091, "grad_norm": "6.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.407e+00", "anc_loss": "1.449e+00", "dlm_acc": "4.959e-01", "anc_acc": "4.911e-01", "epoch": 0.00276} {"step": 1385, "loss": 2.1426, "grad_norm": "4.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.700e+00", "anc_loss": "2.737e+00", "dlm_acc": "1.601e-01", "anc_acc": "1.586e-01", "epoch": 0.00277} {"step": 1390, "loss": 1.8173, "grad_norm": "8.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.322e+00", "anc_loss": "2.343e+00", "dlm_acc": "2.179e-01", "anc_acc": "2.182e-01", "epoch": 0.00278} {"step": 1395, "loss": 1.6193, "grad_norm": "1.121e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.525e+00", "anc_loss": "1.565e+00", "dlm_acc": "4.595e-01", "anc_acc": "4.565e-01", "epoch": 0.00279} {"step": 1400, "loss": 1.7299, "grad_norm": "8.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.608e+00", "anc_loss": "1.656e+00", "dlm_acc": "4.679e-01", "anc_acc": "4.653e-01", "epoch": 0.0028} {"step": 1405, "loss": 1.6731, "grad_norm": "1.085e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.610e+00", "anc_loss": "1.645e+00", "dlm_acc": "4.447e-01", "anc_acc": "4.421e-01", "epoch": 0.00281} {"step": 1410, "loss": 1.457, "grad_norm": "7.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.979e-01", "anc_loss": "9.254e-01", "dlm_acc": "6.134e-01", "anc_acc": "6.112e-01", "epoch": 0.00282} {"step": 1415, "loss": 1.5389, "grad_norm": "6.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.712e-01", "anc_acc": "5.674e-01", "epoch": 0.00283} {"step": 1420, "loss": 1.221, "grad_norm": "4.884e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.146e+00", "dlm_acc": "4.341e-01", "anc_acc": "4.303e-01", "epoch": 0.00284} {"step": 1425, "loss": 1.4838, "grad_norm": "3.770e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.239e-01", "anc_acc": "5.187e-01", "epoch": 0.00285} {"step": 1430, "loss": 1.5578, "grad_norm": "7.304e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.742e+00", "anc_loss": "1.789e+00", "dlm_acc": "4.051e-01", "anc_acc": "4.004e-01", "epoch": 0.00286} {"step": 1435, "loss": 1.3974, "grad_norm": "8.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.113e+00", "dlm_acc": "5.836e-01", "anc_acc": "5.796e-01", "epoch": 0.00287} {"step": 1440, "loss": 1.5963, "grad_norm": "6.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e+00", "anc_loss": "1.670e+00", "dlm_acc": "4.636e-01", "anc_acc": "4.586e-01", "epoch": 0.00288} {"step": 1445, "loss": 1.3848, "grad_norm": "5.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.111e+00", "anc_loss": "1.145e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.579e-01", "epoch": 0.00289} {"step": 1450, "loss": 1.8328, "grad_norm": "7.956e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.973e+00", "anc_loss": "1.996e+00", "dlm_acc": "3.005e-01", "anc_acc": "2.980e-01", "epoch": 0.0029} {"step": 1455, "loss": 1.2948, "grad_norm": "7.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.548e-01", "anc_acc": "5.534e-01", "epoch": 0.00291} {"step": 1460, "loss": 1.2112, "grad_norm": "9.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.301e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.435e-01", "anc_acc": "5.393e-01", "epoch": 0.00292} {"step": 1465, "loss": 1.0711, "grad_norm": "6.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.376e+00", "dlm_acc": "4.882e-01", "anc_acc": "4.838e-01", "epoch": 0.00293} {"step": 1470, "loss": 1.4153, "grad_norm": "6.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.006e+00", "anc_loss": "2.011e+00", "dlm_acc": "3.404e-01", "anc_acc": "3.386e-01", "epoch": 0.00294} {"step": 1475, "loss": 1.9289, "grad_norm": "8.832e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.628e+00", "anc_loss": "2.669e+00", "dlm_acc": "1.637e-01", "anc_acc": "1.624e-01", "epoch": 0.00295} {"step": 1480, "loss": 1.3197, "grad_norm": "1.034e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.236e-01", "anc_acc": "5.184e-01", "epoch": 0.00296} {"step": 1485, "loss": 1.2893, "grad_norm": "7.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.663e+00", "dlm_acc": "4.623e-01", "anc_acc": "4.604e-01", "epoch": 0.00297} {"step": 1490, "loss": 1.3647, "grad_norm": "9.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.432e+00", "dlm_acc": "4.927e-01", "anc_acc": "4.903e-01", "epoch": 0.00298} {"step": 1495, "loss": 1.6886, "grad_norm": "5.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.417e+00", "anc_loss": "1.457e+00", "dlm_acc": "5.660e-01", "anc_acc": "5.622e-01", "epoch": 0.00299} {"step": 1500, "loss": 1.5333, "grad_norm": "1.002e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.876e-01", "anc_loss": "9.055e-01", "dlm_acc": "7.639e-01", "anc_acc": "7.628e-01", "epoch": 0.003} {"step": 1505, "loss": 1.4802, "grad_norm": "5.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.096e-01", "anc_acc": "5.039e-01", "epoch": 0.00301} {"step": 1510, "loss": 1.575, "grad_norm": "8.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.613e+00", "anc_loss": "1.663e+00", "dlm_acc": "4.491e-01", "anc_acc": "4.449e-01", "epoch": 0.00302} {"step": 1515, "loss": 1.0484, "grad_norm": "6.071e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.510e-01", "anc_loss": "6.682e-01", "dlm_acc": "7.069e-01", "anc_acc": "7.043e-01", "epoch": 0.00303} {"step": 1520, "loss": 1.7267, "grad_norm": "6.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.109e-01", "anc_loss": "6.223e-01", "dlm_acc": "7.023e-01", "anc_acc": "7.005e-01", "epoch": 0.00304} {"step": 1525, "loss": 0.97, "grad_norm": "6.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.743e-01", "anc_loss": "6.953e-01", "dlm_acc": "6.678e-01", "anc_acc": "6.641e-01", "epoch": 0.00305} {"step": 1530, "loss": 1.3204, "grad_norm": "1.008e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.432e+00", "dlm_acc": "4.333e-01", "anc_acc": "4.280e-01", "epoch": 0.00306} {"step": 1535, "loss": 1.7565, "grad_norm": "7.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.811e+00", "anc_loss": "1.864e+00", "dlm_acc": "4.221e-01", "anc_acc": "4.177e-01", "epoch": 0.00307} {"step": 1540, "loss": 1.9175, "grad_norm": "8.569e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.995e+00", "anc_loss": "2.045e+00", "dlm_acc": "3.946e-01", "anc_acc": "3.909e-01", "epoch": 0.00308} {"step": 1545, "loss": 1.6271, "grad_norm": "1.732e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.506e+00", "anc_loss": "1.548e+00", "dlm_acc": "5.086e-01", "anc_acc": "5.028e-01", "epoch": 0.00309} {"step": 1550, "loss": 1.4536, "grad_norm": "4.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.506e+00", "anc_loss": "1.550e+00", "dlm_acc": "4.970e-01", "anc_acc": "4.929e-01", "epoch": 0.0031} {"step": 1555, "loss": 1.2033, "grad_norm": "4.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.370e+00", "dlm_acc": "4.943e-01", "anc_acc": "4.882e-01", "epoch": 0.00311} {"step": 1560, "loss": 1.3173, "grad_norm": "3.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.402e+00", "dlm_acc": "4.915e-01", "anc_acc": "4.864e-01", "epoch": 0.00312} {"step": 1565, "loss": 1.4036, "grad_norm": "4.761e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.121e-01", "anc_acc": "5.082e-01", "epoch": 0.00313} {"step": 1570, "loss": 1.4002, "grad_norm": "5.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.255e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.664e-01", "anc_acc": "5.616e-01", "epoch": 0.00314} {"step": 1575, "loss": 1.4128, "grad_norm": "8.680e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.078e-01", "anc_loss": "9.219e-01", "dlm_acc": "5.388e-01", "anc_acc": "5.359e-01", "epoch": 0.00315} {"step": 1580, "loss": 1.7619, "grad_norm": "2.287e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.458e+00", "dlm_acc": "3.468e-01", "anc_acc": "3.556e-01", "epoch": 0.00316} {"step": 1585, "loss": 1.8061, "grad_norm": "6.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.730e+00", "anc_loss": "1.778e+00", "dlm_acc": "4.539e-01", "anc_acc": "4.477e-01", "epoch": 0.00317} {"step": 1590, "loss": 1.4621, "grad_norm": "9.874e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.554e+00", "anc_loss": "1.581e+00", "dlm_acc": "4.361e-01", "anc_acc": "4.322e-01", "epoch": 0.00318} {"step": 1595, "loss": 1.4645, "grad_norm": "6.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.716e+00", "anc_loss": "1.758e+00", "dlm_acc": "3.636e-01", "anc_acc": "3.596e-01", "epoch": 0.00319} {"step": 1600, "loss": 1.5362, "grad_norm": "7.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.639e+00", "anc_loss": "1.681e+00", "dlm_acc": "4.600e-01", "anc_acc": "4.548e-01", "epoch": 0.0032} {"step": 1605, "loss": 1.1909, "grad_norm": "5.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.551e-01", "anc_acc": "5.503e-01", "epoch": 0.00321} {"step": 1610, "loss": 1.1507, "grad_norm": "6.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.511e+00", "anc_loss": "1.561e+00", "dlm_acc": "4.868e-01", "anc_acc": "4.815e-01", "epoch": 0.00322} {"step": 1615, "loss": 1.2289, "grad_norm": "6.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.258e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.661e-01", "epoch": 0.00323} {"step": 1620, "loss": 1.0595, "grad_norm": "6.141e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.462e+00", "dlm_acc": "3.761e-01", "anc_acc": "3.716e-01", "epoch": 0.00324} {"step": 1625, "loss": 1.5631, "grad_norm": "1.232e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.178e-01", "anc_acc": "5.129e-01", "epoch": 0.00325} {"step": 1630, "loss": 1.6414, "grad_norm": "4.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.204e+00", "dlm_acc": "5.153e-01", "anc_acc": "5.108e-01", "epoch": 0.00326} {"step": 1635, "loss": 1.3324, "grad_norm": "9.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.266e-01", "anc_loss": "7.496e-01", "dlm_acc": "6.752e-01", "anc_acc": "6.720e-01", "epoch": 0.00327} {"step": 1640, "loss": 1.3078, "grad_norm": "5.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.912e-01", "anc_loss": "1.022e+00", "dlm_acc": "6.023e-01", "anc_acc": "5.983e-01", "epoch": 0.00328} {"step": 1645, "loss": 0.8829, "grad_norm": "3.458e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.790e-01", "anc_loss": "1.903e-01", "dlm_acc": "9.067e-01", "anc_acc": "9.018e-01", "epoch": 0.00329} {"step": 1650, "loss": 1.3591, "grad_norm": "8.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.051e+00", "dlm_acc": "6.910e-01", "anc_acc": "6.876e-01", "epoch": 0.0033} {"step": 1655, "loss": 1.2545, "grad_norm": "7.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.486e+00", "anc_loss": "1.540e+00", "dlm_acc": "4.719e-01", "anc_acc": "4.664e-01", "epoch": 0.00331} {"step": 1660, "loss": 1.596, "grad_norm": "8.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.824e+00", "anc_loss": "1.902e+00", "dlm_acc": "4.550e-01", "anc_acc": "4.459e-01", "epoch": 0.00332} {"step": 1665, "loss": 1.5302, "grad_norm": "7.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.328e-01", "anc_acc": "5.304e-01", "epoch": 0.00333} {"step": 1670, "loss": 1.4224, "grad_norm": "6.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.603e+00", "dlm_acc": "4.606e-01", "anc_acc": "4.571e-01", "epoch": 0.00334} {"step": 1675, "loss": 1.3953, "grad_norm": "5.818e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.237e+00", "dlm_acc": "5.406e-01", "anc_acc": "5.362e-01", "epoch": 0.00335} {"step": 1680, "loss": 1.3227, "grad_norm": "4.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.558e+00", "dlm_acc": "4.399e-01", "anc_acc": "4.364e-01", "epoch": 0.00336} {"step": 1685, "loss": 1.2202, "grad_norm": "7.636e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.820e+00", "anc_loss": "1.869e+00", "dlm_acc": "3.454e-01", "anc_acc": "3.433e-01", "epoch": 0.00337} {"step": 1690, "loss": 1.1751, "grad_norm": "2.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.309e+00", "dlm_acc": "4.937e-01", "anc_acc": "4.902e-01", "epoch": 0.00338} {"step": 1695, "loss": 1.1729, "grad_norm": "7.159e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.482e+00", "dlm_acc": "5.120e-01", "anc_acc": "5.088e-01", "epoch": 0.00339} {"step": 1700, "loss": 1.216, "grad_norm": "7.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.494e+00", "dlm_acc": "4.545e-01", "anc_acc": "4.494e-01", "epoch": 0.0034} {"step": 1705, "loss": 1.737, "grad_norm": "7.405e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.641e+00", "anc_loss": "1.676e+00", "dlm_acc": "3.410e-01", "anc_acc": "3.375e-01", "epoch": 0.00341} {"step": 1710, "loss": 1.6548, "grad_norm": "7.830e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.986e+00", "anc_loss": "2.020e+00", "dlm_acc": "2.415e-01", "anc_acc": "2.416e-01", "epoch": 0.00342} {"step": 1715, "loss": 1.4515, "grad_norm": "6.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.717e+00", "anc_loss": "1.750e+00", "dlm_acc": "3.592e-01", "anc_acc": "3.548e-01", "epoch": 0.00343} {"step": 1720, "loss": 1.7058, "grad_norm": "1.042e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.956e+00", "anc_loss": "2.094e+00", "dlm_acc": "3.644e-01", "anc_acc": "3.501e-01", "epoch": 0.00344} {"step": 1725, "loss": 1.3709, "grad_norm": "3.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.405e-01", "anc_acc": "5.325e-01", "epoch": 0.00345} {"step": 1730, "loss": 1.5254, "grad_norm": "5.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.852e+00", "anc_loss": "1.898e+00", "dlm_acc": "4.188e-01", "anc_acc": "4.142e-01", "epoch": 0.00346} {"step": 1735, "loss": 1.6998, "grad_norm": "5.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.641e+00", "anc_loss": "1.678e+00", "dlm_acc": "4.466e-01", "anc_acc": "4.443e-01", "epoch": 0.00347} {"step": 1740, "loss": 1.4397, "grad_norm": "2.757e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.756e+00", "dlm_acc": "4.530e-01", "anc_acc": "4.474e-01", "epoch": 0.00348} {"step": 1745, "loss": 1.5445, "grad_norm": "5.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.961e+00", "anc_loss": "2.013e+00", "dlm_acc": "3.984e-01", "anc_acc": "3.933e-01", "epoch": 0.00349} {"step": 1750, "loss": 1.3255, "grad_norm": "1.303e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.066e+00", "anc_loss": "2.117e+00", "dlm_acc": "3.401e-01", "anc_acc": "3.368e-01", "epoch": 0.0035} {"step": 1755, "loss": 0.9703, "grad_norm": "5.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.050e+00", "dlm_acc": "5.774e-01", "anc_acc": "5.714e-01", "epoch": 0.00351} {"step": 1760, "loss": 1.2502, "grad_norm": "7.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.367e-01", "anc_loss": "7.648e-01", "dlm_acc": "5.877e-01", "anc_acc": "5.779e-01", "epoch": 0.00352} {"step": 1765, "loss": 1.2149, "grad_norm": "4.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.375e-01", "anc_loss": "9.500e-01", "dlm_acc": "4.258e-01", "anc_acc": "4.227e-01", "epoch": 0.00353} {"step": 1770, "loss": 1.2496, "grad_norm": "3.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.758e-01", "anc_loss": "6.797e-01", "dlm_acc": "4.822e-01", "anc_acc": "4.814e-01", "epoch": 0.00354} {"step": 1775, "loss": 0.742, "grad_norm": "2.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.148e-01", "anc_loss": "6.203e-01", "dlm_acc": "5.049e-01", "anc_acc": "5.014e-01", "epoch": 0.00355} {"step": 1780, "loss": 0.8421, "grad_norm": "5.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.727e-01", "anc_loss": "6.789e-01", "dlm_acc": "5.030e-01", "anc_acc": "5.015e-01", "epoch": 0.00356} {"step": 1785, "loss": 1.4155, "grad_norm": "6.279e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.732e+00", "anc_loss": "1.764e+00", "dlm_acc": "3.567e-01", "anc_acc": "3.543e-01", "epoch": 0.00357} {"step": 1790, "loss": 1.1549, "grad_norm": "8.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.660e-01", "anc_loss": "7.715e-01", "dlm_acc": "5.508e-01", "anc_acc": "5.469e-01", "epoch": 0.00358} {"step": 1795, "loss": 1.2371, "grad_norm": "5.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.246e-01", "anc_loss": "8.402e-01", "dlm_acc": "6.906e-01", "anc_acc": "6.897e-01", "epoch": 0.00359} {"step": 1800, "loss": 1.1568, "grad_norm": "4.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.938e-01", "anc_loss": "1.009e+00", "dlm_acc": "4.942e-01", "anc_acc": "4.943e-01", "epoch": 0.0036} {"step": 1805, "loss": 1.3193, "grad_norm": "7.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.235e+00", "dlm_acc": "4.076e-01", "anc_acc": "4.021e-01", "epoch": 0.00361} {"step": 1810, "loss": 1.139, "grad_norm": "4.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.484e-01", "anc_loss": "8.578e-01", "dlm_acc": "5.429e-01", "anc_acc": "5.404e-01", "epoch": 0.00362} {"step": 1815, "loss": 1.5751, "grad_norm": "8.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.217e+00", "anc_loss": "1.252e+00", "dlm_acc": "6.092e-01", "anc_acc": "6.060e-01", "epoch": 0.00363} {"step": 1820, "loss": 1.1675, "grad_norm": "8.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.414e-01", "anc_loss": "8.680e-01", "dlm_acc": "6.064e-01", "anc_acc": "6.049e-01", "epoch": 0.00364} {"step": 1825, "loss": 1.1385, "grad_norm": "1.017e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.151e+00", "dlm_acc": "4.692e-01", "anc_acc": "4.660e-01", "epoch": 0.00365} {"step": 1830, "loss": 1.3133, "grad_norm": "5.650e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.828e-01", "anc_loss": "9.992e-01", "dlm_acc": "5.051e-01", "anc_acc": "5.036e-01", "epoch": 0.00366} {"step": 1835, "loss": 1.2395, "grad_norm": "7.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.454e+00", "anc_loss": "1.500e+00", "dlm_acc": "5.433e-01", "anc_acc": "5.409e-01", "epoch": 0.00367} {"step": 1840, "loss": 1.4749, "grad_norm": "4.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.609e+00", "anc_loss": "1.656e+00", "dlm_acc": "4.867e-01", "anc_acc": "4.846e-01", "epoch": 0.00368} {"step": 1845, "loss": 1.6566, "grad_norm": "8.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.256e+00", "anc_loss": "1.280e+00", "dlm_acc": "4.999e-01", "anc_acc": "4.978e-01", "epoch": 0.00369} {"step": 1850, "loss": 1.3655, "grad_norm": "7.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.918e-01", "anc_loss": "7.064e-01", "dlm_acc": "6.330e-01", "anc_acc": "6.313e-01", "epoch": 0.0037} {"step": 1855, "loss": 1.3445, "grad_norm": "7.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.633e-01", "anc_loss": "6.844e-01", "dlm_acc": "7.278e-01", "anc_acc": "7.273e-01", "epoch": 0.00371} {"step": 1860, "loss": 1.2511, "grad_norm": "9.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.149e+00", "dlm_acc": "5.937e-01", "anc_acc": "5.898e-01", "epoch": 0.00372} {"step": 1865, "loss": 1.5587, "grad_norm": "6.280e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.591e+00", "dlm_acc": "4.472e-01", "anc_acc": "4.433e-01", "epoch": 0.00373} {"step": 1870, "loss": 1.2312, "grad_norm": "6.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.121e+00", "dlm_acc": "5.672e-01", "anc_acc": "5.596e-01", "epoch": 0.00374} {"step": 1875, "loss": 1.2993, "grad_norm": "8.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.190e+00", "dlm_acc": "5.112e-01", "anc_acc": "5.082e-01", "epoch": 0.00375} {"step": 1880, "loss": 1.4672, "grad_norm": "5.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.098e+00", "dlm_acc": "6.003e-01", "anc_acc": "5.974e-01", "epoch": 0.00376} {"step": 1885, "loss": 1.6784, "grad_norm": "4.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.367e+00", "dlm_acc": "4.706e-01", "anc_acc": "4.689e-01", "epoch": 0.00377} {"step": 1890, "loss": 1.4806, "grad_norm": "6.186e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.738e-01", "anc_loss": "8.836e-01", "dlm_acc": "5.015e-01", "anc_acc": "4.985e-01", "epoch": 0.00378} {"step": 1895, "loss": 1.8639, "grad_norm": "8.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.522e+00", "dlm_acc": "4.853e-01", "anc_acc": "4.815e-01", "epoch": 0.00379} {"step": 1900, "loss": 2.0394, "grad_norm": "6.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.502e+00", "dlm_acc": "4.512e-01", "anc_acc": "4.479e-01", "epoch": 0.0038} {"step": 1905, "loss": 0.8402, "grad_norm": "4.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e-01", "anc_loss": "1.129e-01", "dlm_acc": "9.077e-01", "anc_acc": "9.076e-01", "epoch": 0.00381} {"step": 1910, "loss": 1.2048, "grad_norm": "3.580e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.187e-01", "anc_loss": "8.383e-01", "dlm_acc": "6.440e-01", "anc_acc": "6.418e-01", "epoch": 0.00382} {"step": 1915, "loss": 1.4396, "grad_norm": "4.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.312e+00", "dlm_acc": "4.913e-01", "anc_acc": "4.898e-01", "epoch": 0.00383} {"step": 1920, "loss": 1.5608, "grad_norm": "7.794e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.133e-01", "anc_loss": "7.164e-01", "dlm_acc": "5.335e-01", "anc_acc": "5.316e-01", "epoch": 0.00384} {"step": 1925, "loss": 1.0645, "grad_norm": "9.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.816e-01", "anc_loss": "5.836e-01", "dlm_acc": "5.813e-01", "anc_acc": "5.804e-01", "epoch": 0.00385} {"step": 1930, "loss": 1.2067, "grad_norm": "3.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.262e-01", "anc_loss": "6.281e-01", "dlm_acc": "5.618e-01", "anc_acc": "5.597e-01", "epoch": 0.00386} {"step": 1935, "loss": 1.5037, "grad_norm": "9.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.594e-01", "anc_loss": "7.609e-01", "dlm_acc": "5.404e-01", "anc_acc": "5.394e-01", "epoch": 0.00387} {"step": 1940, "loss": 1.4012, "grad_norm": "5.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.047e-01", "anc_loss": "8.168e-01", "dlm_acc": "5.594e-01", "anc_acc": "5.568e-01", "epoch": 0.00388} {"step": 1945, "loss": 0.977, "grad_norm": "5.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.336e-01", "anc_loss": "6.496e-01", "dlm_acc": "6.697e-01", "anc_acc": "6.675e-01", "epoch": 0.00389} {"step": 1950, "loss": 1.3827, "grad_norm": "1.427e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.045e-01", "anc_acc": "4.997e-01", "epoch": 0.0039} {"step": 1955, "loss": 1.5996, "grad_norm": "9.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.285e-01", "anc_loss": "8.348e-01", "dlm_acc": "4.435e-01", "anc_acc": "4.425e-01", "epoch": 0.00391} {"step": 1960, "loss": 1.2139, "grad_norm": "4.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.836e-01", "anc_loss": "7.875e-01", "dlm_acc": "3.836e-01", "anc_acc": "3.824e-01", "epoch": 0.00392} {"step": 1965, "loss": 0.8999, "grad_norm": "4.629e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.885e-01", "anc_loss": "7.949e-01", "dlm_acc": "4.816e-01", "anc_acc": "4.756e-01", "epoch": 0.00393} {"step": 1970, "loss": 0.8949, "grad_norm": "4.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.094e-01", "anc_loss": "9.125e-01", "dlm_acc": "3.587e-01", "anc_acc": "3.545e-01", "epoch": 0.00394} {"step": 1975, "loss": 0.8371, "grad_norm": "2.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.086e-01", "anc_loss": "9.172e-01", "dlm_acc": "3.645e-01", "anc_acc": "3.549e-01", "epoch": 0.00395} {"step": 1980, "loss": 1.2063, "grad_norm": "7.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.742e-01", "anc_loss": "8.836e-01", "dlm_acc": "3.933e-01", "anc_acc": "3.781e-01", "epoch": 0.00396} {"step": 1985, "loss": 1.3518, "grad_norm": "4.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.310e+00", "dlm_acc": "5.321e-01", "anc_acc": "5.254e-01", "epoch": 0.00397} {"step": 1990, "loss": 1.4431, "grad_norm": "7.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.214e-01", "anc_acc": "5.138e-01", "epoch": 0.00398} {"step": 1995, "loss": 1.3006, "grad_norm": "4.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.349e+00", "dlm_acc": "5.760e-01", "anc_acc": "5.716e-01", "epoch": 0.00399} {"step": 2000, "loss": 1.1034, "grad_norm": "4.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.586e-01", "anc_loss": "5.703e-01", "dlm_acc": "7.251e-01", "anc_acc": "7.227e-01", "epoch": 0.004} {"step": 2005, "loss": 1.1747, "grad_norm": "6.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.441e-01", "anc_loss": "4.504e-01", "dlm_acc": "7.337e-01", "anc_acc": "7.336e-01", "epoch": 0.00401} {"step": 2010, "loss": 1.1592, "grad_norm": "7.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.676e-01", "anc_loss": "3.711e-01", "dlm_acc": "7.856e-01", "anc_acc": "7.857e-01", "epoch": 0.00402} {"step": 2015, "loss": 1.2082, "grad_norm": "4.430e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.504e-01", "anc_loss": "9.734e-01", "dlm_acc": "6.458e-01", "anc_acc": "6.439e-01", "epoch": 0.00403} {"step": 2020, "loss": 0.9967, "grad_norm": "3.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.961e-01", "anc_loss": "1.036e+00", "dlm_acc": "6.549e-01", "anc_acc": "6.498e-01", "epoch": 0.00404} {"step": 2025, "loss": 1.1576, "grad_norm": "3.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.335e+00", "anc_loss": "1.388e+00", "dlm_acc": "5.061e-01", "anc_acc": "5.006e-01", "epoch": 0.00405} {"step": 2030, "loss": 0.8464, "grad_norm": "3.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.326e+00", "anc_loss": "1.374e+00", "dlm_acc": "5.199e-01", "anc_acc": "5.128e-01", "epoch": 0.00406} {"step": 2035, "loss": 1.1718, "grad_norm": "5.236e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.134e+00", "dlm_acc": "4.428e-01", "anc_acc": "4.399e-01", "epoch": 0.00407} {"step": 2040, "loss": 1.0534, "grad_norm": "8.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.025e+00", "dlm_acc": "6.474e-01", "anc_acc": "6.455e-01", "epoch": 0.00408} {"step": 2045, "loss": 0.9572, "grad_norm": "3.792e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.206e+00", "dlm_acc": "5.330e-01", "anc_acc": "5.297e-01", "epoch": 0.00409} {"step": 2050, "loss": 0.9263, "grad_norm": "5.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.033e-01", "anc_loss": "9.281e-01", "dlm_acc": "6.513e-01", "anc_acc": "6.476e-01", "epoch": 0.0041} {"step": 2055, "loss": 1.3087, "grad_norm": "9.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.707e-01", "anc_loss": "4.711e-01", "dlm_acc": "7.241e-01", "anc_acc": "7.248e-01", "epoch": 0.00411} {"step": 2060, "loss": 1.1253, "grad_norm": "5.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.849e-01", "anc_loss": "1.005e+00", "dlm_acc": "6.157e-01", "anc_acc": "6.158e-01", "epoch": 0.00412} {"step": 2065, "loss": 1.1864, "grad_norm": "5.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.887e-01", "anc_loss": "4.949e-01", "dlm_acc": "7.104e-01", "anc_acc": "7.104e-01", "epoch": 0.00413} {"step": 2070, "loss": 0.8872, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.025e-01", "anc_loss": "3.063e-01", "dlm_acc": "7.984e-01", "anc_acc": "7.949e-01", "epoch": 0.00414} {"step": 2075, "loss": 0.7802, "grad_norm": "2.385e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.581e-01", "anc_loss": "2.635e-01", "dlm_acc": "8.256e-01", "anc_acc": "8.230e-01", "epoch": 0.00415} {"step": 2080, "loss": 0.9887, "grad_norm": "4.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.148e-01", "anc_loss": "4.188e-01", "dlm_acc": "7.493e-01", "anc_acc": "7.479e-01", "epoch": 0.00416} {"step": 2085, "loss": 1.0261, "grad_norm": "4.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.219e-01", "anc_loss": "3.264e-01", "dlm_acc": "7.954e-01", "anc_acc": "7.943e-01", "epoch": 0.00417} {"step": 2090, "loss": 1.1264, "grad_norm": "5.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.402e-01", "anc_loss": "3.447e-01", "dlm_acc": "7.954e-01", "anc_acc": "7.931e-01", "epoch": 0.00418} {"step": 2095, "loss": 1.2826, "grad_norm": "6.388e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.416e-01", "anc_loss": "6.554e-01", "dlm_acc": "7.322e-01", "anc_acc": "7.300e-01", "epoch": 0.00419} {"step": 2100, "loss": 1.2741, "grad_norm": "4.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.410e-01", "anc_loss": "7.551e-01", "dlm_acc": "6.198e-01", "anc_acc": "6.243e-01", "epoch": 0.0042} {"step": 2105, "loss": 1.0998, "grad_norm": "9.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.965e-01", "anc_loss": "7.234e-01", "dlm_acc": "6.933e-01", "anc_acc": "6.897e-01", "epoch": 0.00421} {"step": 2110, "loss": 1.39, "grad_norm": "6.666e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.024e+00", "anc_loss": "1.056e+00", "dlm_acc": "6.268e-01", "anc_acc": "6.239e-01", "epoch": 0.00422} {"step": 2115, "loss": 1.438, "grad_norm": "5.349e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.019e+00", "anc_loss": "1.052e+00", "dlm_acc": "6.661e-01", "anc_acc": "6.629e-01", "epoch": 0.00423} {"step": 2120, "loss": 1.2782, "grad_norm": "5.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.666e-01", "anc_loss": "9.959e-01", "dlm_acc": "6.746e-01", "anc_acc": "6.709e-01", "epoch": 0.00424} {"step": 2125, "loss": 1.0515, "grad_norm": "5.434e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.145e-01", "anc_loss": "8.421e-01", "dlm_acc": "7.348e-01", "anc_acc": "7.302e-01", "epoch": 0.00425} {"step": 2130, "loss": 1.0201, "grad_norm": "3.469e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.889e-01", "anc_loss": "6.146e-01", "dlm_acc": "7.363e-01", "anc_acc": "7.331e-01", "epoch": 0.00426} {"step": 2135, "loss": 0.909, "grad_norm": "2.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.445e-01", "anc_loss": "7.685e-01", "dlm_acc": "6.929e-01", "anc_acc": "6.881e-01", "epoch": 0.00427} {"step": 2140, "loss": 0.9943, "grad_norm": "4.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.312e-01", "anc_loss": "7.635e-01", "dlm_acc": "6.987e-01", "anc_acc": "6.930e-01", "epoch": 0.00428} {"step": 2145, "loss": 1.3454, "grad_norm": "6.845e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.043e+00", "dlm_acc": "5.978e-01", "anc_acc": "5.939e-01", "epoch": 0.00429} {"step": 2150, "loss": 1.2043, "grad_norm": "7.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.953e-01", "anc_loss": "5.145e-01", "dlm_acc": "7.446e-01", "anc_acc": "7.407e-01", "epoch": 0.0043} {"step": 2155, "loss": 1.061, "grad_norm": "8.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.133e-01", "anc_loss": "8.416e-01", "dlm_acc": "6.586e-01", "anc_acc": "6.549e-01", "epoch": 0.00431} {"step": 2160, "loss": 1.4699, "grad_norm": "7.136e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.041e+00", "dlm_acc": "4.612e-01", "anc_acc": "4.595e-01", "epoch": 0.00432} {"step": 2165, "loss": 1.2853, "grad_norm": "4.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.937e-01", "anc_loss": "8.152e-01", "dlm_acc": "6.696e-01", "anc_acc": "6.607e-01", "epoch": 0.00433} {"step": 2170, "loss": 1.0367, "grad_norm": "4.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.820e-01", "anc_loss": "3.910e-01", "dlm_acc": "7.187e-01", "anc_acc": "7.174e-01", "epoch": 0.00434} {"step": 2175, "loss": 1.1468, "grad_norm": "1.027e+00", "learning_rate": "1.000e-04", "dlm_loss": "3.441e-01", "anc_loss": "3.523e-01", "dlm_acc": "7.491e-01", "anc_acc": "7.453e-01", "epoch": 0.00435} {"step": 2180, "loss": 1.2422, "grad_norm": "3.926e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.109e-01", "anc_loss": "5.246e-01", "dlm_acc": "7.183e-01", "anc_acc": "7.148e-01", "epoch": 0.00436} {"step": 2185, "loss": 0.9723, "grad_norm": "4.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.648e-01", "anc_loss": "3.727e-01", "dlm_acc": "7.403e-01", "anc_acc": "7.382e-01", "epoch": 0.00437} {"step": 2190, "loss": 0.6879, "grad_norm": "4.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.465e-01", "anc_loss": "4.637e-01", "dlm_acc": "7.220e-01", "anc_acc": "7.191e-01", "epoch": 0.00438} {"step": 2195, "loss": 0.8851, "grad_norm": "8.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.305e-01", "anc_loss": "4.367e-01", "dlm_acc": "7.260e-01", "anc_acc": "7.252e-01", "epoch": 0.00439} {"step": 2200, "loss": 1.0682, "grad_norm": "7.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.125e-01", "anc_loss": "7.291e-01", "dlm_acc": "6.612e-01", "anc_acc": "6.607e-01", "epoch": 0.0044} {"step": 2205, "loss": 1.3822, "grad_norm": "7.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.047e+00", "dlm_acc": "5.966e-01", "anc_acc": "5.909e-01", "epoch": 0.00441} {"step": 2210, "loss": 1.6879, "grad_norm": "4.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.624e-01", "epoch": 0.00442} {"step": 2215, "loss": 1.4299, "grad_norm": "3.089e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.305e-01", "anc_loss": "7.484e-01", "dlm_acc": "6.189e-01", "anc_acc": "6.157e-01", "epoch": 0.00443} {"step": 2220, "loss": 1.6129, "grad_norm": "8.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.396e+00", "dlm_acc": "5.530e-01", "anc_acc": "5.470e-01", "epoch": 0.00444} {"step": 2225, "loss": 1.1918, "grad_norm": "8.963e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.806e-01", "anc_loss": "8.026e-01", "dlm_acc": "7.279e-01", "anc_acc": "7.253e-01", "epoch": 0.00445} {"step": 2230, "loss": 1.8713, "grad_norm": "7.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.672e+00", "anc_loss": "1.728e+00", "dlm_acc": "5.100e-01", "anc_acc": "5.046e-01", "epoch": 0.00446} {"step": 2235, "loss": 1.3992, "grad_norm": "4.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.284e+00", "dlm_acc": "5.877e-01", "anc_acc": "5.819e-01", "epoch": 0.00447} {"step": 2240, "loss": 1.1133, "grad_norm": "8.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.094e+00", "dlm_acc": "5.073e-01", "anc_acc": "5.061e-01", "epoch": 0.00448} {"step": 2245, "loss": 1.2127, "grad_norm": "6.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e+00", "anc_loss": "1.509e+00", "dlm_acc": "3.962e-01", "anc_acc": "3.928e-01", "epoch": 0.00449} {"step": 2250, "loss": 1.2734, "grad_norm": "4.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.547e+00", "dlm_acc": "4.897e-01", "anc_acc": "4.840e-01", "epoch": 0.0045} {"step": 2255, "loss": 1.3792, "grad_norm": "1.056e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.317e+00", "dlm_acc": "5.479e-01", "anc_acc": "5.425e-01", "epoch": 0.00451} {"step": 2260, "loss": 1.7612, "grad_norm": "5.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.741e+00", "anc_loss": "1.797e+00", "dlm_acc": "4.734e-01", "anc_acc": "4.671e-01", "epoch": 0.00452} {"step": 2265, "loss": 1.3675, "grad_norm": "7.909e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.404e+00", "dlm_acc": "4.737e-01", "anc_acc": "4.636e-01", "epoch": 0.00453} {"step": 2270, "loss": 1.2001, "grad_norm": "5.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.410e-01", "anc_loss": "9.805e-01", "dlm_acc": "6.402e-01", "anc_acc": "6.357e-01", "epoch": 0.00454} {"step": 2275, "loss": 1.4796, "grad_norm": "4.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.613e-01", "anc_loss": "9.945e-01", "dlm_acc": "6.346e-01", "anc_acc": "6.298e-01", "epoch": 0.00455} {"step": 2280, "loss": 1.5434, "grad_norm": "7.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.082e-01", "anc_loss": "9.484e-01", "dlm_acc": "6.571e-01", "anc_acc": "6.554e-01", "epoch": 0.00456} {"step": 2285, "loss": 1.5529, "grad_norm": "1.074e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.619e+00", "dlm_acc": "4.520e-01", "anc_acc": "4.459e-01", "epoch": 0.00457} {"step": 2290, "loss": 1.7246, "grad_norm": "8.532e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.809e+00", "anc_loss": "1.866e+00", "dlm_acc": "4.420e-01", "anc_acc": "4.368e-01", "epoch": 0.00458} {"step": 2295, "loss": 1.8074, "grad_norm": "7.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.393e+00", "anc_loss": "1.440e+00", "dlm_acc": "5.248e-01", "anc_acc": "5.200e-01", "epoch": 0.00459} {"step": 2300, "loss": 1.7562, "grad_norm": "8.980e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.654e+00", "anc_loss": "1.710e+00", "dlm_acc": "4.654e-01", "anc_acc": "4.605e-01", "epoch": 0.0046} {"step": 2305, "loss": 1.9496, "grad_norm": "1.031e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.840e+00", "anc_loss": "1.895e+00", "dlm_acc": "4.473e-01", "anc_acc": "4.401e-01", "epoch": 0.00461} {"step": 2310, "loss": 1.7262, "grad_norm": "3.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.602e+00", "anc_loss": "1.655e+00", "dlm_acc": "4.579e-01", "anc_acc": "4.516e-01", "epoch": 0.00462} {"step": 2315, "loss": 1.4577, "grad_norm": "7.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.478e+00", "anc_loss": "1.534e+00", "dlm_acc": "4.828e-01", "anc_acc": "4.757e-01", "epoch": 0.00463} {"step": 2320, "loss": 1.2689, "grad_norm": "7.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.442e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.035e-01", "anc_acc": "4.976e-01", "epoch": 0.00464} {"step": 2325, "loss": 1.3053, "grad_norm": "4.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.268e+00", "anc_loss": "1.295e+00", "dlm_acc": "4.894e-01", "anc_acc": "4.874e-01", "epoch": 0.00465} {"step": 2330, "loss": 1.8473, "grad_norm": "6.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.541e+00", "dlm_acc": "4.978e-01", "anc_acc": "4.925e-01", "epoch": 0.00466} {"step": 2335, "loss": 1.3202, "grad_norm": "4.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.307e-01", "anc_acc": "5.262e-01", "epoch": 0.00467} {"step": 2340, "loss": 1.7105, "grad_norm": "4.347e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.498e+00", "dlm_acc": "4.500e-01", "anc_acc": "4.450e-01", "epoch": 0.00468} {"step": 2345, "loss": 1.2768, "grad_norm": "3.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.776e+00", "anc_loss": "1.814e+00", "dlm_acc": "3.724e-01", "anc_acc": "3.680e-01", "epoch": 0.00469} {"step": 2350, "loss": 1.2393, "grad_norm": "2.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.124e+00", "anc_loss": "1.149e+00", "dlm_acc": "5.537e-01", "anc_acc": "5.508e-01", "epoch": 0.0047} {"step": 2355, "loss": 1.1597, "grad_norm": "5.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.389e+00", "dlm_acc": "5.392e-01", "anc_acc": "5.328e-01", "epoch": 0.00471} {"step": 2360, "loss": 1.4927, "grad_norm": "8.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.648e+00", "anc_loss": "1.703e+00", "dlm_acc": "4.751e-01", "anc_acc": "4.665e-01", "epoch": 0.00472} {"step": 2365, "loss": 1.1249, "grad_norm": "6.968e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.540e-01", "anc_loss": "6.681e-01", "dlm_acc": "7.655e-01", "anc_acc": "7.689e-01", "epoch": 0.00473} {"step": 2370, "loss": 1.4446, "grad_norm": "7.563e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.308e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.557e-01", "anc_acc": "5.483e-01", "epoch": 0.00474} {"step": 2375, "loss": 0.8468, "grad_norm": "4.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.996e-01", "anc_loss": "9.453e-01", "dlm_acc": "6.258e-01", "anc_acc": "6.179e-01", "epoch": 0.00475} {"step": 2380, "loss": 1.3193, "grad_norm": "2.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.399e+00", "anc_loss": "1.424e+00", "dlm_acc": "4.656e-01", "anc_acc": "4.618e-01", "epoch": 0.00476} {"step": 2385, "loss": 1.5802, "grad_norm": "4.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.362e+00", "anc_loss": "1.410e+00", "dlm_acc": "5.012e-01", "anc_acc": "4.966e-01", "epoch": 0.00477} {"step": 2390, "loss": 2.026, "grad_norm": "4.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.653e+00", "anc_loss": "1.691e+00", "dlm_acc": "4.014e-01", "anc_acc": "4.018e-01", "epoch": 0.00478} {"step": 2395, "loss": 1.2645, "grad_norm": "3.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.100e+00", "dlm_acc": "5.551e-01", "anc_acc": "5.472e-01", "epoch": 0.00479} {"step": 2400, "loss": 1.5028, "grad_norm": "7.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.102e+00", "dlm_acc": "5.366e-01", "anc_acc": "5.312e-01", "epoch": 0.0048} {"step": 2405, "loss": 1.1693, "grad_norm": "4.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.199e+00", "dlm_acc": "5.527e-01", "anc_acc": "5.469e-01", "epoch": 0.00481} {"step": 2410, "loss": 1.1609, "grad_norm": "5.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.609e+00", "anc_loss": "1.659e+00", "dlm_acc": "4.616e-01", "anc_acc": "4.578e-01", "epoch": 0.00482} {"step": 2415, "loss": 1.7001, "grad_norm": "5.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.780e+00", "anc_loss": "1.836e+00", "dlm_acc": "4.415e-01", "anc_acc": "4.364e-01", "epoch": 0.00483} {"step": 2420, "loss": 1.7313, "grad_norm": "6.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.794e+00", "anc_loss": "1.848e+00", "dlm_acc": "4.530e-01", "anc_acc": "4.457e-01", "epoch": 0.00484} {"step": 2425, "loss": 1.48, "grad_norm": "6.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.650e+00", "anc_loss": "1.714e+00", "dlm_acc": "5.148e-01", "anc_acc": "5.087e-01", "epoch": 0.00485} {"step": 2430, "loss": 1.2302, "grad_norm": "3.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.457e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.209e-01", "anc_acc": "5.162e-01", "epoch": 0.00486} {"step": 2435, "loss": 1.5213, "grad_norm": "3.206e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.531e+00", "anc_loss": "1.592e+00", "dlm_acc": "4.878e-01", "anc_acc": "4.829e-01", "epoch": 0.00487} {"step": 2440, "loss": 1.3412, "grad_norm": "5.576e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.325e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.256e-01", "anc_acc": "5.182e-01", "epoch": 0.00488} {"step": 2445, "loss": 1.9774, "grad_norm": "7.154e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.494e+00", "anc_loss": "1.547e+00", "dlm_acc": "4.919e-01", "anc_acc": "4.860e-01", "epoch": 0.00489} {"step": 2450, "loss": 1.8552, "grad_norm": "7.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.293e-01", "anc_acc": "5.213e-01", "epoch": 0.0049} {"step": 2455, "loss": 1.7047, "grad_norm": "7.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.736e+00", "anc_loss": "1.789e+00", "dlm_acc": "4.983e-01", "anc_acc": "4.908e-01", "epoch": 0.00491} {"step": 2460, "loss": 1.3104, "grad_norm": "7.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.783e+00", "anc_loss": "1.842e+00", "dlm_acc": "4.361e-01", "anc_acc": "4.297e-01", "epoch": 0.00492} {"step": 2465, "loss": 1.0874, "grad_norm": "4.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.219e+00", "dlm_acc": "5.788e-01", "anc_acc": "5.719e-01", "epoch": 0.00493} {"step": 2470, "loss": 1.5968, "grad_norm": "4.925e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.731e+00", "anc_loss": "1.798e+00", "dlm_acc": "4.866e-01", "anc_acc": "4.790e-01", "epoch": 0.00494} {"step": 2475, "loss": 1.0614, "grad_norm": "4.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.496e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.076e-01", "anc_acc": "5.013e-01", "epoch": 0.00495} {"step": 2480, "loss": 1.0577, "grad_norm": "5.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.465e+00", "anc_loss": "1.524e+00", "dlm_acc": "5.160e-01", "anc_acc": "5.090e-01", "epoch": 0.00496} {"step": 2485, "loss": 1.3489, "grad_norm": "3.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.808e+00", "anc_loss": "1.864e+00", "dlm_acc": "4.112e-01", "anc_acc": "4.046e-01", "epoch": 0.00497} {"step": 2490, "loss": 1.2001, "grad_norm": "5.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.605e+00", "dlm_acc": "5.003e-01", "anc_acc": "4.943e-01", "epoch": 0.00498} {"step": 2495, "loss": 1.3748, "grad_norm": "4.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.558e+00", "dlm_acc": "5.074e-01", "anc_acc": "5.010e-01", "epoch": 0.00499} {"step": 2500, "loss": 1.2049, "grad_norm": "4.945e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.741e+00", "anc_loss": "1.786e+00", "dlm_acc": "4.261e-01", "anc_acc": "4.197e-01", "epoch": 0.005} {"step": 2505, "loss": 0.809, "grad_norm": "6.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.201e+00", "anc_loss": "1.249e+00", "dlm_acc": "5.532e-01", "anc_acc": "5.466e-01", "epoch": 0.00501} {"step": 2510, "loss": 1.2532, "grad_norm": "4.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.656e+00", "anc_loss": "1.712e+00", "dlm_acc": "4.867e-01", "anc_acc": "4.787e-01", "epoch": 0.00502} {"step": 2515, "loss": 1.377, "grad_norm": "5.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.534e+00", "anc_loss": "1.579e+00", "dlm_acc": "5.080e-01", "anc_acc": "5.024e-01", "epoch": 0.00503} {"step": 2520, "loss": 1.307, "grad_norm": "6.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.761e+00", "dlm_acc": "4.955e-01", "anc_acc": "4.862e-01", "epoch": 0.00504} {"step": 2525, "loss": 1.6857, "grad_norm": "3.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.845e+00", "anc_loss": "1.895e+00", "dlm_acc": "4.358e-01", "anc_acc": "4.293e-01", "epoch": 0.00505} {"step": 2530, "loss": 1.7918, "grad_norm": "3.508e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.790e+00", "anc_loss": "1.841e+00", "dlm_acc": "4.719e-01", "anc_acc": "4.652e-01", "epoch": 0.00506} {"step": 2535, "loss": 1.1562, "grad_norm": "3.744e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.231e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.486e-01", "anc_acc": "5.389e-01", "epoch": 0.00507} {"step": 2540, "loss": 1.3795, "grad_norm": "3.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.451e+00", "anc_loss": "1.499e+00", "dlm_acc": "4.937e-01", "anc_acc": "4.863e-01", "epoch": 0.00508} {"step": 2545, "loss": 1.7663, "grad_norm": "4.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.809e+00", "anc_loss": "1.864e+00", "dlm_acc": "4.565e-01", "anc_acc": "4.504e-01", "epoch": 0.00509} {"step": 2550, "loss": 1.7412, "grad_norm": "4.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.618e+00", "anc_loss": "1.674e+00", "dlm_acc": "4.782e-01", "anc_acc": "4.713e-01", "epoch": 0.0051} {"step": 2555, "loss": 1.6591, "grad_norm": "4.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.529e+00", "dlm_acc": "4.560e-01", "anc_acc": "4.442e-01", "epoch": 0.00511} {"step": 2560, "loss": 2.0731, "grad_norm": "7.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.977e+00", "anc_loss": "2.019e+00", "dlm_acc": "4.017e-01", "anc_acc": "3.952e-01", "epoch": 0.00512} {"step": 2565, "loss": 1.7708, "grad_norm": "4.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.761e+00", "anc_loss": "1.808e+00", "dlm_acc": "4.074e-01", "anc_acc": "4.007e-01", "epoch": 0.00513} {"step": 2570, "loss": 1.9736, "grad_norm": "7.473e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.472e+00", "anc_loss": "1.555e+00", "dlm_acc": "5.189e-01", "anc_acc": "5.120e-01", "epoch": 0.00514} {"step": 2575, "loss": 1.5888, "grad_norm": "4.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.261e+00", "dlm_acc": "5.948e-01", "anc_acc": "5.884e-01", "epoch": 0.00515} {"step": 2580, "loss": 1.5587, "grad_norm": "3.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.438e+00", "dlm_acc": "4.738e-01", "anc_acc": "4.693e-01", "epoch": 0.00516} {"step": 2585, "loss": 1.3978, "grad_norm": "7.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.233e-01", "anc_acc": "5.168e-01", "epoch": 0.00517} {"step": 2590, "loss": 1.2723, "grad_norm": "2.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.141e-01", "anc_loss": "7.316e-01", "dlm_acc": "6.149e-01", "anc_acc": "6.147e-01", "epoch": 0.00518} {"step": 2595, "loss": 1.3281, "grad_norm": "4.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.124e+00", "dlm_acc": "5.866e-01", "anc_acc": "5.831e-01", "epoch": 0.00519} {"step": 2600, "loss": 1.2892, "grad_norm": "4.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.107e-01", "anc_acc": "5.059e-01", "epoch": 0.0052} {"step": 2605, "loss": 1.4522, "grad_norm": "5.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.207e+00", "anc_loss": "1.249e+00", "dlm_acc": "5.877e-01", "anc_acc": "5.810e-01", "epoch": 0.00521} {"step": 2610, "loss": 1.3761, "grad_norm": "4.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.494e+00", "dlm_acc": "4.725e-01", "anc_acc": "4.667e-01", "epoch": 0.00522} {"step": 2615, "loss": 1.7315, "grad_norm": "6.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.872e+00", "anc_loss": "1.923e+00", "dlm_acc": "4.175e-01", "anc_acc": "4.131e-01", "epoch": 0.00523} {"step": 2620, "loss": 1.5137, "grad_norm": "5.211e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.631e+00", "dlm_acc": "4.688e-01", "anc_acc": "4.607e-01", "epoch": 0.00524} {"step": 2625, "loss": 1.6791, "grad_norm": "6.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.934e+00", "anc_loss": "2.002e+00", "dlm_acc": "4.068e-01", "anc_acc": "4.006e-01", "epoch": 0.00525} {"step": 2630, "loss": 1.5686, "grad_norm": "3.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.607e+00", "anc_loss": "1.661e+00", "dlm_acc": "4.735e-01", "anc_acc": "4.657e-01", "epoch": 0.00526} {"step": 2635, "loss": 1.7602, "grad_norm": "8.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.959e+00", "anc_loss": "2.005e+00", "dlm_acc": "4.160e-01", "anc_acc": "4.091e-01", "epoch": 0.00527} {"step": 2640, "loss": 1.1924, "grad_norm": "4.672e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.312e+00", "dlm_acc": "4.778e-01", "anc_acc": "4.716e-01", "epoch": 0.00528} {"step": 2645, "loss": 1.4566, "grad_norm": "4.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.795e+00", "anc_loss": "1.873e+00", "dlm_acc": "4.115e-01", "anc_acc": "4.015e-01", "epoch": 0.00529} {"step": 2650, "loss": 1.4628, "grad_norm": "6.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.615e+00", "anc_loss": "1.668e+00", "dlm_acc": "4.819e-01", "anc_acc": "4.748e-01", "epoch": 0.0053} {"step": 2655, "loss": 1.7185, "grad_norm": "5.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.798e+00", "anc_loss": "1.850e+00", "dlm_acc": "4.411e-01", "anc_acc": "4.350e-01", "epoch": 0.00531} {"step": 2660, "loss": 1.5653, "grad_norm": "4.958e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.289e+00", "dlm_acc": "5.047e-01", "anc_acc": "4.979e-01", "epoch": 0.00532} {"step": 2665, "loss": 1.8422, "grad_norm": "1.375e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.418e+00", "dlm_acc": "5.358e-01", "anc_acc": "5.295e-01", "epoch": 0.00533} {"step": 2670, "loss": 2.0752, "grad_norm": "8.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.906e-01", "anc_loss": "9.227e-01", "dlm_acc": "6.293e-01", "anc_acc": "6.300e-01", "epoch": 0.00534} {"step": 2675, "loss": 2.301, "grad_norm": "5.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.457e+00", "anc_loss": "1.493e+00", "dlm_acc": "5.005e-01", "anc_acc": "4.981e-01", "epoch": 0.00535} {"step": 2680, "loss": 1.7028, "grad_norm": "5.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.659e+00", "dlm_acc": "4.653e-01", "anc_acc": "4.613e-01", "epoch": 0.00536} {"step": 2685, "loss": 1.2295, "grad_norm": "5.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.594e+00", "anc_loss": "1.641e+00", "dlm_acc": "4.804e-01", "anc_acc": "4.737e-01", "epoch": 0.00537} {"step": 2690, "loss": 1.4848, "grad_norm": "4.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.777e+00", "anc_loss": "1.831e+00", "dlm_acc": "4.607e-01", "anc_acc": "4.561e-01", "epoch": 0.00538} {"step": 2695, "loss": 1.0178, "grad_norm": "4.050e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.215e-01", "anc_acc": "5.155e-01", "epoch": 0.00539} {"step": 2700, "loss": 1.8883, "grad_norm": "6.211e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.941e+00", "anc_loss": "1.989e+00", "dlm_acc": "3.871e-01", "anc_acc": "3.821e-01", "epoch": 0.0054} {"step": 2705, "loss": 1.1601, "grad_norm": "8.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.526e+00", "dlm_acc": "4.838e-01", "anc_acc": "4.763e-01", "epoch": 0.00541} {"step": 2710, "loss": 1.3153, "grad_norm": "2.165e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.508e+00", "dlm_acc": "4.735e-01", "anc_acc": "4.696e-01", "epoch": 0.00542} {"step": 2715, "loss": 1.2813, "grad_norm": "5.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.042e+00", "anc_loss": "2.077e+00", "dlm_acc": "3.291e-01", "anc_acc": "3.254e-01", "epoch": 0.00543} {"step": 2720, "loss": 1.3316, "grad_norm": "7.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.063e+00", "dlm_acc": "5.598e-01", "anc_acc": "5.535e-01", "epoch": 0.00544} {"step": 2725, "loss": 1.4275, "grad_norm": "4.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.581e-01", "anc_acc": "5.501e-01", "epoch": 0.00545} {"step": 2730, "loss": 1.3718, "grad_norm": "4.450e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.512e+00", "dlm_acc": "4.034e-01", "anc_acc": "3.982e-01", "epoch": 0.00546} {"step": 2735, "loss": 1.274, "grad_norm": "5.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.388e+00", "dlm_acc": "5.197e-01", "anc_acc": "5.156e-01", "epoch": 0.00547} {"step": 2740, "loss": 1.2197, "grad_norm": "4.431e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.734e-01", "anc_loss": "1.028e+00", "dlm_acc": "5.922e-01", "anc_acc": "5.808e-01", "epoch": 0.00548} {"step": 2745, "loss": 1.5276, "grad_norm": "5.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.306e+00", "dlm_acc": "4.901e-01", "anc_acc": "4.876e-01", "epoch": 0.00549} {"step": 2750, "loss": 1.5121, "grad_norm": "7.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.484e+00", "dlm_acc": "4.815e-01", "anc_acc": "4.727e-01", "epoch": 0.0055} {"step": 2755, "loss": 2.0638, "grad_norm": "8.892e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.255e+00", "anc_loss": "2.284e+00", "dlm_acc": "2.882e-01", "anc_acc": "2.863e-01", "epoch": 0.00551} {"step": 2760, "loss": 1.2257, "grad_norm": "7.765e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.069e+00", "anc_loss": "1.109e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.597e-01", "epoch": 0.00552} {"step": 2765, "loss": 1.6308, "grad_norm": "4.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.377e+00", "dlm_acc": "4.474e-01", "anc_acc": "4.453e-01", "epoch": 0.00553} {"step": 2770, "loss": 1.2613, "grad_norm": "4.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.505e+00", "dlm_acc": "5.227e-01", "anc_acc": "5.172e-01", "epoch": 0.00554} {"step": 2775, "loss": 0.9209, "grad_norm": "6.182e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.562e-01", "anc_loss": "8.738e-01", "dlm_acc": "5.035e-01", "anc_acc": "5.005e-01", "epoch": 0.00555} {"step": 2780, "loss": 1.2335, "grad_norm": "3.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.559e+00", "dlm_acc": "4.755e-01", "anc_acc": "4.677e-01", "epoch": 0.00556} {"step": 2785, "loss": 1.6877, "grad_norm": "5.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.602e+00", "dlm_acc": "4.806e-01", "anc_acc": "4.741e-01", "epoch": 0.00557} {"step": 2790, "loss": 1.7639, "grad_norm": "1.249e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.670e+00", "anc_loss": "1.700e+00", "dlm_acc": "4.332e-01", "anc_acc": "4.313e-01", "epoch": 0.00558} {"step": 2795, "loss": 1.9373, "grad_norm": "7.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.414e+00", "anc_loss": "2.436e+00", "dlm_acc": "1.671e-01", "anc_acc": "1.652e-01", "epoch": 0.00559} {"step": 2800, "loss": 2.1752, "grad_norm": "4.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.131e+00", "anc_loss": "3.138e+00", "dlm_acc": "2.030e-02", "anc_acc": "1.938e-02", "epoch": 0.0056} {"step": 2805, "loss": 1.8913, "grad_norm": "9.748e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.919e+00", "anc_loss": "2.931e+00", "dlm_acc": "2.016e-02", "anc_acc": "2.090e-02", "epoch": 0.00561} {"step": 2810, "loss": 1.5207, "grad_norm": "1.058e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.139e+00", "anc_loss": "2.170e+00", "dlm_acc": "2.940e-01", "anc_acc": "2.903e-01", "epoch": 0.00562} {"step": 2815, "loss": 1.3259, "grad_norm": "4.636e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.664e-01", "anc_loss": "9.082e-01", "dlm_acc": "6.382e-01", "anc_acc": "6.320e-01", "epoch": 0.00563} {"step": 2820, "loss": 1.3629, "grad_norm": "7.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.555e+00", "dlm_acc": "4.812e-01", "anc_acc": "4.722e-01", "epoch": 0.00564} {"step": 2825, "loss": 1.0972, "grad_norm": "5.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.168e-01", "anc_loss": "8.531e-01", "dlm_acc": "6.659e-01", "anc_acc": "6.595e-01", "epoch": 0.00565} {"step": 2830, "loss": 1.6798, "grad_norm": "8.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.754e-01", "anc_acc": "5.660e-01", "epoch": 0.00566} {"step": 2835, "loss": 0.9128, "grad_norm": "4.725e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.086e-01", "anc_loss": "6.258e-01", "dlm_acc": "6.519e-01", "anc_acc": "6.470e-01", "epoch": 0.00567} {"step": 2840, "loss": 0.9925, "grad_norm": "3.842e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.898e-01", "anc_loss": "6.922e-01", "dlm_acc": "4.099e-01", "anc_acc": "4.081e-01", "epoch": 0.00568} {"step": 2845, "loss": 1.3188, "grad_norm": "4.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.364e+00", "anc_loss": "1.384e+00", "dlm_acc": "4.690e-01", "anc_acc": "4.652e-01", "epoch": 0.00569} {"step": 2850, "loss": 1.657, "grad_norm": "3.984e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.656e+00", "dlm_acc": "4.405e-01", "anc_acc": "4.383e-01", "epoch": 0.0057} {"step": 2855, "loss": 1.5931, "grad_norm": "6.601e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.592e+00", "anc_loss": "1.644e+00", "dlm_acc": "4.388e-01", "anc_acc": "4.339e-01", "epoch": 0.00571} {"step": 2860, "loss": 1.3256, "grad_norm": "4.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.444e-01", "anc_acc": "5.386e-01", "epoch": 0.00572} {"step": 2865, "loss": 1.2166, "grad_norm": "4.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.296e+00", "dlm_acc": "4.798e-01", "anc_acc": "4.727e-01", "epoch": 0.00573} {"step": 2870, "loss": 1.0994, "grad_norm": "5.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.034e+00", "dlm_acc": "6.363e-01", "anc_acc": "6.309e-01", "epoch": 0.00574} {"step": 2875, "loss": 1.5361, "grad_norm": "6.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.394e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.247e-01", "anc_acc": "5.170e-01", "epoch": 0.00575} {"step": 2880, "loss": 1.4009, "grad_norm": "7.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.458e+00", "dlm_acc": "5.309e-01", "anc_acc": "5.258e-01", "epoch": 0.00576} {"step": 2885, "loss": 1.5992, "grad_norm": "4.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.551e+00", "anc_loss": "1.607e+00", "dlm_acc": "4.728e-01", "anc_acc": "4.656e-01", "epoch": 0.00577} {"step": 2890, "loss": 1.2673, "grad_norm": "5.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.179e+00", "dlm_acc": "5.389e-01", "anc_acc": "5.336e-01", "epoch": 0.00578} {"step": 2895, "loss": 1.164, "grad_norm": "5.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.727e-01", "anc_loss": "9.094e-01", "dlm_acc": "6.194e-01", "anc_acc": "6.113e-01", "epoch": 0.00579} {"step": 2900, "loss": 1.288, "grad_norm": "4.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.746e-01", "anc_loss": "7.941e-01", "dlm_acc": "6.508e-01", "anc_acc": "6.466e-01", "epoch": 0.0058} {"step": 2905, "loss": 1.4249, "grad_norm": "4.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.382e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.015e-01", "anc_acc": "4.956e-01", "epoch": 0.00581} {"step": 2910, "loss": 1.0309, "grad_norm": "8.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.643e-01", "anc_loss": "8.982e-01", "dlm_acc": "6.662e-01", "anc_acc": "6.621e-01", "epoch": 0.00582} {"step": 2915, "loss": 1.3974, "grad_norm": "3.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.669e-01", "anc_acc": "5.601e-01", "epoch": 0.00583} {"step": 2920, "loss": 1.234, "grad_norm": "4.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.153e+00", "anc_loss": "1.204e+00", "dlm_acc": "5.479e-01", "anc_acc": "5.385e-01", "epoch": 0.00584} {"step": 2925, "loss": 1.383, "grad_norm": "4.773e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.381e+00", "anc_loss": "1.434e+00", "dlm_acc": "4.915e-01", "anc_acc": "4.841e-01", "epoch": 0.00585} {"step": 2930, "loss": 0.8374, "grad_norm": "4.109e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.992e-01", "anc_loss": "9.445e-01", "dlm_acc": "6.117e-01", "anc_acc": "6.042e-01", "epoch": 0.00586} {"step": 2935, "loss": 1.3114, "grad_norm": "2.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.412e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.204e-01", "anc_acc": "5.137e-01", "epoch": 0.00587} {"step": 2940, "loss": 1.2207, "grad_norm": "3.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.265e-01", "anc_acc": "5.181e-01", "epoch": 0.00588} {"step": 2945, "loss": 1.2935, "grad_norm": "3.197e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.128e-01", "anc_acc": "5.038e-01", "epoch": 0.00589} {"step": 2950, "loss": 1.4968, "grad_norm": "4.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.670e+00", "anc_loss": "1.730e+00", "dlm_acc": "4.731e-01", "anc_acc": "4.647e-01", "epoch": 0.0059} {"step": 2955, "loss": 1.621, "grad_norm": "4.694e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.535e+00", "dlm_acc": "5.311e-01", "anc_acc": "5.219e-01", "epoch": 0.00591} {"step": 2960, "loss": 1.5195, "grad_norm": "9.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.510e+00", "dlm_acc": "5.090e-01", "anc_acc": "5.019e-01", "epoch": 0.00592} {"step": 2965, "loss": 1.1909, "grad_norm": "6.373e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.926e-01", "anc_acc": "5.862e-01", "epoch": 0.00593} {"step": 2970, "loss": 1.2296, "grad_norm": "5.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.566e+00", "anc_loss": "1.634e+00", "dlm_acc": "5.182e-01", "anc_acc": "5.092e-01", "epoch": 0.00594} {"step": 2975, "loss": 1.2806, "grad_norm": "4.653e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.806e+00", "anc_loss": "1.863e+00", "dlm_acc": "3.958e-01", "anc_acc": "3.904e-01", "epoch": 0.00595} {"step": 2980, "loss": 1.4268, "grad_norm": "7.712e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.258e+00", "anc_loss": "2.284e+00", "dlm_acc": "1.467e-01", "anc_acc": "1.440e-01", "epoch": 0.00596} {"step": 2985, "loss": 1.4536, "grad_norm": "9.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.836e+00", "anc_loss": "1.887e+00", "dlm_acc": "3.885e-01", "anc_acc": "3.826e-01", "epoch": 0.00597} {"step": 2990, "loss": 1.457, "grad_norm": "6.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.905e+00", "anc_loss": "1.955e+00", "dlm_acc": "3.736e-01", "anc_acc": "3.663e-01", "epoch": 0.00598} {"step": 2995, "loss": 1.2391, "grad_norm": "4.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.197e+00", "dlm_acc": "4.877e-01", "anc_acc": "4.815e-01", "epoch": 0.00599} {"step": 3000, "loss": 1.3116, "grad_norm": "4.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.027e-01", "anc_loss": "7.377e-01", "dlm_acc": "7.721e-01", "anc_acc": "7.682e-01", "epoch": 0.006} {"step": 3005, "loss": 1.5906, "grad_norm": "8.114e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.071e+00", "anc_loss": "1.111e+00", "dlm_acc": "6.166e-01", "anc_acc": "6.115e-01", "epoch": 0.00601} {"step": 3010, "loss": 1.4357, "grad_norm": "3.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.228e+00", "dlm_acc": "5.355e-01", "anc_acc": "5.266e-01", "epoch": 0.00602} {"step": 3015, "loss": 1.7373, "grad_norm": "4.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.670e+00", "anc_loss": "1.712e+00", "dlm_acc": "4.230e-01", "anc_acc": "4.167e-01", "epoch": 0.00603} {"step": 3020, "loss": 1.6396, "grad_norm": "4.406e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.288e+00", "dlm_acc": "4.908e-01", "anc_acc": "4.863e-01", "epoch": 0.00604} {"step": 3025, "loss": 1.5344, "grad_norm": "7.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.039e+00", "anc_loss": "2.087e+00", "dlm_acc": "2.973e-01", "anc_acc": "2.937e-01", "epoch": 0.00605} {"step": 3030, "loss": 1.1256, "grad_norm": "5.856e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.273e-01", "anc_loss": "9.680e-01", "dlm_acc": "6.209e-01", "anc_acc": "6.125e-01", "epoch": 0.00606} {"step": 3035, "loss": 1.8686, "grad_norm": "8.845e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.723e+00", "anc_loss": "1.777e+00", "dlm_acc": "4.389e-01", "anc_acc": "4.330e-01", "epoch": 0.00607} {"step": 3040, "loss": 1.1965, "grad_norm": "5.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.180e+00", "dlm_acc": "5.846e-01", "anc_acc": "5.800e-01", "epoch": 0.00608} {"step": 3045, "loss": 1.1105, "grad_norm": "3.257e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.102e+00", "dlm_acc": "5.605e-01", "anc_acc": "5.516e-01", "epoch": 0.00609} {"step": 3050, "loss": 1.1675, "grad_norm": "6.137e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.456e+00", "dlm_acc": "4.738e-01", "anc_acc": "4.682e-01", "epoch": 0.0061} {"step": 3055, "loss": 1.1287, "grad_norm": "8.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.399e-01", "anc_acc": "5.322e-01", "epoch": 0.00611} {"step": 3060, "loss": 1.0839, "grad_norm": "4.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.153e+00", "anc_loss": "1.188e+00", "dlm_acc": "5.963e-01", "anc_acc": "5.919e-01", "epoch": 0.00612} {"step": 3065, "loss": 1.0475, "grad_norm": "6.820e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.095e+00", "dlm_acc": "5.924e-01", "anc_acc": "5.838e-01", "epoch": 0.00613} {"step": 3070, "loss": 0.8584, "grad_norm": "2.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.170e+00", "dlm_acc": "5.172e-01", "anc_acc": "5.096e-01", "epoch": 0.00614} {"step": 3075, "loss": 0.9438, "grad_norm": "4.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.501e+00", "anc_loss": "1.546e+00", "dlm_acc": "4.431e-01", "anc_acc": "4.372e-01", "epoch": 0.00615} {"step": 3080, "loss": 1.0692, "grad_norm": "2.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.531e-01", "anc_loss": "9.711e-01", "dlm_acc": "4.626e-01", "anc_acc": "4.570e-01", "epoch": 0.00616} {"step": 3085, "loss": 1.717, "grad_norm": "2.148e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.898e+00", "anc_loss": "1.915e+00", "dlm_acc": "2.654e-01", "anc_acc": "2.638e-01", "epoch": 0.00617} {"step": 3090, "loss": 1.1439, "grad_norm": "4.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.331e+00", "anc_loss": "1.400e+00", "dlm_acc": "4.025e-01", "anc_acc": "4.005e-01", "epoch": 0.00618} {"step": 3095, "loss": 1.3781, "grad_norm": "4.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.547e+00", "dlm_acc": "4.685e-01", "anc_acc": "4.625e-01", "epoch": 0.00619} {"step": 3100, "loss": 1.4924, "grad_norm": "1.036e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.701e+00", "anc_loss": "1.763e+00", "dlm_acc": "4.642e-01", "anc_acc": "4.589e-01", "epoch": 0.0062} {"step": 3105, "loss": 1.5916, "grad_norm": "1.985e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.613e-01", "anc_acc": "5.545e-01", "epoch": 0.00621} {"step": 3110, "loss": 1.2924, "grad_norm": "3.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.047e+00", "dlm_acc": "5.730e-01", "anc_acc": "5.648e-01", "epoch": 0.00622} {"step": 3115, "loss": 1.1944, "grad_norm": "8.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.332e+00", "dlm_acc": "4.892e-01", "anc_acc": "4.834e-01", "epoch": 0.00623} {"step": 3120, "loss": 1.1988, "grad_norm": "5.765e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.641e+00", "dlm_acc": "4.593e-01", "anc_acc": "4.519e-01", "epoch": 0.00624} {"step": 3125, "loss": 1.4082, "grad_norm": "7.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.514e-01", "anc_loss": "5.635e-01", "dlm_acc": "6.058e-01", "anc_acc": "6.026e-01", "epoch": 0.00625} {"step": 3130, "loss": 0.9609, "grad_norm": "2.773e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.555e-01", "anc_loss": "4.727e-01", "dlm_acc": "7.059e-01", "anc_acc": "7.036e-01", "epoch": 0.00626} {"step": 3135, "loss": 1.3261, "grad_norm": "4.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.033e+00", "anc_loss": "2.069e+00", "dlm_acc": "3.214e-01", "anc_acc": "3.150e-01", "epoch": 0.00627} {"step": 3140, "loss": 0.857, "grad_norm": "3.491e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.104e+00", "dlm_acc": "5.917e-01", "anc_acc": "5.851e-01", "epoch": 0.00628} {"step": 3145, "loss": 1.2441, "grad_norm": "8.366e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.263e+00", "anc_loss": "2.446e+00", "dlm_acc": "3.221e-01", "anc_acc": "3.183e-01", "epoch": 0.00629} {"step": 3150, "loss": 1.1219, "grad_norm": "8.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.484e+00", "dlm_acc": "4.179e-01", "anc_acc": "4.124e-01", "epoch": 0.0063} {"step": 3155, "loss": 1.4997, "grad_norm": "8.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.540e+00", "anc_loss": "1.588e+00", "dlm_acc": "4.223e-01", "anc_acc": "4.145e-01", "epoch": 0.00631} {"step": 3160, "loss": 1.2097, "grad_norm": "7.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.586e-01", "anc_loss": "8.945e-01", "dlm_acc": "5.927e-01", "anc_acc": "5.897e-01", "epoch": 0.00632} {"step": 3165, "loss": 1.1801, "grad_norm": "3.440e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.000e+00", "anc_loss": "1.032e+00", "dlm_acc": "5.419e-01", "anc_acc": "5.387e-01", "epoch": 0.00633} {"step": 3170, "loss": 1.232, "grad_norm": "9.320e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.148e+00", "dlm_acc": "5.846e-01", "anc_acc": "5.769e-01", "epoch": 0.00634} {"step": 3175, "loss": 1.4345, "grad_norm": "5.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.566e-01", "anc_acc": "5.490e-01", "epoch": 0.00635} {"step": 3180, "loss": 1.3976, "grad_norm": "9.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.241e+00", "dlm_acc": "5.796e-01", "anc_acc": "5.726e-01", "epoch": 0.00636} {"step": 3185, "loss": 1.0387, "grad_norm": "4.239e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.239e+00", "dlm_acc": "5.504e-01", "anc_acc": "5.416e-01", "epoch": 0.00637} {"step": 3190, "loss": 1.1557, "grad_norm": "3.875e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.041e+00", "dlm_acc": "5.888e-01", "anc_acc": "5.827e-01", "epoch": 0.00638} {"step": 3195, "loss": 1.4785, "grad_norm": "4.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.950e+00", "anc_loss": "1.998e+00", "dlm_acc": "2.534e-01", "anc_acc": "2.506e-01", "epoch": 0.00639} {"step": 3200, "loss": 1.689, "grad_norm": "5.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.597e+00", "anc_loss": "2.641e+00", "dlm_acc": "8.832e-02", "anc_acc": "8.540e-02", "epoch": 0.0064} {"step": 3205, "loss": 1.9062, "grad_norm": "2.502e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.582e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.049e-01", "anc_acc": "4.982e-01", "epoch": 0.00641} {"step": 3210, "loss": 1.2486, "grad_norm": "2.559e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.684e-01", "anc_acc": "5.619e-01", "epoch": 0.00642} {"step": 3215, "loss": 1.618, "grad_norm": "6.382e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.208e+00", "anc_loss": "1.241e+00", "dlm_acc": "4.350e-01", "anc_acc": "4.258e-01", "epoch": 0.00643} {"step": 3220, "loss": 1.8878, "grad_norm": "1.059e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.000e-01", "anc_loss": "9.023e-01", "dlm_acc": "4.145e-01", "anc_acc": "4.114e-01", "epoch": 0.00644} {"step": 3225, "loss": 1.4443, "grad_norm": "8.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.590e-01", "anc_loss": "6.629e-01", "dlm_acc": "5.391e-01", "anc_acc": "5.385e-01", "epoch": 0.00645} {"step": 3230, "loss": 1.7625, "grad_norm": "4.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.854e-01", "anc_loss": "4.967e-01", "dlm_acc": "6.947e-01", "anc_acc": "6.876e-01", "epoch": 0.00646} {"step": 3235, "loss": 1.3556, "grad_norm": "5.328e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.512e-01", "anc_loss": "3.645e-01", "dlm_acc": "7.376e-01", "anc_acc": "7.301e-01", "epoch": 0.00647} {"step": 3240, "loss": 1.4176, "grad_norm": "4.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.285e-01", "anc_loss": "7.410e-01", "dlm_acc": "6.206e-01", "anc_acc": "6.162e-01", "epoch": 0.00648} {"step": 3245, "loss": 1.7021, "grad_norm": "8.532e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.169e+00", "anc_loss": "2.183e+00", "dlm_acc": "2.356e-01", "anc_acc": "2.342e-01", "epoch": 0.00649} {"step": 3250, "loss": 1.4359, "grad_norm": "5.458e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.047e+00", "anc_loss": "2.065e+00", "dlm_acc": "3.851e-01", "anc_acc": "3.828e-01", "epoch": 0.0065} {"step": 3255, "loss": 1.3578, "grad_norm": "6.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.941e+00", "anc_loss": "1.953e+00", "dlm_acc": "3.896e-01", "anc_acc": "3.865e-01", "epoch": 0.00651} {"step": 3260, "loss": 1.4811, "grad_norm": "4.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.733e+00", "dlm_acc": "3.881e-01", "anc_acc": "3.836e-01", "epoch": 0.00652} {"step": 3265, "loss": 1.5324, "grad_norm": "4.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.703e-01", "anc_loss": "9.023e-01", "dlm_acc": "5.263e-01", "anc_acc": "5.177e-01", "epoch": 0.00653} {"step": 3270, "loss": 1.3251, "grad_norm": "4.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.243e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.459e-01", "anc_acc": "5.377e-01", "epoch": 0.00654} {"step": 3275, "loss": 1.5591, "grad_norm": "4.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.577e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.813e-01", "anc_acc": "4.740e-01", "epoch": 0.00655} {"step": 3280, "loss": 1.1934, "grad_norm": "2.545e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.403e+00", "dlm_acc": "4.358e-01", "anc_acc": "4.265e-01", "epoch": 0.00656} {"step": 3285, "loss": 1.6836, "grad_norm": "5.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.272e+00", "anc_loss": "2.325e+00", "dlm_acc": "2.347e-01", "anc_acc": "2.316e-01", "epoch": 0.00657} {"step": 3290, "loss": 1.0544, "grad_norm": "1.135e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.566e-01", "anc_loss": "8.848e-01", "dlm_acc": "6.410e-01", "anc_acc": "6.371e-01", "epoch": 0.00658} {"step": 3295, "loss": 1.738, "grad_norm": "9.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.533e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.090e-01", "anc_acc": "5.092e-01", "epoch": 0.00659} {"step": 3300, "loss": 1.5818, "grad_norm": "4.728e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.258e+00", "anc_loss": "2.280e+00", "dlm_acc": "2.422e-01", "anc_acc": "2.386e-01", "epoch": 0.0066} {"step": 3305, "loss": 1.5109, "grad_norm": "7.747e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.016e+00", "anc_loss": "2.055e+00", "dlm_acc": "2.903e-01", "anc_acc": "2.849e-01", "epoch": 0.00661} {"step": 3310, "loss": 1.352, "grad_norm": "4.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.260e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.706e-01", "anc_acc": "5.647e-01", "epoch": 0.00662} {"step": 3315, "loss": 1.5246, "grad_norm": "5.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.597e+00", "dlm_acc": "5.050e-01", "anc_acc": "4.988e-01", "epoch": 0.00663} {"step": 3320, "loss": 1.1445, "grad_norm": "4.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.278e+00", "dlm_acc": "4.945e-01", "anc_acc": "4.852e-01", "epoch": 0.00664} {"step": 3325, "loss": 1.0134, "grad_norm": "3.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.938e-01", "anc_loss": "1.024e+00", "dlm_acc": "5.254e-01", "anc_acc": "5.186e-01", "epoch": 0.00665} {"step": 3330, "loss": 1.3616, "grad_norm": "4.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.520e+00", "anc_loss": "1.583e+00", "dlm_acc": "4.625e-01", "anc_acc": "4.520e-01", "epoch": 0.00666} {"step": 3335, "loss": 1.6264, "grad_norm": "3.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.636e+00", "anc_loss": "1.688e+00", "dlm_acc": "4.757e-01", "anc_acc": "4.677e-01", "epoch": 0.00667} {"step": 3340, "loss": 2.1886, "grad_norm": "8.997e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.837e+00", "anc_loss": "2.861e+00", "dlm_acc": "1.335e-01", "anc_acc": "1.333e-01", "epoch": 0.00668} {"step": 3345, "loss": 1.7695, "grad_norm": "1.130e+01", "learning_rate": "1.000e-04", "dlm_loss": "2.406e+00", "anc_loss": "2.456e+00", "dlm_acc": "2.766e-01", "anc_acc": "2.728e-01", "epoch": 0.00669} {"step": 3350, "loss": 0.9515, "grad_norm": "4.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.045e-01", "anc_acc": "4.987e-01", "epoch": 0.0067} {"step": 3355, "loss": 1.0761, "grad_norm": "3.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.559e-01", "anc_loss": "9.891e-01", "dlm_acc": "5.213e-01", "anc_acc": "5.139e-01", "epoch": 0.00671} {"step": 3360, "loss": 1.3232, "grad_norm": "5.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.387e+00", "dlm_acc": "4.899e-01", "anc_acc": "4.839e-01", "epoch": 0.00672} {"step": 3365, "loss": 1.6534, "grad_norm": "5.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.459e+00", "anc_loss": "1.516e+00", "dlm_acc": "4.572e-01", "anc_acc": "4.474e-01", "epoch": 0.00673} {"step": 3370, "loss": 1.422, "grad_norm": "6.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.282e-01", "anc_acc": "5.166e-01", "epoch": 0.00674} {"step": 3375, "loss": 1.553, "grad_norm": "9.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.222e+00", "dlm_acc": "5.823e-01", "anc_acc": "5.768e-01", "epoch": 0.00675} {"step": 3380, "loss": 1.5247, "grad_norm": "6.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.357e+00", "dlm_acc": "4.989e-01", "anc_acc": "4.941e-01", "epoch": 0.00676} {"step": 3385, "loss": 1.5242, "grad_norm": "5.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.294e+00", "anc_loss": "2.334e+00", "dlm_acc": "2.072e-01", "anc_acc": "2.031e-01", "epoch": 0.00677} {"step": 3390, "loss": 1.2196, "grad_norm": "1.117e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.372e+00", "anc_loss": "1.416e+00", "dlm_acc": "4.787e-01", "anc_acc": "4.694e-01", "epoch": 0.00678} {"step": 3395, "loss": 1.4037, "grad_norm": "4.938e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.434e+00", "dlm_acc": "4.895e-01", "anc_acc": "4.828e-01", "epoch": 0.00679} {"step": 3400, "loss": 1.7138, "grad_norm": "7.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.627e+00", "dlm_acc": "4.721e-01", "anc_acc": "4.659e-01", "epoch": 0.0068} {"step": 3405, "loss": 1.474, "grad_norm": "5.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.447e-01", "anc_acc": "5.362e-01", "epoch": 0.00681} {"step": 3410, "loss": 1.36, "grad_norm": "5.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.545e+00", "dlm_acc": "4.873e-01", "anc_acc": "4.786e-01", "epoch": 0.00682} {"step": 3415, "loss": 1.1206, "grad_norm": "4.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.519e+00", "anc_loss": "1.577e+00", "dlm_acc": "4.760e-01", "anc_acc": "4.685e-01", "epoch": 0.00683} {"step": 3420, "loss": 1.7799, "grad_norm": "6.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.988e+00", "anc_loss": "2.050e+00", "dlm_acc": "3.935e-01", "anc_acc": "3.864e-01", "epoch": 0.00684} {"step": 3425, "loss": 1.3613, "grad_norm": "4.337e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.802e+00", "anc_loss": "1.859e+00", "dlm_acc": "4.171e-01", "anc_acc": "4.104e-01", "epoch": 0.00685} {"step": 3430, "loss": 1.0863, "grad_norm": "1.011e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.475e+00", "dlm_acc": "4.843e-01", "anc_acc": "4.771e-01", "epoch": 0.00686} {"step": 3435, "loss": 1.6091, "grad_norm": "5.462e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.675e+00", "dlm_acc": "4.995e-01", "anc_acc": "4.923e-01", "epoch": 0.00687} {"step": 3440, "loss": 2.0935, "grad_norm": "5.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.679e+00", "anc_loss": "1.743e+00", "dlm_acc": "4.809e-01", "anc_acc": "4.717e-01", "epoch": 0.00688} {"step": 3445, "loss": 2.0147, "grad_norm": "4.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.253e+00", "anc_loss": "2.302e+00", "dlm_acc": "2.645e-01", "anc_acc": "2.632e-01", "epoch": 0.00689} {"step": 3450, "loss": 1.4016, "grad_norm": "3.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.839e+00", "anc_loss": "1.878e+00", "dlm_acc": "3.144e-01", "anc_acc": "3.088e-01", "epoch": 0.0069} {"step": 3455, "loss": 1.8789, "grad_norm": "4.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.633e+00", "anc_loss": "1.688e+00", "dlm_acc": "5.108e-01", "anc_acc": "5.045e-01", "epoch": 0.00691} {"step": 3460, "loss": 1.2896, "grad_norm": "4.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.913e-01", "anc_acc": "5.849e-01", "epoch": 0.00692} {"step": 3465, "loss": 1.387, "grad_norm": "5.557e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.401e+00", "anc_loss": "1.446e+00", "dlm_acc": "4.654e-01", "anc_acc": "4.607e-01", "epoch": 0.00693} {"step": 3470, "loss": 1.6113, "grad_norm": "4.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.387e-01", "anc_acc": "5.300e-01", "epoch": 0.00694} {"step": 3475, "loss": 1.544, "grad_norm": "2.879e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.295e-01", "anc_acc": "5.207e-01", "epoch": 0.00695} {"step": 3480, "loss": 1.3797, "grad_norm": "4.470e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.350e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.106e-01", "anc_acc": "5.033e-01", "epoch": 0.00696} {"step": 3485, "loss": 1.4645, "grad_norm": "6.036e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.624e+00", "anc_loss": "1.685e+00", "dlm_acc": "5.008e-01", "anc_acc": "4.930e-01", "epoch": 0.00697} {"step": 3490, "loss": 1.0166, "grad_norm": "7.980e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.509e-01", "epoch": 0.00698} {"step": 3495, "loss": 1.2801, "grad_norm": "4.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.653e+00", "dlm_acc": "4.730e-01", "anc_acc": "4.649e-01", "epoch": 0.00699} {"step": 3500, "loss": 1.2665, "grad_norm": "5.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.763e-01", "anc_acc": "5.671e-01", "epoch": 0.007} {"step": 3505, "loss": 1.5922, "grad_norm": "7.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.201e+00", "anc_loss": "1.232e+00", "dlm_acc": "5.226e-01", "anc_acc": "5.194e-01", "epoch": 0.00701} {"step": 3510, "loss": 2.1369, "grad_norm": "5.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.035e+00", "anc_loss": "1.072e+00", "dlm_acc": "6.344e-01", "anc_acc": "6.303e-01", "epoch": 0.00702} {"step": 3515, "loss": 1.2122, "grad_norm": "5.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.770e-01", "anc_loss": "9.129e-01", "dlm_acc": "6.021e-01", "anc_acc": "5.951e-01", "epoch": 0.00703} {"step": 3520, "loss": 1.2566, "grad_norm": "3.401e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.687e-01", "anc_loss": "6.859e-01", "dlm_acc": "5.966e-01", "anc_acc": "5.926e-01", "epoch": 0.00704} {"step": 3525, "loss": 1.4977, "grad_norm": "3.877e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.513e+00", "anc_loss": "1.574e+00", "dlm_acc": "4.712e-01", "anc_acc": "4.638e-01", "epoch": 0.00705} {"step": 3530, "loss": 1.2948, "grad_norm": "1.048e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.164e+00", "dlm_acc": "5.616e-01", "anc_acc": "5.524e-01", "epoch": 0.00706} {"step": 3535, "loss": 1.441, "grad_norm": "1.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.148e-01", "anc_loss": "9.414e-01", "dlm_acc": "5.146e-01", "anc_acc": "5.099e-01", "epoch": 0.00707} {"step": 3540, "loss": 1.2417, "grad_norm": "3.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.384e-01", "anc_acc": "5.328e-01", "epoch": 0.00708} {"step": 3545, "loss": 1.733, "grad_norm": "3.878e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.361e+00", "dlm_acc": "4.902e-01", "anc_acc": "4.851e-01", "epoch": 0.00709} {"step": 3550, "loss": 1.4093, "grad_norm": "4.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.536e+00", "anc_loss": "1.586e+00", "dlm_acc": "4.986e-01", "anc_acc": "4.898e-01", "epoch": 0.0071} {"step": 3555, "loss": 1.257, "grad_norm": "5.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.467e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.250e-01", "anc_acc": "5.172e-01", "epoch": 0.00711} {"step": 3560, "loss": 1.3775, "grad_norm": "4.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.209e+00", "dlm_acc": "6.100e-01", "anc_acc": "6.011e-01", "epoch": 0.00712} {"step": 3565, "loss": 1.3863, "grad_norm": "3.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.165e+00", "dlm_acc": "4.554e-01", "anc_acc": "4.510e-01", "epoch": 0.00713} {"step": 3570, "loss": 1.3582, "grad_norm": "6.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.637e+00", "anc_loss": "1.697e+00", "dlm_acc": "4.846e-01", "anc_acc": "4.763e-01", "epoch": 0.00714} {"step": 3575, "loss": 1.0634, "grad_norm": "2.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.174e+00", "dlm_acc": "5.461e-01", "anc_acc": "5.383e-01", "epoch": 0.00715} {"step": 3580, "loss": 1.1847, "grad_norm": "3.879e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.470e-01", "anc_loss": "7.739e-01", "dlm_acc": "6.592e-01", "anc_acc": "6.535e-01", "epoch": 0.00716} {"step": 3585, "loss": 0.8854, "grad_norm": "3.931e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.625e-01", "anc_loss": "9.129e-01", "dlm_acc": "6.818e-01", "anc_acc": "6.731e-01", "epoch": 0.00717} {"step": 3590, "loss": 1.2648, "grad_norm": "3.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.438e-01", "anc_loss": "8.766e-01", "dlm_acc": "6.263e-01", "anc_acc": "6.195e-01", "epoch": 0.00718} {"step": 3595, "loss": 1.6439, "grad_norm": "4.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.574e+00", "anc_loss": "1.672e+00", "dlm_acc": "5.107e-01", "anc_acc": "5.037e-01", "epoch": 0.00719} {"step": 3600, "loss": 1.187, "grad_norm": "6.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.900e-01", "anc_loss": "9.213e-01", "dlm_acc": "6.108e-01", "anc_acc": "6.043e-01", "epoch": 0.0072} {"step": 3605, "loss": 1.4815, "grad_norm": "6.187e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.310e+00", "dlm_acc": "4.969e-01", "anc_acc": "4.875e-01", "epoch": 0.00721} {"step": 3610, "loss": 1.4058, "grad_norm": "5.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.516e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.447e-01", "anc_acc": "5.366e-01", "epoch": 0.00722} {"step": 3615, "loss": 1.3315, "grad_norm": "4.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.776e-01", "anc_acc": "5.712e-01", "epoch": 0.00723} {"step": 3620, "loss": 0.9994, "grad_norm": "5.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.070e+00", "dlm_acc": "6.247e-01", "anc_acc": "6.179e-01", "epoch": 0.00724} {"step": 3625, "loss": 1.1908, "grad_norm": "3.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.514e+00", "dlm_acc": "4.585e-01", "anc_acc": "4.477e-01", "epoch": 0.00725} {"step": 3630, "loss": 1.0974, "grad_norm": "4.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.709e+00", "anc_loss": "1.750e+00", "dlm_acc": "4.215e-01", "anc_acc": "4.152e-01", "epoch": 0.00726} {"step": 3635, "loss": 1.5001, "grad_norm": "2.224e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.059e+00", "anc_loss": "2.106e+00", "dlm_acc": "3.879e-01", "anc_acc": "3.796e-01", "epoch": 0.00727} {"step": 3640, "loss": 0.959, "grad_norm": "3.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.891e-01", "anc_loss": "1.034e+00", "dlm_acc": "6.130e-01", "anc_acc": "6.075e-01", "epoch": 0.00728} {"step": 3645, "loss": 1.1494, "grad_norm": "4.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.481e+00", "anc_loss": "1.533e+00", "dlm_acc": "4.955e-01", "anc_acc": "4.889e-01", "epoch": 0.00729} {"step": 3650, "loss": 1.3143, "grad_norm": "4.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.349e+00", "anc_loss": "1.390e+00", "dlm_acc": "5.407e-01", "anc_acc": "5.342e-01", "epoch": 0.0073} {"step": 3655, "loss": 1.1517, "grad_norm": "2.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.401e+00", "anc_loss": "1.457e+00", "dlm_acc": "4.681e-01", "anc_acc": "4.571e-01", "epoch": 0.00731} {"step": 3660, "loss": 1.0501, "grad_norm": "2.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.114e-01", "anc_loss": "9.490e-01", "dlm_acc": "6.361e-01", "anc_acc": "6.264e-01", "epoch": 0.00732} {"step": 3665, "loss": 1.1283, "grad_norm": "1.220e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.321e+00", "dlm_acc": "5.305e-01", "anc_acc": "5.253e-01", "epoch": 0.00733} {"step": 3670, "loss": 1.6743, "grad_norm": "3.945e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.566e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.661e-01", "anc_acc": "4.562e-01", "epoch": 0.00734} {"step": 3675, "loss": 1.6639, "grad_norm": "4.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.558e+00", "dlm_acc": "4.719e-01", "anc_acc": "4.655e-01", "epoch": 0.00735} {"step": 3680, "loss": 1.3817, "grad_norm": "5.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.034e+00", "anc_loss": "1.068e+00", "dlm_acc": "5.973e-01", "anc_acc": "5.921e-01", "epoch": 0.00736} {"step": 3685, "loss": 1.2008, "grad_norm": "3.980e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.346e+00", "dlm_acc": "5.304e-01", "anc_acc": "5.237e-01", "epoch": 0.00737} {"step": 3690, "loss": 1.6128, "grad_norm": "4.650e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.446e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.478e-01", "anc_acc": "5.428e-01", "epoch": 0.00738} {"step": 3695, "loss": 1.4813, "grad_norm": "6.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.490e+00", "dlm_acc": "5.391e-01", "anc_acc": "5.308e-01", "epoch": 0.00739} {"step": 3700, "loss": 1.7116, "grad_norm": "5.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.159e+00", "anc_loss": "2.192e+00", "dlm_acc": "2.504e-01", "anc_acc": "2.463e-01", "epoch": 0.0074} {"step": 3705, "loss": 1.7507, "grad_norm": "5.370e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.619e+00", "dlm_acc": "4.478e-01", "anc_acc": "4.396e-01", "epoch": 0.00741} {"step": 3710, "loss": 1.1137, "grad_norm": "3.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.243e+00", "dlm_acc": "5.563e-01", "anc_acc": "5.493e-01", "epoch": 0.00742} {"step": 3715, "loss": 1.2939, "grad_norm": "6.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.055e-01", "anc_loss": "9.305e-01", "dlm_acc": "5.556e-01", "anc_acc": "5.518e-01", "epoch": 0.00743} {"step": 3720, "loss": 1.4012, "grad_norm": "5.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.237e+00", "anc_loss": "1.305e+00", "dlm_acc": "4.684e-01", "anc_acc": "4.498e-01", "epoch": 0.00744} {"step": 3725, "loss": 1.6791, "grad_norm": "4.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.694e+00", "dlm_acc": "4.128e-01", "anc_acc": "4.012e-01", "epoch": 0.00745} {"step": 3730, "loss": 1.3159, "grad_norm": "3.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.245e+00", "dlm_acc": "4.855e-01", "anc_acc": "4.707e-01", "epoch": 0.00746} {"step": 3735, "loss": 1.1589, "grad_norm": "7.791e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.192e+00", "dlm_acc": "5.762e-01", "anc_acc": "5.689e-01", "epoch": 0.00747} {"step": 3740, "loss": 1.1089, "grad_norm": "3.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.335e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.124e-01", "anc_acc": "5.054e-01", "epoch": 0.00748} {"step": 3745, "loss": 0.9956, "grad_norm": "4.482e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.475e+00", "dlm_acc": "4.587e-01", "anc_acc": "4.537e-01", "epoch": 0.00749} {"step": 3750, "loss": 1.0215, "grad_norm": "3.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.129e+00", "dlm_acc": "5.394e-01", "anc_acc": "5.310e-01", "epoch": 0.0075} {"step": 3755, "loss": 1.5385, "grad_norm": "7.818e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.717e+00", "anc_loss": "1.775e+00", "dlm_acc": "4.701e-01", "anc_acc": "4.623e-01", "epoch": 0.00751} {"step": 3760, "loss": 1.6723, "grad_norm": "1.601e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.630e+00", "anc_loss": "1.686e+00", "dlm_acc": "4.741e-01", "anc_acc": "4.650e-01", "epoch": 0.00752} {"step": 3765, "loss": 1.8739, "grad_norm": "7.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.566e+00", "anc_loss": "1.608e+00", "dlm_acc": "4.886e-01", "anc_acc": "4.802e-01", "epoch": 0.00753} {"step": 3770, "loss": 1.5545, "grad_norm": "2.510e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.290e-01", "anc_acc": "5.205e-01", "epoch": 0.00754} {"step": 3775, "loss": 1.8902, "grad_norm": "7.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.911e+00", "anc_loss": "1.967e+00", "dlm_acc": "3.955e-01", "anc_acc": "3.930e-01", "epoch": 0.00755} {"step": 3780, "loss": 1.617, "grad_norm": "1.005e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.258e+00", "anc_loss": "1.295e+00", "dlm_acc": "4.781e-01", "anc_acc": "4.721e-01", "epoch": 0.00756} {"step": 3785, "loss": 1.7119, "grad_norm": "9.983e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.477e+00", "anc_loss": "2.498e+00", "dlm_acc": "1.278e-01", "anc_acc": "1.259e-01", "epoch": 0.00757} {"step": 3790, "loss": 2.0061, "grad_norm": "4.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.944e+00", "anc_loss": "2.953e+00", "dlm_acc": "3.865e-02", "anc_acc": "3.801e-02", "epoch": 0.00758} {"step": 3795, "loss": 1.4271, "grad_norm": "3.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.311e+00", "dlm_acc": "4.400e-01", "anc_acc": "4.314e-01", "epoch": 0.00759} {"step": 3800, "loss": 1.4273, "grad_norm": "4.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.488e+00", "dlm_acc": "4.891e-01", "anc_acc": "4.823e-01", "epoch": 0.0076} {"step": 3805, "loss": 1.5448, "grad_norm": "4.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.362e+00", "dlm_acc": "5.545e-01", "anc_acc": "5.487e-01", "epoch": 0.00761} {"step": 3810, "loss": 1.3928, "grad_norm": "4.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.207e-01", "anc_loss": "8.508e-01", "dlm_acc": "6.330e-01", "anc_acc": "6.255e-01", "epoch": 0.00762} {"step": 3815, "loss": 1.4156, "grad_norm": "4.470e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.160e-01", "anc_loss": "6.314e-01", "dlm_acc": "6.678e-01", "anc_acc": "6.664e-01", "epoch": 0.00763} {"step": 3820, "loss": 1.0116, "grad_norm": "3.183e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.633e-01", "anc_loss": "1.010e+00", "dlm_acc": "6.218e-01", "anc_acc": "6.143e-01", "epoch": 0.00764} {"step": 3825, "loss": 1.4672, "grad_norm": "7.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.844e-01", "anc_loss": "1.016e+00", "dlm_acc": "5.718e-01", "anc_acc": "5.658e-01", "epoch": 0.00765} {"step": 3830, "loss": 1.3293, "grad_norm": "6.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.324e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.041e-01", "anc_acc": "4.975e-01", "epoch": 0.00766} {"step": 3835, "loss": 0.9635, "grad_norm": "3.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.953e-01", "anc_loss": "6.094e-01", "dlm_acc": "6.094e-01", "anc_acc": "6.055e-01", "epoch": 0.00767} {"step": 3840, "loss": 1.1108, "grad_norm": "3.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.918e-01", "anc_loss": "9.281e-01", "dlm_acc": "5.865e-01", "anc_acc": "5.789e-01", "epoch": 0.00768} {"step": 3845, "loss": 1.5142, "grad_norm": "3.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.469e+00", "dlm_acc": "5.279e-01", "anc_acc": "5.204e-01", "epoch": 0.00769} {"step": 3850, "loss": 1.2874, "grad_norm": "5.815e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.233e+00", "dlm_acc": "5.544e-01", "anc_acc": "5.498e-01", "epoch": 0.0077} {"step": 3855, "loss": 1.3547, "grad_norm": "3.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.219e-01", "anc_loss": "6.305e-01", "dlm_acc": "5.237e-01", "anc_acc": "5.204e-01", "epoch": 0.00771} {"step": 3860, "loss": 1.6869, "grad_norm": "4.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.453e+00", "dlm_acc": "4.750e-01", "anc_acc": "4.711e-01", "epoch": 0.00772} {"step": 3865, "loss": 1.2415, "grad_norm": "4.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.165e+00", "dlm_acc": "4.873e-01", "anc_acc": "4.792e-01", "epoch": 0.00773} {"step": 3870, "loss": 1.4028, "grad_norm": "4.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.133e+00", "dlm_acc": "5.425e-01", "anc_acc": "5.348e-01", "epoch": 0.00774} {"step": 3875, "loss": 1.4246, "grad_norm": "2.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.128e+00", "anc_loss": "1.146e+00", "dlm_acc": "3.924e-01", "anc_acc": "3.902e-01", "epoch": 0.00775} {"step": 3880, "loss": 1.1301, "grad_norm": "2.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.074e+00", "dlm_acc": "6.228e-01", "anc_acc": "6.151e-01", "epoch": 0.00776} {"step": 3885, "loss": 1.1563, "grad_norm": "1.894e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.311e-01", "anc_loss": "7.559e-01", "dlm_acc": "6.397e-01", "anc_acc": "6.332e-01", "epoch": 0.00777} {"step": 3890, "loss": 1.4148, "grad_norm": "6.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.201e+00", "anc_loss": "1.243e+00", "dlm_acc": "5.315e-01", "anc_acc": "5.219e-01", "epoch": 0.00778} {"step": 3895, "loss": 1.2478, "grad_norm": "4.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.387e-01", "anc_loss": "3.659e-01", "dlm_acc": "8.513e-01", "anc_acc": "8.400e-01", "epoch": 0.00779} {"step": 3900, "loss": 1.0666, "grad_norm": "3.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.812e-01", "anc_loss": "9.062e-01", "dlm_acc": "4.940e-01", "anc_acc": "4.904e-01", "epoch": 0.0078} {"step": 3905, "loss": 1.051, "grad_norm": "2.122e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.148e-01", "anc_loss": "9.195e-01", "dlm_acc": "4.117e-01", "anc_acc": "4.103e-01", "epoch": 0.00781} {"step": 3910, "loss": 0.9896, "grad_norm": "1.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.711e-01", "anc_loss": "6.762e-01", "dlm_acc": "4.325e-01", "anc_acc": "4.307e-01", "epoch": 0.00782} {"step": 3915, "loss": 1.2596, "grad_norm": "3.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.695e-01", "anc_loss": "7.742e-01", "dlm_acc": "4.276e-01", "anc_acc": "4.253e-01", "epoch": 0.00783} {"step": 3920, "loss": 1.3534, "grad_norm": "4.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.500e-01", "anc_loss": "7.547e-01", "dlm_acc": "4.205e-01", "anc_acc": "4.196e-01", "epoch": 0.00784} {"step": 3925, "loss": 1.6921, "grad_norm": "5.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.290e+00", "dlm_acc": "4.133e-01", "anc_acc": "4.097e-01", "epoch": 0.00785} {"step": 3930, "loss": 1.1709, "grad_norm": "6.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.371e-01", "anc_loss": "9.691e-01", "dlm_acc": "5.812e-01", "anc_acc": "5.773e-01", "epoch": 0.00786} {"step": 3935, "loss": 1.533, "grad_norm": "3.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.199e+00", "anc_loss": "1.249e+00", "dlm_acc": "5.962e-01", "anc_acc": "5.889e-01", "epoch": 0.00787} {"step": 3940, "loss": 1.1338, "grad_norm": "5.744e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.313e-01", "anc_loss": "8.692e-01", "dlm_acc": "6.498e-01", "anc_acc": "6.437e-01", "epoch": 0.00788} {"step": 3945, "loss": 1.2098, "grad_norm": "7.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.237e+00", "dlm_acc": "5.457e-01", "anc_acc": "5.381e-01", "epoch": 0.00789} {"step": 3950, "loss": 0.8422, "grad_norm": "7.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.906e-01", "anc_loss": "9.104e-01", "dlm_acc": "5.779e-01", "anc_acc": "5.714e-01", "epoch": 0.0079} {"step": 3955, "loss": 1.2076, "grad_norm": "7.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.574e-01", "anc_loss": "9.997e-01", "dlm_acc": "6.222e-01", "anc_acc": "6.150e-01", "epoch": 0.00791} {"step": 3960, "loss": 1.15, "grad_norm": "5.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.191e+00", "dlm_acc": "4.949e-01", "anc_acc": "4.974e-01", "epoch": 0.00792} {"step": 3965, "loss": 1.2082, "grad_norm": "6.573e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.477e-01", "anc_loss": "9.805e-01", "dlm_acc": "5.621e-01", "anc_acc": "5.575e-01", "epoch": 0.00793} {"step": 3970, "loss": 1.616, "grad_norm": "6.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.602e+00", "anc_loss": "1.648e+00", "dlm_acc": "3.936e-01", "anc_acc": "3.872e-01", "epoch": 0.00794} {"step": 3975, "loss": 1.7047, "grad_norm": "4.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.759e+00", "anc_loss": "1.816e+00", "dlm_acc": "4.366e-01", "anc_acc": "4.274e-01", "epoch": 0.00795} {"step": 3980, "loss": 1.3091, "grad_norm": "4.352e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.118e+00", "anc_loss": "1.160e+00", "dlm_acc": "5.995e-01", "anc_acc": "5.918e-01", "epoch": 0.00796} {"step": 3985, "loss": 1.4068, "grad_norm": "3.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.451e+00", "anc_loss": "1.502e+00", "dlm_acc": "4.598e-01", "anc_acc": "4.502e-01", "epoch": 0.00797} {"step": 3990, "loss": 1.286, "grad_norm": "5.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.250e-01", "anc_loss": "8.648e-01", "dlm_acc": "7.015e-01", "anc_acc": "6.936e-01", "epoch": 0.00798} {"step": 3995, "loss": 1.102, "grad_norm": "4.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.104e+00", "anc_loss": "1.166e+00", "dlm_acc": "5.805e-01", "anc_acc": "5.686e-01", "epoch": 0.00799} {"step": 4000, "loss": 1.172, "grad_norm": "4.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.307e+00", "dlm_acc": "4.965e-01", "anc_acc": "4.905e-01", "epoch": 0.008} {"step": 4005, "loss": 1.3793, "grad_norm": "2.424e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.497e+00", "anc_loss": "1.538e+00", "dlm_acc": "4.642e-01", "anc_acc": "4.586e-01", "epoch": 0.00801} {"step": 4010, "loss": 0.8651, "grad_norm": "2.326e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.664e-01", "anc_loss": "6.805e-01", "dlm_acc": "5.237e-01", "anc_acc": "5.219e-01", "epoch": 0.00802} {"step": 4015, "loss": 1.7223, "grad_norm": "8.252e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.690e+00", "anc_loss": "1.741e+00", "dlm_acc": "4.394e-01", "anc_acc": "4.296e-01", "epoch": 0.00803} {"step": 4020, "loss": 1.1223, "grad_norm": "4.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.115e+00", "dlm_acc": "6.065e-01", "anc_acc": "6.014e-01", "epoch": 0.00804} {"step": 4025, "loss": 1.0824, "grad_norm": "4.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.467e-01", "anc_acc": "5.410e-01", "epoch": 0.00805} {"step": 4030, "loss": 1.4134, "grad_norm": "6.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.343e+00", "dlm_acc": "5.103e-01", "anc_acc": "5.011e-01", "epoch": 0.00806} {"step": 4035, "loss": 1.4582, "grad_norm": "2.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.078e+00", "anc_loss": "1.116e+00", "dlm_acc": "5.034e-01", "anc_acc": "4.939e-01", "epoch": 0.00807} {"step": 4040, "loss": 1.3168, "grad_norm": "3.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.082e+00", "dlm_acc": "5.614e-01", "anc_acc": "5.507e-01", "epoch": 0.00808} {"step": 4045, "loss": 1.5291, "grad_norm": "3.230e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.666e+00", "anc_loss": "1.724e+00", "dlm_acc": "4.614e-01", "anc_acc": "4.550e-01", "epoch": 0.00809} {"step": 4050, "loss": 1.1744, "grad_norm": "3.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.036e+00", "anc_loss": "1.071e+00", "dlm_acc": "5.962e-01", "anc_acc": "5.916e-01", "epoch": 0.0081} {"step": 4055, "loss": 1.0722, "grad_norm": "4.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.120e+00", "dlm_acc": "5.661e-01", "anc_acc": "5.590e-01", "epoch": 0.00811} {"step": 4060, "loss": 1.0661, "grad_norm": "4.257e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.493e-01", "epoch": 0.00812} {"step": 4065, "loss": 1.2026, "grad_norm": "3.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e+00", "anc_loss": "1.513e+00", "dlm_acc": "4.884e-01", "anc_acc": "4.825e-01", "epoch": 0.00813} {"step": 4070, "loss": 1.244, "grad_norm": "5.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.376e+00", "anc_loss": "1.431e+00", "dlm_acc": "5.454e-01", "anc_acc": "5.358e-01", "epoch": 0.00814} {"step": 4075, "loss": 1.2037, "grad_norm": "5.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.858e-01", "anc_acc": "5.795e-01", "epoch": 0.00815} {"step": 4080, "loss": 1.4432, "grad_norm": "3.438e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.711e+00", "anc_loss": "1.775e+00", "dlm_acc": "4.738e-01", "anc_acc": "4.657e-01", "epoch": 0.00816} {"step": 4085, "loss": 1.6614, "grad_norm": "4.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.667e+00", "anc_loss": "1.725e+00", "dlm_acc": "4.498e-01", "anc_acc": "4.394e-01", "epoch": 0.00817} {"step": 4090, "loss": 1.2256, "grad_norm": "3.899e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.268e+00", "dlm_acc": "5.515e-01", "anc_acc": "5.407e-01", "epoch": 0.00818} {"step": 4095, "loss": 1.2402, "grad_norm": "6.219e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.267e+00", "dlm_acc": "4.840e-01", "anc_acc": "4.774e-01", "epoch": 0.00819} {"step": 4100, "loss": 0.7889, "grad_norm": "2.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.283e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.205e-01", "anc_acc": "5.112e-01", "epoch": 0.0082} {"step": 4105, "loss": 0.948, "grad_norm": "2.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.141e-01", "anc_loss": "8.258e-01", "dlm_acc": "5.025e-01", "anc_acc": "5.014e-01", "epoch": 0.00821} {"step": 4110, "loss": 1.327, "grad_norm": "8.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.766e+00", "anc_loss": "1.817e+00", "dlm_acc": "4.583e-01", "anc_acc": "4.514e-01", "epoch": 0.00822} {"step": 4115, "loss": 1.6093, "grad_norm": "7.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.683e+00", "anc_loss": "1.740e+00", "dlm_acc": "4.636e-01", "anc_acc": "4.545e-01", "epoch": 0.00823} {"step": 4120, "loss": 1.1836, "grad_norm": "3.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.212e-01", "anc_acc": "5.144e-01", "epoch": 0.00824} {"step": 4125, "loss": 1.0164, "grad_norm": "2.089e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.361e-01", "anc_loss": "8.619e-01", "dlm_acc": "6.332e-01", "anc_acc": "6.274e-01", "epoch": 0.00825} {"step": 4130, "loss": 0.9865, "grad_norm": "3.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.258e-01", "anc_loss": "8.609e-01", "dlm_acc": "5.801e-01", "anc_acc": "5.668e-01", "epoch": 0.00826} {"step": 4135, "loss": 0.8583, "grad_norm": "6.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.461e-01", "anc_loss": "9.906e-01", "dlm_acc": "5.862e-01", "anc_acc": "5.753e-01", "epoch": 0.00827} {"step": 4140, "loss": 0.9589, "grad_norm": "2.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.207e+00", "anc_loss": "1.265e+00", "dlm_acc": "5.419e-01", "anc_acc": "5.311e-01", "epoch": 0.00828} {"step": 4145, "loss": 1.625, "grad_norm": "6.908e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.425e+00", "dlm_acc": "5.186e-01", "anc_acc": "5.094e-01", "epoch": 0.00829} {"step": 4150, "loss": 1.1313, "grad_norm": "5.410e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.369e+00", "anc_loss": "1.430e+00", "dlm_acc": "4.882e-01", "anc_acc": "4.786e-01", "epoch": 0.0083} {"step": 4155, "loss": 1.2289, "grad_norm": "5.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.081e-01", "anc_acc": "4.977e-01", "epoch": 0.00831} {"step": 4160, "loss": 1.0223, "grad_norm": "2.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.410e+00", "anc_loss": "1.468e+00", "dlm_acc": "5.123e-01", "anc_acc": "5.021e-01", "epoch": 0.00832} {"step": 4165, "loss": 1.1998, "grad_norm": "5.765e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.499e+00", "anc_loss": "1.553e+00", "dlm_acc": "4.972e-01", "anc_acc": "4.872e-01", "epoch": 0.00833} {"step": 4170, "loss": 1.1467, "grad_norm": "3.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.398e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.455e-01", "anc_acc": "5.349e-01", "epoch": 0.00834} {"step": 4175, "loss": 1.3093, "grad_norm": "4.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.562e+00", "dlm_acc": "5.192e-01", "anc_acc": "5.088e-01", "epoch": 0.00835} {"step": 4180, "loss": 1.0899, "grad_norm": "3.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.350e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.276e-01", "anc_acc": "5.176e-01", "epoch": 0.00836} {"step": 4185, "loss": 1.7887, "grad_norm": "6.702e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.612e+00", "anc_loss": "1.680e+00", "dlm_acc": "4.648e-01", "anc_acc": "4.528e-01", "epoch": 0.00837} {"step": 4190, "loss": 1.3203, "grad_norm": "1.006e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.722e+00", "anc_loss": "1.780e+00", "dlm_acc": "4.610e-01", "anc_acc": "4.544e-01", "epoch": 0.00838} {"step": 4195, "loss": 1.6374, "grad_norm": "4.653e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.670e+00", "anc_loss": "1.733e+00", "dlm_acc": "4.509e-01", "anc_acc": "4.430e-01", "epoch": 0.00839} {"step": 4200, "loss": 1.5981, "grad_norm": "3.220e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.589e+00", "dlm_acc": "5.352e-01", "anc_acc": "5.263e-01", "epoch": 0.0084} {"step": 4205, "loss": 1.6969, "grad_norm": "5.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.817e+00", "anc_loss": "1.894e+00", "dlm_acc": "4.631e-01", "anc_acc": "4.529e-01", "epoch": 0.00841} {"step": 4210, "loss": 1.7445, "grad_norm": "7.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.434e-01", "anc_acc": "5.364e-01", "epoch": 0.00842} {"step": 4215, "loss": 1.6577, "grad_norm": "6.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.607e+00", "anc_loss": "1.669e+00", "dlm_acc": "4.869e-01", "anc_acc": "4.785e-01", "epoch": 0.00843} {"step": 4220, "loss": 0.9509, "grad_norm": "2.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.180e+00", "dlm_acc": "5.776e-01", "anc_acc": "5.683e-01", "epoch": 0.00844} {"step": 4225, "loss": 1.145, "grad_norm": "4.011e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.821e-01", "anc_acc": "5.719e-01", "epoch": 0.00845} {"step": 4230, "loss": 1.4437, "grad_norm": "3.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.350e+00", "anc_loss": "1.404e+00", "dlm_acc": "5.601e-01", "anc_acc": "5.517e-01", "epoch": 0.00846} {"step": 4235, "loss": 1.5458, "grad_norm": "6.362e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.673e+00", "anc_loss": "1.731e+00", "dlm_acc": "4.760e-01", "anc_acc": "4.675e-01", "epoch": 0.00847} {"step": 4240, "loss": 1.2119, "grad_norm": "4.725e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.367e-01", "epoch": 0.00848} {"step": 4245, "loss": 1.2675, "grad_norm": "4.690e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.040e-01", "anc_acc": "4.968e-01", "epoch": 0.00849} {"step": 4250, "loss": 1.2714, "grad_norm": "4.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.106e+00", "anc_loss": "1.159e+00", "dlm_acc": "5.833e-01", "anc_acc": "5.714e-01", "epoch": 0.0085} {"step": 4255, "loss": 1.3303, "grad_norm": "6.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.607e-01", "anc_acc": "5.499e-01", "epoch": 0.00851} {"step": 4260, "loss": 1.15, "grad_norm": "5.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.168e+00", "dlm_acc": "6.276e-01", "anc_acc": "6.170e-01", "epoch": 0.00852} {"step": 4265, "loss": 1.1049, "grad_norm": "3.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.047e+00", "anc_loss": "1.100e+00", "dlm_acc": "6.165e-01", "anc_acc": "6.053e-01", "epoch": 0.00853} {"step": 4270, "loss": 1.6051, "grad_norm": "4.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.852e+00", "anc_loss": "1.911e+00", "dlm_acc": "4.423e-01", "anc_acc": "4.362e-01", "epoch": 0.00854} {"step": 4275, "loss": 1.3864, "grad_norm": "4.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.496e+00", "anc_loss": "1.560e+00", "dlm_acc": "5.536e-01", "anc_acc": "5.449e-01", "epoch": 0.00855} {"step": 4280, "loss": 1.3282, "grad_norm": "2.525e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.376e+00", "anc_loss": "1.435e+00", "dlm_acc": "5.323e-01", "anc_acc": "5.220e-01", "epoch": 0.00856} {"step": 4285, "loss": 1.4188, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.493e+00", "anc_loss": "1.543e+00", "dlm_acc": "5.086e-01", "anc_acc": "5.011e-01", "epoch": 0.00857} {"step": 4290, "loss": 1.6493, "grad_norm": "1.069e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.708e+00", "anc_loss": "1.777e+00", "dlm_acc": "4.844e-01", "anc_acc": "4.754e-01", "epoch": 0.00858} {"step": 4295, "loss": 1.3856, "grad_norm": "6.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.214e-01", "anc_acc": "5.155e-01", "epoch": 0.00859} {"step": 4300, "loss": 1.0788, "grad_norm": "3.583e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.732e-01", "anc_loss": "6.936e-01", "dlm_acc": "6.424e-01", "anc_acc": "6.385e-01", "epoch": 0.0086} {"step": 4305, "loss": 1.3347, "grad_norm": "3.727e+00", "learning_rate": "1.000e-04", "dlm_loss": "4.352e-01", "anc_loss": "4.287e-01", "dlm_acc": "7.427e-01", "anc_acc": "7.430e-01", "epoch": 0.00861} {"step": 4310, "loss": 1.4128, "grad_norm": "4.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.412e-01", "anc_loss": "3.516e-01", "dlm_acc": "7.296e-01", "anc_acc": "7.233e-01", "epoch": 0.00862} {"step": 4315, "loss": 1.2431, "grad_norm": "3.506e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.253e+00", "dlm_acc": "5.446e-01", "anc_acc": "5.405e-01", "epoch": 0.00863} {"step": 4320, "loss": 1.4548, "grad_norm": "3.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.358e+00", "anc_loss": "1.403e+00", "dlm_acc": "5.654e-01", "anc_acc": "5.598e-01", "epoch": 0.00864} {"step": 4325, "loss": 1.1935, "grad_norm": "4.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.060e+00", "anc_loss": "1.102e+00", "dlm_acc": "6.445e-01", "anc_acc": "6.369e-01", "epoch": 0.00865} {"step": 4330, "loss": 1.2694, "grad_norm": "4.261e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.175e+00", "dlm_acc": "5.270e-01", "anc_acc": "5.198e-01", "epoch": 0.00866} {"step": 4335, "loss": 1.2377, "grad_norm": "5.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.828e-01", "anc_loss": "6.867e-01", "dlm_acc": "4.961e-01", "anc_acc": "4.941e-01", "epoch": 0.00867} {"step": 4340, "loss": 1.4788, "grad_norm": "4.389e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.156e-01", "anc_loss": "7.172e-01", "dlm_acc": "4.744e-01", "anc_acc": "4.717e-01", "epoch": 0.00868} {"step": 4345, "loss": 1.7216, "grad_norm": "5.780e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.727e-01", "anc_loss": "9.984e-01", "dlm_acc": "5.385e-01", "anc_acc": "5.353e-01", "epoch": 0.00869} {"step": 4350, "loss": 1.2856, "grad_norm": "3.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.445e-01", "anc_loss": "8.594e-01", "dlm_acc": "5.438e-01", "anc_acc": "5.408e-01", "epoch": 0.0087} {"step": 4355, "loss": 1.3089, "grad_norm": "4.511e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.587e+00", "anc_loss": "1.658e+00", "dlm_acc": "4.849e-01", "anc_acc": "4.744e-01", "epoch": 0.00871} {"step": 4360, "loss": 1.4181, "grad_norm": "4.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.264e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.139e-01", "anc_acc": "5.112e-01", "epoch": 0.00872} {"step": 4365, "loss": 1.2823, "grad_norm": "4.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.172e-01", "anc_loss": "8.180e-01", "dlm_acc": "5.416e-01", "anc_acc": "5.434e-01", "epoch": 0.00873} {"step": 4370, "loss": 1.5049, "grad_norm": "2.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.184e+00", "dlm_acc": "4.927e-01", "anc_acc": "4.879e-01", "epoch": 0.00874} {"step": 4375, "loss": 1.4021, "grad_norm": "4.758e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.434e+00", "dlm_acc": "4.890e-01", "anc_acc": "4.827e-01", "epoch": 0.00875} {"step": 4380, "loss": 1.2975, "grad_norm": "3.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.437e-01", "anc_loss": "9.672e-01", "dlm_acc": "5.552e-01", "anc_acc": "5.517e-01", "epoch": 0.00876} {"step": 4385, "loss": 1.2831, "grad_norm": "3.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.699e-01", "anc_loss": "5.777e-01", "dlm_acc": "5.440e-01", "anc_acc": "5.393e-01", "epoch": 0.00877} {"step": 4390, "loss": 0.9456, "grad_norm": "2.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.332e-01", "anc_loss": "6.539e-01", "dlm_acc": "5.663e-01", "anc_acc": "5.599e-01", "epoch": 0.00878} {"step": 4395, "loss": 0.956, "grad_norm": "1.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.114e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.365e-01", "epoch": 0.00879} {"step": 4400, "loss": 1.1748, "grad_norm": "3.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.539e-01", "anc_loss": "9.934e-01", "dlm_acc": "6.155e-01", "anc_acc": "6.102e-01", "epoch": 0.0088} {"step": 4405, "loss": 1.3464, "grad_norm": "5.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.118e+00", "anc_loss": "1.159e+00", "dlm_acc": "5.938e-01", "anc_acc": "5.913e-01", "epoch": 0.00881} {"step": 4410, "loss": 0.9979, "grad_norm": "4.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.461e-01", "anc_loss": "8.906e-01", "dlm_acc": "6.765e-01", "anc_acc": "6.665e-01", "epoch": 0.00882} {"step": 4415, "loss": 1.1454, "grad_norm": "2.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.267e-01", "anc_loss": "8.635e-01", "dlm_acc": "6.461e-01", "anc_acc": "6.396e-01", "epoch": 0.00883} {"step": 4420, "loss": 1.5808, "grad_norm": "7.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.506e+00", "anc_loss": "1.558e+00", "dlm_acc": "4.787e-01", "anc_acc": "4.718e-01", "epoch": 0.00884} {"step": 4425, "loss": 1.1188, "grad_norm": "4.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.672e-01", "anc_loss": "8.828e-01", "dlm_acc": "5.208e-01", "anc_acc": "5.184e-01", "epoch": 0.00885} {"step": 4430, "loss": 0.9685, "grad_norm": "3.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.266e-01", "anc_loss": "8.430e-01", "dlm_acc": "5.389e-01", "anc_acc": "5.347e-01", "epoch": 0.00886} {"step": 4435, "loss": 1.6733, "grad_norm": "4.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.373e-01", "anc_acc": "5.283e-01", "epoch": 0.00887} {"step": 4440, "loss": 1.7087, "grad_norm": "8.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.758e-01", "anc_loss": "6.895e-01", "dlm_acc": "6.483e-01", "anc_acc": "6.446e-01", "epoch": 0.00888} {"step": 4445, "loss": 1.3232, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.500e-01", "anc_loss": "6.562e-01", "dlm_acc": "5.265e-01", "anc_acc": "5.248e-01", "epoch": 0.00889} {"step": 4450, "loss": 1.522, "grad_norm": "5.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.041e+00", "anc_loss": "1.070e+00", "dlm_acc": "5.144e-01", "anc_acc": "5.082e-01", "epoch": 0.0089} {"step": 4455, "loss": 1.5873, "grad_norm": "4.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.801e-01", "anc_loss": "1.023e+00", "dlm_acc": "6.126e-01", "anc_acc": "6.071e-01", "epoch": 0.00891} {"step": 4460, "loss": 1.2479, "grad_norm": "1.268e+00", "learning_rate": "1.000e-04", "dlm_loss": "5.430e-01", "anc_loss": "5.531e-01", "dlm_acc": "6.216e-01", "anc_acc": "6.148e-01", "epoch": 0.00892} {"step": 4465, "loss": 1.6955, "grad_norm": "9.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.039e+00", "dlm_acc": "6.091e-01", "anc_acc": "6.019e-01", "epoch": 0.00893} {"step": 4470, "loss": 1.4615, "grad_norm": "5.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.125e+00", "dlm_acc": "5.524e-01", "anc_acc": "5.471e-01", "epoch": 0.00894} {"step": 4475, "loss": 1.3779, "grad_norm": "5.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.141e-01", "anc_loss": "8.504e-01", "dlm_acc": "6.472e-01", "anc_acc": "6.399e-01", "epoch": 0.00895} {"step": 4480, "loss": 1.3041, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.418e-01", "anc_loss": "7.586e-01", "dlm_acc": "5.854e-01", "anc_acc": "5.783e-01", "epoch": 0.00896} {"step": 4485, "loss": 1.3987, "grad_norm": "3.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.154e+00", "dlm_acc": "5.705e-01", "anc_acc": "5.615e-01", "epoch": 0.00897} {"step": 4490, "loss": 1.1213, "grad_norm": "3.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.555e-01", "anc_loss": "9.938e-01", "dlm_acc": "5.403e-01", "anc_acc": "5.325e-01", "epoch": 0.00898} {"step": 4495, "loss": 1.4774, "grad_norm": "5.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.440e-01", "anc_acc": "5.336e-01", "epoch": 0.00899} {"step": 4500, "loss": 1.2177, "grad_norm": "5.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.563e-01", "anc_loss": "9.848e-01", "dlm_acc": "5.019e-01", "anc_acc": "4.963e-01", "epoch": 0.009} {"step": 4505, "loss": 1.2294, "grad_norm": "3.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.085e+00", "dlm_acc": "6.007e-01", "anc_acc": "5.882e-01", "epoch": 0.00901} {"step": 4510, "loss": 1.2875, "grad_norm": "5.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.964e+00", "anc_loss": "2.009e+00", "dlm_acc": "3.231e-01", "anc_acc": "3.176e-01", "epoch": 0.00902} {"step": 4515, "loss": 1.3641, "grad_norm": "2.291e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.205e+00", "anc_loss": "2.243e+00", "dlm_acc": "2.467e-01", "anc_acc": "2.412e-01", "epoch": 0.00903} {"step": 4520, "loss": 1.0765, "grad_norm": "2.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.450e-01", "anc_acc": "5.362e-01", "epoch": 0.00904} {"step": 4525, "loss": 1.1595, "grad_norm": "4.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.142e+00", "dlm_acc": "5.991e-01", "anc_acc": "5.898e-01", "epoch": 0.00905} {"step": 4530, "loss": 1.1521, "grad_norm": "6.390e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.565e+00", "dlm_acc": "5.006e-01", "anc_acc": "4.894e-01", "epoch": 0.00906} {"step": 4535, "loss": 1.4286, "grad_norm": "4.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.562e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.227e-01", "epoch": 0.00907} {"step": 4540, "loss": 1.308, "grad_norm": "4.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.328e-01", "anc_acc": "5.226e-01", "epoch": 0.00908} {"step": 4545, "loss": 1.3238, "grad_norm": "4.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.620e+00", "dlm_acc": "5.498e-01", "anc_acc": "5.390e-01", "epoch": 0.00909} {"step": 4550, "loss": 0.7404, "grad_norm": "4.572e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.047e+00", "anc_loss": "1.104e+00", "dlm_acc": "6.241e-01", "anc_acc": "6.130e-01", "epoch": 0.0091} {"step": 4555, "loss": 1.5262, "grad_norm": "8.588e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.725e+00", "anc_loss": "1.789e+00", "dlm_acc": "4.814e-01", "anc_acc": "4.720e-01", "epoch": 0.00911} {"step": 4560, "loss": 1.1641, "grad_norm": "6.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.592e+00", "dlm_acc": "4.471e-01", "anc_acc": "4.363e-01", "epoch": 0.00912} {"step": 4565, "loss": 1.0663, "grad_norm": "4.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.066e-01", "anc_acc": "4.957e-01", "epoch": 0.00913} {"step": 4570, "loss": 1.3708, "grad_norm": "4.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.683e+00", "anc_loss": "1.752e+00", "dlm_acc": "4.824e-01", "anc_acc": "4.713e-01", "epoch": 0.00914} {"step": 4575, "loss": 1.1085, "grad_norm": "7.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.683e+00", "dlm_acc": "4.853e-01", "anc_acc": "4.755e-01", "epoch": 0.00915} {"step": 4580, "loss": 0.991, "grad_norm": "4.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.784e+00", "anc_loss": "1.852e+00", "dlm_acc": "5.003e-01", "anc_acc": "4.918e-01", "epoch": 0.00916} {"step": 4585, "loss": 0.6159, "grad_norm": "1.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.340e+00", "dlm_acc": "5.417e-01", "anc_acc": "5.309e-01", "epoch": 0.00917} {"step": 4590, "loss": 0.6306, "grad_norm": "2.110e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.250e+00", "dlm_acc": "5.753e-01", "anc_acc": "5.644e-01", "epoch": 0.00918} {"step": 4595, "loss": 1.0734, "grad_norm": "3.987e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.634e+00", "anc_loss": "1.707e+00", "dlm_acc": "4.860e-01", "anc_acc": "4.757e-01", "epoch": 0.00919} {"step": 4600, "loss": 0.9167, "grad_norm": "3.481e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.412e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.633e-01", "anc_acc": "5.542e-01", "epoch": 0.0092} {"step": 4605, "loss": 0.7077, "grad_norm": "3.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.432e+00", "dlm_acc": "5.392e-01", "anc_acc": "5.276e-01", "epoch": 0.00921} {"step": 4610, "loss": 0.7226, "grad_norm": "2.237e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.265e+00", "dlm_acc": "5.833e-01", "anc_acc": "5.742e-01", "epoch": 0.00922} {"step": 4615, "loss": 1.374, "grad_norm": "4.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.098e-01", "anc_acc": "4.997e-01", "epoch": 0.00923} {"step": 4620, "loss": 1.169, "grad_norm": "5.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.573e-01", "epoch": 0.00924} {"step": 4625, "loss": 1.1078, "grad_norm": "3.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e+00", "anc_loss": "1.686e+00", "dlm_acc": "4.968e-01", "anc_acc": "4.863e-01", "epoch": 0.00925} {"step": 4630, "loss": 0.8955, "grad_norm": "3.997e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.193e+00", "dlm_acc": "6.032e-01", "anc_acc": "5.919e-01", "epoch": 0.00926} {"step": 4635, "loss": 0.9426, "grad_norm": "4.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.505e+00", "dlm_acc": "5.238e-01", "anc_acc": "5.142e-01", "epoch": 0.00927} {"step": 4640, "loss": 1.1765, "grad_norm": "3.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.423e-01", "anc_acc": "5.312e-01", "epoch": 0.00928} {"step": 4645, "loss": 1.3043, "grad_norm": "2.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.442e+00", "anc_loss": "1.497e+00", "dlm_acc": "4.637e-01", "anc_acc": "4.552e-01", "epoch": 0.00929} {"step": 4650, "loss": 1.0328, "grad_norm": "3.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.135e+00", "dlm_acc": "5.672e-01", "anc_acc": "5.594e-01", "epoch": 0.0093} {"step": 4655, "loss": 1.3669, "grad_norm": "5.450e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.738e+00", "anc_loss": "1.795e+00", "dlm_acc": "4.448e-01", "anc_acc": "4.355e-01", "epoch": 0.00931} {"step": 4660, "loss": 1.3682, "grad_norm": "5.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.522e+00", "anc_loss": "1.583e+00", "dlm_acc": "4.865e-01", "anc_acc": "4.789e-01", "epoch": 0.00932} {"step": 4665, "loss": 0.799, "grad_norm": "6.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.057e+00", "dlm_acc": "6.055e-01", "anc_acc": "5.945e-01", "epoch": 0.00933} {"step": 4670, "loss": 1.6368, "grad_norm": "6.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.410e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.501e-01", "epoch": 0.00934} {"step": 4675, "loss": 0.9638, "grad_norm": "3.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.133e+00", "dlm_acc": "5.764e-01", "anc_acc": "5.687e-01", "epoch": 0.00935} {"step": 4680, "loss": 1.2416, "grad_norm": "3.494e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.695e+00", "anc_loss": "1.769e+00", "dlm_acc": "4.656e-01", "anc_acc": "4.551e-01", "epoch": 0.00936} {"step": 4685, "loss": 1.0566, "grad_norm": "4.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.623e+00", "dlm_acc": "4.867e-01", "anc_acc": "4.776e-01", "epoch": 0.00937} {"step": 4690, "loss": 0.9369, "grad_norm": "5.341e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.269e+00", "anc_loss": "1.329e+00", "dlm_acc": "5.503e-01", "anc_acc": "5.403e-01", "epoch": 0.00938} {"step": 4695, "loss": 1.2053, "grad_norm": "3.146e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.323e+00", "dlm_acc": "5.085e-01", "anc_acc": "4.987e-01", "epoch": 0.00939} {"step": 4700, "loss": 1.1766, "grad_norm": "2.531e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.260e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.510e-01", "anc_acc": "5.412e-01", "epoch": 0.0094} {"step": 4705, "loss": 1.0871, "grad_norm": "3.487e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.576e+00", "dlm_acc": "4.980e-01", "anc_acc": "4.883e-01", "epoch": 0.00941} {"step": 4710, "loss": 1.0095, "grad_norm": "2.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.049e+00", "anc_loss": "1.100e+00", "dlm_acc": "6.171e-01", "anc_acc": "6.075e-01", "epoch": 0.00942} {"step": 4715, "loss": 1.0948, "grad_norm": "3.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.622e+00", "dlm_acc": "4.775e-01", "anc_acc": "4.673e-01", "epoch": 0.00943} {"step": 4720, "loss": 0.8801, "grad_norm": "2.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.585e-01", "anc_loss": "3.740e-01", "dlm_acc": "8.732e-01", "anc_acc": "8.702e-01", "epoch": 0.00944} {"step": 4725, "loss": 1.6283, "grad_norm": "3.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.972e+00", "anc_loss": "2.033e+00", "dlm_acc": "4.218e-01", "anc_acc": "4.130e-01", "epoch": 0.00945} {"step": 4730, "loss": 1.6447, "grad_norm": "4.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.878e+00", "anc_loss": "1.945e+00", "dlm_acc": "3.870e-01", "anc_acc": "3.760e-01", "epoch": 0.00946} {"step": 4735, "loss": 1.4107, "grad_norm": "4.361e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.387e+00", "dlm_acc": "3.757e-01", "anc_acc": "3.716e-01", "epoch": 0.00947} {"step": 4740, "loss": 1.1181, "grad_norm": "6.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.561e-01", "anc_acc": "5.442e-01", "epoch": 0.00948} {"step": 4745, "loss": 1.2022, "grad_norm": "2.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.980e-01", "anc_loss": "5.273e-01", "dlm_acc": "7.141e-01", "anc_acc": "7.102e-01", "epoch": 0.00949} {"step": 4750, "loss": 1.2229, "grad_norm": "4.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.379e-01", "anc_loss": "9.574e-01", "dlm_acc": "4.847e-01", "anc_acc": "4.828e-01", "epoch": 0.0095} {"step": 4755, "loss": 1.1862, "grad_norm": "3.390e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.187e+00", "dlm_acc": "5.519e-01", "anc_acc": "5.429e-01", "epoch": 0.00951} {"step": 4760, "loss": 0.9133, "grad_norm": "5.842e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.146e+00", "dlm_acc": "5.645e-01", "anc_acc": "5.552e-01", "epoch": 0.00952} {"step": 4765, "loss": 1.4159, "grad_norm": "4.070e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.445e+00", "anc_loss": "1.508e+00", "dlm_acc": "5.050e-01", "anc_acc": "4.927e-01", "epoch": 0.00953} {"step": 4770, "loss": 1.0675, "grad_norm": "3.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.453e+00", "anc_loss": "1.505e+00", "dlm_acc": "4.785e-01", "anc_acc": "4.702e-01", "epoch": 0.00954} {"step": 4775, "loss": 1.5878, "grad_norm": "3.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.802e+00", "anc_loss": "1.870e+00", "dlm_acc": "4.724e-01", "anc_acc": "4.648e-01", "epoch": 0.00955} {"step": 4780, "loss": 1.3412, "grad_norm": "3.979e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.561e+00", "dlm_acc": "5.073e-01", "anc_acc": "4.987e-01", "epoch": 0.00956} {"step": 4785, "loss": 1.741, "grad_norm": "5.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.511e+00", "anc_loss": "1.573e+00", "dlm_acc": "5.225e-01", "anc_acc": "5.125e-01", "epoch": 0.00957} {"step": 4790, "loss": 1.2381, "grad_norm": "3.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.020e+00", "anc_loss": "1.064e+00", "dlm_acc": "6.059e-01", "anc_acc": "5.977e-01", "epoch": 0.00958} {"step": 4795, "loss": 1.4114, "grad_norm": "2.653e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.379e+00", "dlm_acc": "5.539e-01", "anc_acc": "5.454e-01", "epoch": 0.00959} {"step": 4800, "loss": 1.8589, "grad_norm": "6.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.788e+00", "anc_loss": "2.830e+00", "dlm_acc": "1.280e-01", "anc_acc": "1.246e-01", "epoch": 0.0096} {"step": 4805, "loss": 1.4246, "grad_norm": "4.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.579e+00", "anc_loss": "1.655e+00", "dlm_acc": "4.784e-01", "anc_acc": "4.646e-01", "epoch": 0.00961} {"step": 4810, "loss": 1.232, "grad_norm": "3.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.262e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.504e-01", "anc_acc": "5.358e-01", "epoch": 0.00962} {"step": 4815, "loss": 1.0298, "grad_norm": "2.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.686e-01", "anc_loss": "8.971e-01", "dlm_acc": "6.212e-01", "anc_acc": "6.147e-01", "epoch": 0.00963} {"step": 4820, "loss": 1.349, "grad_norm": "5.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.748e+00", "anc_loss": "1.794e+00", "dlm_acc": "3.453e-01", "anc_acc": "3.350e-01", "epoch": 0.00964} {"step": 4825, "loss": 1.2754, "grad_norm": "4.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.555e+00", "dlm_acc": "4.553e-01", "anc_acc": "4.463e-01", "epoch": 0.00965} {"step": 4830, "loss": 1.3594, "grad_norm": "3.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.656e-01", "anc_loss": "9.164e-01", "dlm_acc": "6.287e-01", "anc_acc": "6.161e-01", "epoch": 0.00966} {"step": 4835, "loss": 1.5635, "grad_norm": "3.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.462e+00", "dlm_acc": "4.898e-01", "anc_acc": "4.837e-01", "epoch": 0.00967} {"step": 4840, "loss": 1.0296, "grad_norm": "2.462e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.413e-01", "epoch": 0.00968} {"step": 4845, "loss": 1.1465, "grad_norm": "7.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.066e-01", "anc_acc": "4.982e-01", "epoch": 0.00969} {"step": 4850, "loss": 1.7561, "grad_norm": "3.717e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.491e+00", "anc_loss": "2.517e+00", "dlm_acc": "1.995e-01", "anc_acc": "1.985e-01", "epoch": 0.0097} {"step": 4855, "loss": 1.3388, "grad_norm": "2.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.405e+00", "anc_loss": "2.431e+00", "dlm_acc": "1.284e-01", "anc_acc": "1.259e-01", "epoch": 0.00971} {"step": 4860, "loss": 1.253, "grad_norm": "2.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.386e-01", "anc_acc": "5.299e-01", "epoch": 0.00972} {"step": 4865, "loss": 1.3849, "grad_norm": "6.236e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.188e-01", "anc_acc": "5.100e-01", "epoch": 0.00973} {"step": 4870, "loss": 1.4591, "grad_norm": "5.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.531e-01", "anc_loss": "9.898e-01", "dlm_acc": "6.010e-01", "anc_acc": "5.981e-01", "epoch": 0.00974} {"step": 4875, "loss": 1.4079, "grad_norm": "5.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.554e+00", "dlm_acc": "4.449e-01", "anc_acc": "4.368e-01", "epoch": 0.00975} {"step": 4880, "loss": 1.5265, "grad_norm": "3.186e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.551e+00", "dlm_acc": "4.910e-01", "anc_acc": "4.788e-01", "epoch": 0.00976} {"step": 4885, "loss": 1.5435, "grad_norm": "4.172e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.528e+00", "anc_loss": "1.586e+00", "dlm_acc": "4.647e-01", "anc_acc": "4.560e-01", "epoch": 0.00977} {"step": 4890, "loss": 1.579, "grad_norm": "4.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.299e+00", "dlm_acc": "4.788e-01", "anc_acc": "4.721e-01", "epoch": 0.00978} {"step": 4895, "loss": 1.5556, "grad_norm": "3.256e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.369e+00", "dlm_acc": "6.225e-01", "anc_acc": "6.147e-01", "epoch": 0.00979} {"step": 4900, "loss": 1.1622, "grad_norm": "2.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.093e+00", "dlm_acc": "6.821e-01", "anc_acc": "6.780e-01", "epoch": 0.0098} {"step": 4905, "loss": 1.2394, "grad_norm": "4.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.086e-01", "anc_acc": "4.999e-01", "epoch": 0.00981} {"step": 4910, "loss": 1.1648, "grad_norm": "2.977e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.454e-01", "anc_acc": "5.342e-01", "epoch": 0.00982} {"step": 4915, "loss": 1.5006, "grad_norm": "6.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.103e-01", "anc_acc": "5.007e-01", "epoch": 0.00983} {"step": 4920, "loss": 1.4261, "grad_norm": "2.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.432e-01", "anc_acc": "5.335e-01", "epoch": 0.00984} {"step": 4925, "loss": 1.6195, "grad_norm": "3.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.520e+00", "anc_loss": "1.571e+00", "dlm_acc": "4.777e-01", "anc_acc": "4.701e-01", "epoch": 0.00985} {"step": 4930, "loss": 1.2484, "grad_norm": "4.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.516e-01", "anc_loss": "9.531e-01", "dlm_acc": "3.053e-01", "anc_acc": "3.053e-01", "epoch": 0.00986} {"step": 4935, "loss": 1.3251, "grad_norm": "3.815e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.406e-01", "anc_loss": "8.406e-01", "dlm_acc": "3.187e-01", "anc_acc": "3.170e-01", "epoch": 0.00987} {"step": 4940, "loss": 1.5825, "grad_norm": "3.444e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.047e-01", "anc_loss": "9.047e-01", "dlm_acc": "3.104e-01", "anc_acc": "3.086e-01", "epoch": 0.00988} {"step": 4945, "loss": 1.7393, "grad_norm": "3.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.500e-01", "anc_loss": "9.508e-01", "dlm_acc": "3.140e-01", "anc_acc": "3.128e-01", "epoch": 0.00989} {"step": 4950, "loss": 1.4864, "grad_norm": "3.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.299e+00", "anc_loss": "1.354e+00", "dlm_acc": "4.825e-01", "anc_acc": "4.737e-01", "epoch": 0.0099} {"step": 4955, "loss": 1.6374, "grad_norm": "4.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.814e+00", "anc_loss": "1.884e+00", "dlm_acc": "4.533e-01", "anc_acc": "4.438e-01", "epoch": 0.00991} {"step": 4960, "loss": 1.3959, "grad_norm": "3.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.664e-01", "anc_loss": "8.156e-01", "dlm_acc": "5.818e-01", "anc_acc": "5.725e-01", "epoch": 0.00992} {"step": 4965, "loss": 1.5128, "grad_norm": "5.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.312e-01", "anc_loss": "7.711e-01", "dlm_acc": "5.913e-01", "anc_acc": "5.809e-01", "epoch": 0.00993} {"step": 4970, "loss": 1.3534, "grad_norm": "3.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.531e-01", "anc_loss": "6.863e-01", "dlm_acc": "6.164e-01", "anc_acc": "6.090e-01", "epoch": 0.00994} {"step": 4975, "loss": 1.7396, "grad_norm": "4.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.609e+00", "anc_loss": "1.672e+00", "dlm_acc": "4.884e-01", "anc_acc": "4.785e-01", "epoch": 0.00995} {"step": 4980, "loss": 1.1174, "grad_norm": "4.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.279e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.134e-01", "anc_acc": "5.020e-01", "epoch": 0.00996} {"step": 4985, "loss": 1.5819, "grad_norm": "7.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.519e+00", "dlm_acc": "4.758e-01", "anc_acc": "4.686e-01", "epoch": 0.00997} {"step": 4990, "loss": 1.455, "grad_norm": "2.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.467e+00", "dlm_acc": "5.128e-01", "anc_acc": "5.021e-01", "epoch": 0.00998} {"step": 4995, "loss": 1.5606, "grad_norm": "4.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.562e+00", "dlm_acc": "4.900e-01", "anc_acc": "4.780e-01", "epoch": 0.00999} {"step": 5000, "loss": 1.7051, "grad_norm": "2.759e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.819e+00", "anc_loss": "1.891e+00", "dlm_acc": "4.425e-01", "anc_acc": "4.317e-01", "epoch": 0.01} {"step": 5005, "loss": 1.0589, "grad_norm": "1.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.144e+00", "dlm_acc": "5.428e-01", "anc_acc": "5.347e-01", "epoch": 0.01001} {"step": 5010, "loss": 1.5486, "grad_norm": "3.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.268e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.712e-01", "anc_acc": "5.645e-01", "epoch": 0.01002} {"step": 5015, "loss": 1.4538, "grad_norm": "2.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.425e-01", "anc_acc": "5.349e-01", "epoch": 0.01003} {"step": 5020, "loss": 1.5352, "grad_norm": "6.734e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.146e+00", "dlm_acc": "6.204e-01", "anc_acc": "6.139e-01", "epoch": 0.01004} {"step": 5025, "loss": 1.6878, "grad_norm": "4.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.098e+00", "anc_loss": "2.202e+00", "dlm_acc": "3.821e-01", "anc_acc": "3.759e-01", "epoch": 0.01005} {"step": 5030, "loss": 1.5519, "grad_norm": "3.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.393e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.458e-01", "anc_acc": "5.358e-01", "epoch": 0.01006} {"step": 5035, "loss": 1.1403, "grad_norm": "5.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.719e-01", "anc_loss": "1.033e+00", "dlm_acc": "5.838e-01", "anc_acc": "5.663e-01", "epoch": 0.01007} {"step": 5040, "loss": 1.4257, "grad_norm": "3.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.243e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.000e-01", "anc_acc": "4.941e-01", "epoch": 0.01008} {"step": 5045, "loss": 1.0888, "grad_norm": "3.883e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.054e+00", "anc_loss": "1.109e+00", "dlm_acc": "5.686e-01", "anc_acc": "5.564e-01", "epoch": 0.01009} {"step": 5050, "loss": 1.8515, "grad_norm": "5.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.756e+00", "anc_loss": "1.831e+00", "dlm_acc": "4.677e-01", "anc_acc": "4.578e-01", "epoch": 0.0101} {"step": 5055, "loss": 1.6648, "grad_norm": "4.707e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.789e+00", "anc_loss": "1.844e+00", "dlm_acc": "3.391e-01", "anc_acc": "3.320e-01", "epoch": 0.01011} {"step": 5060, "loss": 1.7367, "grad_norm": "4.874e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.175e+00", "dlm_acc": "5.753e-01", "anc_acc": "5.692e-01", "epoch": 0.01012} {"step": 5065, "loss": 1.8407, "grad_norm": "4.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.630e+00", "anc_loss": "1.675e+00", "dlm_acc": "4.683e-01", "anc_acc": "4.626e-01", "epoch": 0.01013} {"step": 5070, "loss": 0.988, "grad_norm": "3.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.797e-01", "anc_loss": "9.227e-01", "dlm_acc": "5.957e-01", "anc_acc": "5.855e-01", "epoch": 0.01014} {"step": 5075, "loss": 1.1266, "grad_norm": "3.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.707e-01", "anc_loss": "9.969e-01", "dlm_acc": "5.212e-01", "anc_acc": "5.149e-01", "epoch": 0.01015} {"step": 5080, "loss": 1.0799, "grad_norm": "4.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.116e+00", "dlm_acc": "5.895e-01", "anc_acc": "5.806e-01", "epoch": 0.01016} {"step": 5085, "loss": 1.148, "grad_norm": "4.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.879e-01", "anc_loss": "8.258e-01", "dlm_acc": "6.720e-01", "anc_acc": "6.635e-01", "epoch": 0.01017} {"step": 5090, "loss": 0.9095, "grad_norm": "2.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.307e+00", "dlm_acc": "4.900e-01", "anc_acc": "4.790e-01", "epoch": 0.01018} {"step": 5095, "loss": 1.5574, "grad_norm": "9.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.695e+00", "anc_loss": "1.758e+00", "dlm_acc": "4.165e-01", "anc_acc": "4.092e-01", "epoch": 0.01019} {"step": 5100, "loss": 1.1628, "grad_norm": "1.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.214e+00", "dlm_acc": "6.236e-01", "anc_acc": "6.158e-01", "epoch": 0.0102} {"step": 5105, "loss": 0.675, "grad_norm": "2.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.148e-01", "anc_loss": "8.352e-01", "dlm_acc": "4.617e-01", "anc_acc": "4.567e-01", "epoch": 0.01021} {"step": 5110, "loss": 1.2629, "grad_norm": "3.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.367e-01", "anc_loss": "9.469e-01", "dlm_acc": "3.619e-01", "anc_acc": "3.570e-01", "epoch": 0.01022} {"step": 5115, "loss": 1.3627, "grad_norm": "5.053e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.496e-01", "anc_acc": "5.424e-01", "epoch": 0.01023} {"step": 5120, "loss": 1.035, "grad_norm": "3.791e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.736e-01", "anc_loss": "3.896e-01", "dlm_acc": "7.590e-01", "anc_acc": "7.534e-01", "epoch": 0.01024} {"step": 5125, "loss": 1.1971, "grad_norm": "3.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.194e+00", "dlm_acc": "5.940e-01", "anc_acc": "5.859e-01", "epoch": 0.01025} {"step": 5130, "loss": 1.365, "grad_norm": "5.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.272e+00", "dlm_acc": "5.996e-01", "anc_acc": "5.917e-01", "epoch": 0.01026} {"step": 5135, "loss": 1.2957, "grad_norm": "5.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.368e+00", "anc_loss": "1.428e+00", "dlm_acc": "4.999e-01", "anc_acc": "4.871e-01", "epoch": 0.01027} {"step": 5140, "loss": 1.0809, "grad_norm": "3.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.457e+00", "dlm_acc": "5.014e-01", "anc_acc": "4.883e-01", "epoch": 0.01028} {"step": 5145, "loss": 1.1058, "grad_norm": "3.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.523e+00", "dlm_acc": "4.968e-01", "anc_acc": "4.838e-01", "epoch": 0.01029} {"step": 5150, "loss": 1.4759, "grad_norm": "3.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.244e+00", "anc_loss": "2.283e+00", "dlm_acc": "2.992e-01", "anc_acc": "2.918e-01", "epoch": 0.0103} {"step": 5155, "loss": 1.2053, "grad_norm": "3.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.083e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.438e-01", "anc_acc": "5.349e-01", "epoch": 0.01031} {"step": 5160, "loss": 1.7296, "grad_norm": "5.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.472e+00", "anc_loss": "1.522e+00", "dlm_acc": "4.686e-01", "anc_acc": "4.603e-01", "epoch": 0.01032} {"step": 5165, "loss": 1.1546, "grad_norm": "3.095e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.058e-01", "anc_acc": "4.953e-01", "epoch": 0.01033} {"step": 5170, "loss": 1.4177, "grad_norm": "3.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.171e-01", "anc_acc": "5.092e-01", "epoch": 0.01034} {"step": 5175, "loss": 1.3049, "grad_norm": "3.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.431e+00", "anc_loss": "1.486e+00", "dlm_acc": "4.934e-01", "anc_acc": "4.834e-01", "epoch": 0.01035} {"step": 5180, "loss": 1.3311, "grad_norm": "3.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.083e+00", "dlm_acc": "6.024e-01", "anc_acc": "5.924e-01", "epoch": 0.01036} {"step": 5185, "loss": 1.3285, "grad_norm": "5.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.088e-01", "anc_acc": "4.948e-01", "epoch": 0.01037} {"step": 5190, "loss": 1.1838, "grad_norm": "6.979e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.115e+00", "anc_loss": "1.177e+00", "dlm_acc": "5.616e-01", "anc_acc": "5.500e-01", "epoch": 0.01038} {"step": 5195, "loss": 1.4446, "grad_norm": "3.510e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.273e-01", "anc_acc": "6.208e-01", "epoch": 0.01039} {"step": 5200, "loss": 1.7253, "grad_norm": "3.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.659e+00", "anc_loss": "1.713e+00", "dlm_acc": "5.098e-01", "anc_acc": "5.002e-01", "epoch": 0.0104} {"step": 5205, "loss": 0.9432, "grad_norm": "4.469e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.280e-02", "anc_loss": "7.732e-02", "dlm_acc": "9.452e-01", "anc_acc": "9.439e-01", "epoch": 0.01041} {"step": 5210, "loss": 1.1999, "grad_norm": "3.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.155e+00", "dlm_acc": "5.815e-01", "anc_acc": "5.765e-01", "epoch": 0.01042} {"step": 5215, "loss": 1.1191, "grad_norm": "2.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.419e+00", "dlm_acc": "4.891e-01", "anc_acc": "4.795e-01", "epoch": 0.01043} {"step": 5220, "loss": 1.5082, "grad_norm": "5.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.652e+00", "anc_loss": "1.708e+00", "dlm_acc": "4.364e-01", "anc_acc": "4.222e-01", "epoch": 0.01044} {"step": 5225, "loss": 1.7377, "grad_norm": "4.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.998e+00", "anc_loss": "2.053e+00", "dlm_acc": "3.632e-01", "anc_acc": "3.548e-01", "epoch": 0.01045} {"step": 5230, "loss": 0.8944, "grad_norm": "4.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.223e-01", "anc_loss": "9.391e-01", "dlm_acc": "4.315e-01", "anc_acc": "4.269e-01", "epoch": 0.01046} {"step": 5235, "loss": 1.1001, "grad_norm": "2.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.828e-01", "anc_loss": "7.937e-01", "dlm_acc": "3.654e-01", "anc_acc": "3.621e-01", "epoch": 0.01047} {"step": 5240, "loss": 1.1648, "grad_norm": "3.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.719e-01", "anc_loss": "8.844e-01", "dlm_acc": "3.601e-01", "anc_acc": "3.559e-01", "epoch": 0.01048} {"step": 5245, "loss": 1.1411, "grad_norm": "1.021e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.141e+00", "dlm_acc": "5.032e-01", "anc_acc": "4.956e-01", "epoch": 0.01049} {"step": 5250, "loss": 1.2041, "grad_norm": "5.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.278e+00", "anc_loss": "1.350e+00", "dlm_acc": "4.936e-01", "anc_acc": "4.788e-01", "epoch": 0.0105} {"step": 5255, "loss": 0.9545, "grad_norm": "1.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.016e-01", "anc_loss": "9.516e-01", "dlm_acc": "6.345e-01", "anc_acc": "6.227e-01", "epoch": 0.01051} {"step": 5260, "loss": 1.742, "grad_norm": "8.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.559e+00", "anc_loss": "1.617e+00", "dlm_acc": "4.713e-01", "anc_acc": "4.615e-01", "epoch": 0.01052} {"step": 5265, "loss": 1.3467, "grad_norm": "4.547e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.544e+00", "anc_loss": "1.624e+00", "dlm_acc": "4.952e-01", "anc_acc": "4.863e-01", "epoch": 0.01053} {"step": 5270, "loss": 1.3455, "grad_norm": "1.207e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.486e+00", "anc_loss": "1.556e+00", "dlm_acc": "4.663e-01", "anc_acc": "4.508e-01", "epoch": 0.01054} {"step": 5275, "loss": 1.3572, "grad_norm": "5.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.382e-01", "anc_acc": "5.321e-01", "epoch": 0.01055} {"step": 5280, "loss": 1.3867, "grad_norm": "5.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.536e+00", "anc_loss": "1.605e+00", "dlm_acc": "4.592e-01", "anc_acc": "4.490e-01", "epoch": 0.01056} {"step": 5285, "loss": 1.227, "grad_norm": "1.529e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.214e+00", "dlm_acc": "4.139e-01", "anc_acc": "4.099e-01", "epoch": 0.01057} {"step": 5290, "loss": 1.3882, "grad_norm": "7.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.801e-01", "anc_loss": "4.918e-01", "dlm_acc": "7.033e-01", "anc_acc": "6.973e-01", "epoch": 0.01058} {"step": 5295, "loss": 1.25, "grad_norm": "6.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.809e-01", "anc_loss": "4.930e-01", "dlm_acc": "6.942e-01", "anc_acc": "6.878e-01", "epoch": 0.01059} {"step": 5300, "loss": 1.0673, "grad_norm": "6.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.328e-01", "anc_loss": "8.887e-01", "dlm_acc": "6.646e-01", "anc_acc": "6.541e-01", "epoch": 0.0106} {"step": 5305, "loss": 1.1129, "grad_norm": "5.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.153e-01", "anc_acc": "5.078e-01", "epoch": 0.01061} {"step": 5310, "loss": 0.916, "grad_norm": "5.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.191e+00", "dlm_acc": "6.038e-01", "anc_acc": "5.945e-01", "epoch": 0.01062} {"step": 5315, "loss": 1.0975, "grad_norm": "4.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.977e-01", "anc_loss": "9.531e-01", "dlm_acc": "6.870e-01", "anc_acc": "6.777e-01", "epoch": 0.01063} {"step": 5320, "loss": 1.2831, "grad_norm": "4.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.525e+00", "dlm_acc": "4.969e-01", "anc_acc": "4.835e-01", "epoch": 0.01064} {"step": 5325, "loss": 1.641, "grad_norm": "4.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.396e+00", "dlm_acc": "4.682e-01", "anc_acc": "4.643e-01", "epoch": 0.01065} {"step": 5330, "loss": 1.2438, "grad_norm": "4.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.938e-01", "anc_loss": "6.090e-01", "dlm_acc": "5.919e-01", "anc_acc": "5.868e-01", "epoch": 0.01066} {"step": 5335, "loss": 1.4777, "grad_norm": "4.581e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.136e+00", "dlm_acc": "5.187e-01", "anc_acc": "5.142e-01", "epoch": 0.01067} {"step": 5340, "loss": 1.624, "grad_norm": "4.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.372e+00", "anc_loss": "1.425e+00", "dlm_acc": "5.155e-01", "anc_acc": "5.085e-01", "epoch": 0.01068} {"step": 5345, "loss": 1.2155, "grad_norm": "3.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.366e+00", "dlm_acc": "4.762e-01", "anc_acc": "4.655e-01", "epoch": 0.01069} {"step": 5350, "loss": 1.7044, "grad_norm": "4.418e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.136e+00", "anc_loss": "2.177e+00", "dlm_acc": "3.244e-01", "anc_acc": "3.193e-01", "epoch": 0.0107} {"step": 5355, "loss": 1.3319, "grad_norm": "5.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.758e-01", "anc_loss": "9.195e-01", "dlm_acc": "6.035e-01", "anc_acc": "5.945e-01", "epoch": 0.01071} {"step": 5360, "loss": 1.5845, "grad_norm": "8.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.682e-01", "anc_loss": "1.007e+00", "dlm_acc": "6.425e-01", "anc_acc": "6.335e-01", "epoch": 0.01072} {"step": 5365, "loss": 1.5585, "grad_norm": "7.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.180e-01", "anc_loss": "5.668e-01", "dlm_acc": "7.620e-01", "anc_acc": "7.499e-01", "epoch": 0.01073} {"step": 5370, "loss": 1.1895, "grad_norm": "1.273e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.953e-01", "anc_loss": "3.379e-01", "dlm_acc": "8.244e-01", "anc_acc": "8.121e-01", "epoch": 0.01074} {"step": 5375, "loss": 1.5557, "grad_norm": "8.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.637e+00", "dlm_acc": "4.677e-01", "anc_acc": "4.574e-01", "epoch": 0.01075} {"step": 5380, "loss": 1.6117, "grad_norm": "6.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.046e+00", "dlm_acc": "5.998e-01", "anc_acc": "5.929e-01", "epoch": 0.01076} {"step": 5385, "loss": 1.7343, "grad_norm": "6.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.486e+00", "anc_loss": "1.548e+00", "dlm_acc": "4.907e-01", "anc_acc": "4.804e-01", "epoch": 0.01077} {"step": 5390, "loss": 1.1281, "grad_norm": "3.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.143e-01", "anc_loss": "8.625e-01", "dlm_acc": "6.833e-01", "anc_acc": "6.745e-01", "epoch": 0.01078} {"step": 5395, "loss": 1.1172, "grad_norm": "3.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.037e+00", "anc_loss": "1.100e+00", "dlm_acc": "6.195e-01", "anc_acc": "6.062e-01", "epoch": 0.01079} {"step": 5400, "loss": 1.336, "grad_norm": "4.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.975e-02", "anc_loss": "5.232e-02", "dlm_acc": "9.690e-01", "anc_acc": "9.682e-01", "epoch": 0.0108} {"step": 5405, "loss": 1.1578, "grad_norm": "2.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.426e-01", "anc_loss": "6.715e-01", "dlm_acc": "6.250e-01", "anc_acc": "6.144e-01", "epoch": 0.01081} {"step": 5410, "loss": 1.9921, "grad_norm": "4.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.681e+00", "anc_loss": "2.709e+00", "dlm_acc": "9.584e-02", "anc_acc": "9.414e-02", "epoch": 0.01082} {"step": 5415, "loss": 1.379, "grad_norm": "2.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.531e+00", "anc_loss": "2.544e+00", "dlm_acc": "2.378e-02", "anc_acc": "2.296e-02", "epoch": 0.01083} {"step": 5420, "loss": 1.7578, "grad_norm": "4.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.638e+00", "anc_loss": "2.642e+00", "dlm_acc": "8.128e-02", "anc_acc": "8.180e-02", "epoch": 0.01084} {"step": 5425, "loss": 2.4651, "grad_norm": "3.636e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.062e+00", "anc_loss": "3.075e+00", "dlm_acc": "2.274e-02", "anc_acc": "2.183e-02", "epoch": 0.01085} {"step": 5430, "loss": 1.7915, "grad_norm": "8.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.816e+00", "anc_loss": "1.852e+00", "dlm_acc": "3.894e-01", "anc_acc": "3.838e-01", "epoch": 0.01086} {"step": 5435, "loss": 1.0543, "grad_norm": "5.306e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.375e-01", "anc_loss": "9.738e-01", "dlm_acc": "6.391e-01", "anc_acc": "6.312e-01", "epoch": 0.01087} {"step": 5440, "loss": 0.8577, "grad_norm": "4.619e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.155e+00", "dlm_acc": "5.377e-01", "anc_acc": "5.277e-01", "epoch": 0.01088} {"step": 5445, "loss": 1.5603, "grad_norm": "5.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.909e+00", "anc_loss": "1.984e+00", "dlm_acc": "4.389e-01", "anc_acc": "4.292e-01", "epoch": 0.01089} {"step": 5450, "loss": 1.4501, "grad_norm": "3.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.157e-01", "anc_acc": "5.035e-01", "epoch": 0.0109} {"step": 5455, "loss": 1.6127, "grad_norm": "4.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.483e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.007e-01", "anc_acc": "4.908e-01", "epoch": 0.01091} {"step": 5460, "loss": 1.4596, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.661e-01", "anc_acc": "5.587e-01", "epoch": 0.01092} {"step": 5465, "loss": 1.1627, "grad_norm": "4.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.898e-01", "anc_loss": "5.992e-01", "dlm_acc": "5.613e-01", "anc_acc": "5.564e-01", "epoch": 0.01093} {"step": 5470, "loss": 1.241, "grad_norm": "5.382e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.922e-01", "anc_loss": "8.066e-01", "dlm_acc": "5.365e-01", "anc_acc": "5.301e-01", "epoch": 0.01094} {"step": 5475, "loss": 1.7587, "grad_norm": "7.696e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.242e+00", "dlm_acc": "5.759e-01", "anc_acc": "5.690e-01", "epoch": 0.01095} {"step": 5480, "loss": 1.182, "grad_norm": "3.884e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.414e-01", "anc_loss": "9.840e-01", "dlm_acc": "6.186e-01", "anc_acc": "6.103e-01", "epoch": 0.01096} {"step": 5485, "loss": 1.7572, "grad_norm": "4.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.523e-01", "anc_loss": "5.602e-01", "dlm_acc": "6.703e-01", "anc_acc": "6.652e-01", "epoch": 0.01097} {"step": 5490, "loss": 1.9601, "grad_norm": "4.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.226e+00", "anc_loss": "1.265e+00", "dlm_acc": "4.909e-01", "anc_acc": "4.859e-01", "epoch": 0.01098} {"step": 5495, "loss": 1.0855, "grad_norm": "2.752e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.324e-01", "anc_loss": "5.469e-01", "dlm_acc": "5.919e-01", "anc_acc": "5.806e-01", "epoch": 0.01099} {"step": 5500, "loss": 1.1622, "grad_norm": "7.245e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.738e-01", "anc_loss": "5.910e-01", "dlm_acc": "5.979e-01", "anc_acc": "5.862e-01", "epoch": 0.011} {"step": 5505, "loss": 1.1712, "grad_norm": "5.358e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.789e-01", "anc_loss": "4.898e-01", "dlm_acc": "6.260e-01", "anc_acc": "6.174e-01", "epoch": 0.01101} {"step": 5510, "loss": 1.0534, "grad_norm": "5.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.660e-01", "anc_loss": "6.859e-01", "dlm_acc": "6.264e-01", "anc_acc": "6.201e-01", "epoch": 0.01102} {"step": 5515, "loss": 1.8916, "grad_norm": "5.101e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.130e+00", "dlm_acc": "5.673e-01", "anc_acc": "5.606e-01", "epoch": 0.01103} {"step": 5520, "loss": 1.4248, "grad_norm": "7.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "9.781e-01", "dlm_acc": "7.243e-01", "anc_acc": "7.154e-01", "epoch": 0.01104} {"step": 5525, "loss": 1.2134, "grad_norm": "5.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.461e-01", "anc_acc": "5.376e-01", "epoch": 0.01105} {"step": 5530, "loss": 1.1285, "grad_norm": "2.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.047e-01", "anc_loss": "8.328e-01", "dlm_acc": "5.859e-01", "anc_acc": "5.791e-01", "epoch": 0.01106} {"step": 5535, "loss": 1.4004, "grad_norm": "3.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.566e-01", "anc_loss": "7.758e-01", "dlm_acc": "5.908e-01", "anc_acc": "5.840e-01", "epoch": 0.01107} {"step": 5540, "loss": 0.8379, "grad_norm": "4.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.984e-01", "anc_loss": "9.391e-01", "dlm_acc": "6.118e-01", "anc_acc": "6.034e-01", "epoch": 0.01108} {"step": 5545, "loss": 1.5854, "grad_norm": "5.733e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.414e-01", "anc_loss": "6.531e-01", "dlm_acc": "5.441e-01", "anc_acc": "5.381e-01", "epoch": 0.01109} {"step": 5550, "loss": 1.4802, "grad_norm": "3.462e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.762e-01", "anc_loss": "7.887e-01", "dlm_acc": "5.295e-01", "anc_acc": "5.243e-01", "epoch": 0.0111} {"step": 5555, "loss": 1.2506, "grad_norm": "5.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.000e-01", "anc_loss": "8.023e-01", "dlm_acc": "5.350e-01", "anc_acc": "5.365e-01", "epoch": 0.01111} {"step": 5560, "loss": 1.0956, "grad_norm": "3.939e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.883e-01", "anc_loss": "6.898e-01", "dlm_acc": "5.573e-01", "anc_acc": "5.563e-01", "epoch": 0.01112} {"step": 5565, "loss": 1.0978, "grad_norm": "3.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.547e-01", "anc_loss": "7.586e-01", "dlm_acc": "5.250e-01", "anc_acc": "5.240e-01", "epoch": 0.01113} {"step": 5570, "loss": 1.0048, "grad_norm": "3.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.844e-01", "anc_loss": "6.883e-01", "dlm_acc": "5.436e-01", "anc_acc": "5.437e-01", "epoch": 0.01114} {"step": 5575, "loss": 1.0503, "grad_norm": "5.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.934e-01", "anc_loss": "6.980e-01", "dlm_acc": "5.522e-01", "anc_acc": "5.486e-01", "epoch": 0.01115} {"step": 5580, "loss": 1.1242, "grad_norm": "2.547e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.262e-01", "anc_loss": "6.299e-01", "dlm_acc": "5.642e-01", "anc_acc": "5.619e-01", "epoch": 0.01116} {"step": 5585, "loss": 1.5673, "grad_norm": "4.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.098e-01", "anc_acc": "5.010e-01", "epoch": 0.01117} {"step": 5590, "loss": 1.4677, "grad_norm": "3.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.169e+00", "dlm_acc": "5.415e-01", "anc_acc": "5.359e-01", "epoch": 0.01118} {"step": 5595, "loss": 1.2559, "grad_norm": "4.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.072e+00", "dlm_acc": "5.392e-01", "anc_acc": "5.287e-01", "epoch": 0.01119} {"step": 5600, "loss": 1.376, "grad_norm": "4.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.086e+00", "dlm_acc": "5.696e-01", "anc_acc": "5.575e-01", "epoch": 0.0112} {"step": 5605, "loss": 1.5417, "grad_norm": "6.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.167e+00", "dlm_acc": "5.722e-01", "anc_acc": "5.610e-01", "epoch": 0.01121} {"step": 5610, "loss": 1.5494, "grad_norm": "5.158e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.184e-01", "anc_loss": "9.488e-01", "dlm_acc": "5.410e-01", "anc_acc": "5.332e-01", "epoch": 0.01122} {"step": 5615, "loss": 1.4658, "grad_norm": "3.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.093e+00", "dlm_acc": "5.327e-01", "anc_acc": "5.234e-01", "epoch": 0.01123} {"step": 5620, "loss": 1.4299, "grad_norm": "9.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.492e+00", "anc_loss": "1.548e+00", "dlm_acc": "4.914e-01", "anc_acc": "4.844e-01", "epoch": 0.01124} {"step": 5625, "loss": 1.3094, "grad_norm": "4.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.219e-01", "anc_loss": "7.266e-01", "dlm_acc": "4.982e-01", "anc_acc": "4.969e-01", "epoch": 0.01125} {"step": 5630, "loss": 1.2997, "grad_norm": "7.071e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.115e+00", "anc_loss": "1.151e+00", "dlm_acc": "5.021e-01", "anc_acc": "4.966e-01", "epoch": 0.01126} {"step": 5635, "loss": 1.489, "grad_norm": "8.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.834e-01", "anc_acc": "5.743e-01", "epoch": 0.01127} {"step": 5640, "loss": 1.4081, "grad_norm": "4.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.015e+00", "anc_loss": "1.065e+00", "dlm_acc": "5.810e-01", "anc_acc": "5.687e-01", "epoch": 0.01128} {"step": 5645, "loss": 1.6823, "grad_norm": "5.510e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.271e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.546e-01", "anc_acc": "5.412e-01", "epoch": 0.01129} {"step": 5650, "loss": 1.5615, "grad_norm": "5.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.408e+00", "anc_loss": "1.452e+00", "dlm_acc": "5.276e-01", "anc_acc": "5.203e-01", "epoch": 0.0113} {"step": 5655, "loss": 1.4091, "grad_norm": "3.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.303e+00", "dlm_acc": "5.506e-01", "anc_acc": "5.382e-01", "epoch": 0.01131} {"step": 5660, "loss": 1.2385, "grad_norm": "3.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.332e-01", "anc_loss": "9.805e-01", "dlm_acc": "5.971e-01", "anc_acc": "5.868e-01", "epoch": 0.01132} {"step": 5665, "loss": 0.9617, "grad_norm": "2.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.031e-01", "anc_loss": "7.289e-01", "dlm_acc": "5.602e-01", "anc_acc": "5.531e-01", "epoch": 0.01133} {"step": 5670, "loss": 1.6841, "grad_norm": "3.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.134e+00", "dlm_acc": "4.982e-01", "anc_acc": "4.914e-01", "epoch": 0.01134} {"step": 5675, "loss": 1.519, "grad_norm": "6.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.242e-01", "anc_loss": "9.516e-01", "dlm_acc": "5.192e-01", "anc_acc": "5.114e-01", "epoch": 0.01135} {"step": 5680, "loss": 1.52, "grad_norm": "2.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.202e+00", "dlm_acc": "6.052e-01", "anc_acc": "5.941e-01", "epoch": 0.01136} {"step": 5685, "loss": 1.2039, "grad_norm": "2.912e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.047e+00", "anc_loss": "1.078e+00", "dlm_acc": "5.125e-01", "anc_acc": "5.042e-01", "epoch": 0.01137} {"step": 5690, "loss": 1.3745, "grad_norm": "3.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.300e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.078e-01", "anc_acc": "4.975e-01", "epoch": 0.01138} {"step": 5695, "loss": 1.3457, "grad_norm": "3.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.855e-01", "anc_loss": "1.029e+00", "dlm_acc": "5.873e-01", "anc_acc": "5.789e-01", "epoch": 0.01139} {"step": 5700, "loss": 0.903, "grad_norm": "2.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.234e-01", "anc_loss": "7.535e-01", "dlm_acc": "6.193e-01", "anc_acc": "6.124e-01", "epoch": 0.0114} {"step": 5705, "loss": 1.2746, "grad_norm": "4.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.922e-01", "anc_loss": "4.965e-01", "dlm_acc": "6.279e-01", "anc_acc": "6.257e-01", "epoch": 0.01141} {"step": 5710, "loss": 1.3337, "grad_norm": "6.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.613e-01", "anc_loss": "7.844e-01", "dlm_acc": "6.353e-01", "anc_acc": "6.295e-01", "epoch": 0.01142} {"step": 5715, "loss": 1.5025, "grad_norm": "2.617e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.594e-01", "anc_loss": "1.002e+00", "dlm_acc": "6.702e-01", "anc_acc": "6.619e-01", "epoch": 0.01143} {"step": 5720, "loss": 1.2977, "grad_norm": "3.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.391e-01", "anc_loss": "6.453e-01", "dlm_acc": "5.482e-01", "anc_acc": "5.484e-01", "epoch": 0.01144} {"step": 5725, "loss": 1.3507, "grad_norm": "3.717e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.395e-01", "anc_loss": "9.770e-01", "dlm_acc": "5.577e-01", "anc_acc": "5.502e-01", "epoch": 0.01145} {"step": 5730, "loss": 1.3672, "grad_norm": "2.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.061e+00", "dlm_acc": "5.580e-01", "anc_acc": "5.496e-01", "epoch": 0.01146} {"step": 5735, "loss": 1.4133, "grad_norm": "3.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.699e-01", "anc_loss": "9.876e-01", "dlm_acc": "4.911e-01", "anc_acc": "4.870e-01", "epoch": 0.01147} {"step": 5740, "loss": 1.432, "grad_norm": "3.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.009e-01", "anc_acc": "4.901e-01", "epoch": 0.01148} {"step": 5745, "loss": 1.3674, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.163e+00", "dlm_acc": "4.979e-01", "anc_acc": "4.918e-01", "epoch": 0.01149} {"step": 5750, "loss": 1.5579, "grad_norm": "5.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.344e-01", "anc_loss": "9.559e-01", "dlm_acc": "5.610e-01", "anc_acc": "5.556e-01", "epoch": 0.0115} {"step": 5755, "loss": 1.1269, "grad_norm": "4.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.945e-01", "anc_loss": "1.041e+00", "dlm_acc": "5.579e-01", "anc_acc": "5.518e-01", "epoch": 0.01151} {"step": 5760, "loss": 1.3567, "grad_norm": "7.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.100e+00", "dlm_acc": "5.120e-01", "anc_acc": "5.049e-01", "epoch": 0.01152} {"step": 5765, "loss": 1.1189, "grad_norm": "4.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.000e-01", "anc_loss": "7.219e-01", "dlm_acc": "5.586e-01", "anc_acc": "5.488e-01", "epoch": 0.01153} {"step": 5770, "loss": 1.1904, "grad_norm": "2.837e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.058e+00", "dlm_acc": "5.954e-01", "anc_acc": "5.876e-01", "epoch": 0.01154} {"step": 5775, "loss": 1.0458, "grad_norm": "3.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.820e-01", "anc_loss": "8.016e-01", "dlm_acc": "5.263e-01", "anc_acc": "5.220e-01", "epoch": 0.01155} {"step": 5780, "loss": 1.4516, "grad_norm": "6.071e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.103e+00", "dlm_acc": "5.185e-01", "anc_acc": "5.111e-01", "epoch": 0.01156} {"step": 5785, "loss": 0.7867, "grad_norm": "3.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.113e-01", "anc_loss": "6.219e-01", "dlm_acc": "5.348e-01", "anc_acc": "5.299e-01", "epoch": 0.01157} {"step": 5790, "loss": 1.0098, "grad_norm": "4.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.105e-01", "anc_loss": "8.266e-01", "dlm_acc": "5.058e-01", "anc_acc": "4.999e-01", "epoch": 0.01158} {"step": 5795, "loss": 1.5332, "grad_norm": "7.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.116e+00", "dlm_acc": "5.888e-01", "anc_acc": "5.794e-01", "epoch": 0.01159} {"step": 5800, "loss": 1.3765, "grad_norm": "5.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.211e+00", "dlm_acc": "6.419e-01", "anc_acc": "6.319e-01", "epoch": 0.0116} {"step": 5805, "loss": 1.0718, "grad_norm": "2.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.014e-01", "anc_loss": "9.381e-01", "dlm_acc": "6.161e-01", "anc_acc": "6.093e-01", "epoch": 0.01161} {"step": 5810, "loss": 1.2228, "grad_norm": "5.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.300e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.745e-01", "anc_acc": "5.622e-01", "epoch": 0.01162} {"step": 5815, "loss": 0.8312, "grad_norm": "3.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.320e-01", "anc_loss": "6.332e-01", "dlm_acc": "5.684e-01", "anc_acc": "5.676e-01", "epoch": 0.01163} {"step": 5820, "loss": 1.081, "grad_norm": "3.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.969e-01", "anc_loss": "7.012e-01", "dlm_acc": "5.438e-01", "anc_acc": "5.457e-01", "epoch": 0.01164} {"step": 5825, "loss": 1.0758, "grad_norm": "3.048e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.172e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.401e-01", "anc_acc": "5.336e-01", "epoch": 0.01165} {"step": 5830, "loss": 0.6482, "grad_norm": "3.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.781e-01", "anc_loss": "6.969e-01", "dlm_acc": "5.638e-01", "anc_acc": "5.579e-01", "epoch": 0.01166} {"step": 5835, "loss": 1.1958, "grad_norm": "4.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.469e-01", "anc_loss": "9.734e-01", "dlm_acc": "5.342e-01", "anc_acc": "5.279e-01", "epoch": 0.01167} {"step": 5840, "loss": 0.7695, "grad_norm": "8.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.123e+00", "dlm_acc": "4.876e-01", "anc_acc": "4.793e-01", "epoch": 0.01168} {"step": 5845, "loss": 0.7226, "grad_norm": "4.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.895e-01", "anc_loss": "9.125e-01", "dlm_acc": "5.104e-01", "anc_acc": "5.070e-01", "epoch": 0.01169} {"step": 5850, "loss": 0.9311, "grad_norm": "4.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.570e-01", "anc_loss": "8.750e-01", "dlm_acc": "5.207e-01", "anc_acc": "5.136e-01", "epoch": 0.0117} {"step": 5855, "loss": 0.9571, "grad_norm": "2.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.773e-01", "anc_loss": "1.018e+00", "dlm_acc": "5.941e-01", "anc_acc": "5.855e-01", "epoch": 0.01171} {"step": 5860, "loss": 0.6946, "grad_norm": "1.149e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.579e-01", "anc_loss": "7.925e-01", "dlm_acc": "7.232e-01", "anc_acc": "7.182e-01", "epoch": 0.01172} {"step": 5865, "loss": 0.6539, "grad_norm": "3.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.062e-01", "anc_loss": "6.327e-01", "dlm_acc": "7.647e-01", "anc_acc": "7.574e-01", "epoch": 0.01173} {"step": 5870, "loss": 0.8605, "grad_norm": "2.473e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.418e-01", "anc_loss": "9.723e-01", "dlm_acc": "5.954e-01", "anc_acc": "5.877e-01", "epoch": 0.01174} {"step": 5875, "loss": 0.613, "grad_norm": "2.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.031e-01", "anc_loss": "4.102e-01", "dlm_acc": "6.862e-01", "anc_acc": "6.831e-01", "epoch": 0.01175} {"step": 5880, "loss": 0.9137, "grad_norm": "3.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.016e-01", "anc_loss": "4.094e-01", "dlm_acc": "6.934e-01", "anc_acc": "6.884e-01", "epoch": 0.01176} {"step": 5885, "loss": 0.6198, "grad_norm": "2.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.453e-01", "anc_loss": "3.527e-01", "dlm_acc": "7.202e-01", "anc_acc": "7.155e-01", "epoch": 0.01177} {"step": 5890, "loss": 1.2557, "grad_norm": "2.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.703e-01", "anc_loss": "4.723e-01", "dlm_acc": "6.827e-01", "anc_acc": "6.790e-01", "epoch": 0.01178} {"step": 5895, "loss": 1.286, "grad_norm": "2.986e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.039e-01", "anc_loss": "4.137e-01", "dlm_acc": "7.009e-01", "anc_acc": "6.972e-01", "epoch": 0.01179} {"step": 5900, "loss": 0.8522, "grad_norm": "3.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.527e-01", "anc_loss": "4.586e-01", "dlm_acc": "6.540e-01", "anc_acc": "6.533e-01", "epoch": 0.0118} {"step": 5905, "loss": 1.1796, "grad_norm": "7.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.174e+00", "dlm_acc": "5.352e-01", "anc_acc": "5.306e-01", "epoch": 0.01181} {"step": 5910, "loss": 0.8393, "grad_norm": "3.373e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.561e-01", "anc_loss": "9.980e-01", "dlm_acc": "6.325e-01", "anc_acc": "6.202e-01", "epoch": 0.01182} {"step": 5915, "loss": 1.9398, "grad_norm": "4.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.952e+00", "anc_loss": "2.014e+00", "dlm_acc": "4.232e-01", "anc_acc": "4.152e-01", "epoch": 0.01183} {"step": 5920, "loss": 0.879, "grad_norm": "2.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.471e-01", "anc_loss": "6.754e-01", "dlm_acc": "7.160e-01", "anc_acc": "7.071e-01", "epoch": 0.01184} {"step": 5925, "loss": 1.1593, "grad_norm": "3.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.250e-01", "anc_loss": "7.668e-01", "dlm_acc": "7.299e-01", "anc_acc": "7.214e-01", "epoch": 0.01185} {"step": 5930, "loss": 1.0557, "grad_norm": "1.164e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "9.523e-01", "dlm_acc": "5.161e-01", "anc_acc": "5.107e-01", "epoch": 0.01186} {"step": 5935, "loss": 1.4684, "grad_norm": "8.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.312e+00", "dlm_acc": "4.257e-01", "anc_acc": "4.196e-01", "epoch": 0.01187} {"step": 5940, "loss": 1.0741, "grad_norm": "3.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.388e+00", "anc_loss": "1.431e+00", "dlm_acc": "4.290e-01", "anc_acc": "4.220e-01", "epoch": 0.01188} {"step": 5945, "loss": 1.1457, "grad_norm": "4.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.427e-01", "anc_acc": "5.340e-01", "epoch": 0.01189} {"step": 5950, "loss": 1.2063, "grad_norm": "4.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.032e+00", "dlm_acc": "6.271e-01", "anc_acc": "6.218e-01", "epoch": 0.0119} {"step": 5955, "loss": 1.0172, "grad_norm": "3.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.520e-01", "anc_loss": "2.561e-01", "dlm_acc": "8.565e-01", "anc_acc": "8.561e-01", "epoch": 0.01191} {"step": 5960, "loss": 0.75, "grad_norm": "3.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.858e-01", "anc_loss": "1.861e-01", "dlm_acc": "8.671e-01", "anc_acc": "8.671e-01", "epoch": 0.01192} {"step": 5965, "loss": 1.3017, "grad_norm": "3.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.918e-01", "anc_loss": "8.309e-01", "dlm_acc": "6.529e-01", "anc_acc": "6.447e-01", "epoch": 0.01193} {"step": 5970, "loss": 1.36, "grad_norm": "3.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.152e-01", "anc_loss": "9.578e-01", "dlm_acc": "6.424e-01", "anc_acc": "6.349e-01", "epoch": 0.01194} {"step": 5975, "loss": 1.0165, "grad_norm": "4.508e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.029e-01", "anc_acc": "5.926e-01", "epoch": 0.01195} {"step": 5980, "loss": 1.281, "grad_norm": "6.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.930e-01", "anc_loss": "8.301e-01", "dlm_acc": "6.845e-01", "anc_acc": "6.771e-01", "epoch": 0.01196} {"step": 5985, "loss": 0.8392, "grad_norm": "3.411e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.354e-01", "anc_loss": "3.453e-01", "dlm_acc": "7.627e-01", "anc_acc": "7.612e-01", "epoch": 0.01197} {"step": 5990, "loss": 1.0387, "grad_norm": "3.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.520e-01", "anc_loss": "4.605e-01", "dlm_acc": "7.107e-01", "anc_acc": "7.086e-01", "epoch": 0.01198} {"step": 5995, "loss": 1.6288, "grad_norm": "3.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.289e-01", "anc_loss": "9.613e-01", "dlm_acc": "6.372e-01", "anc_acc": "6.289e-01", "epoch": 0.01199} {"step": 6000, "loss": 1.4302, "grad_norm": "3.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.384e-01", "anc_loss": "7.723e-01", "dlm_acc": "6.961e-01", "anc_acc": "6.870e-01", "epoch": 0.012} {"step": 6005, "loss": 1.8432, "grad_norm": "5.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.711e+00", "anc_loss": "1.774e+00", "dlm_acc": "4.718e-01", "anc_acc": "4.622e-01", "epoch": 0.01201} {"step": 6010, "loss": 1.4502, "grad_norm": "5.537e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.828e-01", "anc_loss": "1.044e+00", "dlm_acc": "6.456e-01", "anc_acc": "6.345e-01", "epoch": 0.01202} {"step": 6015, "loss": 1.5433, "grad_norm": "1.044e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.570e-01", "anc_loss": "8.328e-01", "dlm_acc": "7.779e-01", "anc_acc": "7.673e-01", "epoch": 0.01203} {"step": 6020, "loss": 1.5184, "grad_norm": "5.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.186e+00", "anc_loss": "1.236e+00", "dlm_acc": "5.903e-01", "anc_acc": "5.810e-01", "epoch": 0.01204} {"step": 6025, "loss": 1.3042, "grad_norm": "5.639e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.111e+00", "anc_loss": "1.155e+00", "dlm_acc": "5.727e-01", "anc_acc": "5.669e-01", "epoch": 0.01205} {"step": 6030, "loss": 1.4326, "grad_norm": "4.136e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.494e+00", "anc_loss": "1.566e+00", "dlm_acc": "5.134e-01", "anc_acc": "5.032e-01", "epoch": 0.01206} {"step": 6035, "loss": 1.3837, "grad_norm": "1.532e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.182e+00", "dlm_acc": "5.930e-01", "anc_acc": "5.848e-01", "epoch": 0.01207} {"step": 6040, "loss": 1.1282, "grad_norm": "3.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.796e-01", "anc_loss": "6.033e-01", "dlm_acc": "7.836e-01", "anc_acc": "7.748e-01", "epoch": 0.01208} {"step": 6045, "loss": 1.0638, "grad_norm": "4.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.035e+00", "anc_loss": "1.074e+00", "dlm_acc": "6.072e-01", "anc_acc": "5.996e-01", "epoch": 0.01209} {"step": 6050, "loss": 0.956, "grad_norm": "2.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.191e-01", "anc_loss": "5.281e-01", "dlm_acc": "5.761e-01", "anc_acc": "5.740e-01", "epoch": 0.0121} {"step": 6055, "loss": 1.1586, "grad_norm": "2.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.643e-01", "anc_loss": "9.896e-01", "dlm_acc": "5.173e-01", "anc_acc": "5.132e-01", "epoch": 0.01211} {"step": 6060, "loss": 1.0991, "grad_norm": "5.095e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.436e-01", "anc_acc": "5.369e-01", "epoch": 0.01212} {"step": 6065, "loss": 1.2122, "grad_norm": "3.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.564e+00", "dlm_acc": "4.564e-01", "anc_acc": "4.462e-01", "epoch": 0.01213} {"step": 6070, "loss": 1.1348, "grad_norm": "4.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.202e+00", "dlm_acc": "5.970e-01", "anc_acc": "5.874e-01", "epoch": 0.01214} {"step": 6075, "loss": 1.0403, "grad_norm": "4.667e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.024e+00", "anc_loss": "1.050e+00", "dlm_acc": "4.559e-01", "anc_acc": "4.532e-01", "epoch": 0.01215} {"step": 6080, "loss": 0.9813, "grad_norm": "2.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.383e-01", "anc_loss": "9.563e-01", "dlm_acc": "4.926e-01", "anc_acc": "4.886e-01", "epoch": 0.01216} {"step": 6085, "loss": 0.9554, "grad_norm": "3.602e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.859e-01", "anc_loss": "1.017e+00", "dlm_acc": "5.130e-01", "anc_acc": "5.060e-01", "epoch": 0.01217} {"step": 6090, "loss": 1.1062, "grad_norm": "4.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.057e-01", "anc_loss": "9.230e-01", "dlm_acc": "6.091e-01", "anc_acc": "6.060e-01", "epoch": 0.01218} {"step": 6095, "loss": 1.1436, "grad_norm": "3.657e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.164e+00", "dlm_acc": "5.819e-01", "anc_acc": "5.750e-01", "epoch": 0.01219} {"step": 6100, "loss": 0.7534, "grad_norm": "2.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.089e-01", "anc_loss": "5.301e-01", "dlm_acc": "8.086e-01", "anc_acc": "8.051e-01", "epoch": 0.0122} {"step": 6105, "loss": 0.7251, "grad_norm": "3.377e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.005e-01", "anc_loss": "5.143e-01", "dlm_acc": "7.463e-01", "anc_acc": "7.403e-01", "epoch": 0.01221} {"step": 6110, "loss": 0.9516, "grad_norm": "3.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.984e-01", "anc_loss": "7.086e-01", "dlm_acc": "5.898e-01", "anc_acc": "5.883e-01", "epoch": 0.01222} {"step": 6115, "loss": 1.226, "grad_norm": "2.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.197e+00", "anc_loss": "1.245e+00", "dlm_acc": "6.306e-01", "anc_acc": "6.238e-01", "epoch": 0.01223} {"step": 6120, "loss": 1.4756, "grad_norm": "3.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.172e+00", "anc_loss": "1.228e+00", "dlm_acc": "5.847e-01", "anc_acc": "5.752e-01", "epoch": 0.01224} {"step": 6125, "loss": 1.3408, "grad_norm": "3.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.688e+00", "dlm_acc": "5.008e-01", "anc_acc": "4.910e-01", "epoch": 0.01225} {"step": 6130, "loss": 1.2213, "grad_norm": "3.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.107e-01", "anc_loss": "6.430e-01", "dlm_acc": "7.344e-01", "anc_acc": "7.237e-01", "epoch": 0.01226} {"step": 6135, "loss": 1.2279, "grad_norm": "4.067e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.233e+00", "anc_loss": "1.285e+00", "dlm_acc": "5.482e-01", "anc_acc": "5.391e-01", "epoch": 0.01227} {"step": 6140, "loss": 1.5523, "grad_norm": "3.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.540e-01", "epoch": 0.01228} {"step": 6145, "loss": 1.3817, "grad_norm": "3.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.764e+00", "dlm_acc": "4.788e-01", "anc_acc": "4.671e-01", "epoch": 0.01229} {"step": 6150, "loss": 1.1306, "grad_norm": "4.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.580e+00", "dlm_acc": "4.710e-01", "anc_acc": "4.605e-01", "epoch": 0.0123} {"step": 6155, "loss": 1.4827, "grad_norm": "3.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.998e+00", "anc_loss": "2.081e+00", "dlm_acc": "4.466e-01", "anc_acc": "4.346e-01", "epoch": 0.01231} {"step": 6160, "loss": 1.0706, "grad_norm": "3.961e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.533e+00", "anc_loss": "1.603e+00", "dlm_acc": "4.947e-01", "anc_acc": "4.828e-01", "epoch": 0.01232} {"step": 6165, "loss": 1.4519, "grad_norm": "3.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.282e+00", "anc_loss": "1.340e+00", "dlm_acc": "5.601e-01", "anc_acc": "5.497e-01", "epoch": 0.01233} {"step": 6170, "loss": 1.1396, "grad_norm": "4.687e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.007e+00", "anc_loss": "1.066e+00", "dlm_acc": "6.097e-01", "anc_acc": "5.979e-01", "epoch": 0.01234} {"step": 6175, "loss": 1.5681, "grad_norm": "4.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.508e+00", "dlm_acc": "5.275e-01", "anc_acc": "5.141e-01", "epoch": 0.01235} {"step": 6180, "loss": 1.1969, "grad_norm": "3.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.147e+00", "anc_loss": "1.206e+00", "dlm_acc": "5.511e-01", "anc_acc": "5.391e-01", "epoch": 0.01236} {"step": 6185, "loss": 1.2533, "grad_norm": "3.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.221e+00", "dlm_acc": "5.815e-01", "anc_acc": "5.702e-01", "epoch": 0.01237} {"step": 6190, "loss": 1.6746, "grad_norm": "3.653e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.602e+00", "dlm_acc": "4.992e-01", "anc_acc": "4.840e-01", "epoch": 0.01238} {"step": 6195, "loss": 1.6816, "grad_norm": "4.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.150e+00", "anc_loss": "2.195e+00", "dlm_acc": "3.421e-01", "anc_acc": "3.350e-01", "epoch": 0.01239} {"step": 6200, "loss": 1.5288, "grad_norm": "3.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.517e+00", "anc_loss": "1.584e+00", "dlm_acc": "5.284e-01", "anc_acc": "5.153e-01", "epoch": 0.0124} {"step": 6205, "loss": 1.4951, "grad_norm": "3.001e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.457e+00", "anc_loss": "1.504e+00", "dlm_acc": "5.482e-01", "anc_acc": "5.382e-01", "epoch": 0.01241} {"step": 6210, "loss": 1.641, "grad_norm": "4.926e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.378e+00", "anc_loss": "1.443e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.398e-01", "epoch": 0.01242} {"step": 6215, "loss": 1.2849, "grad_norm": "2.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.329e+00", "dlm_acc": "4.817e-01", "anc_acc": "4.727e-01", "epoch": 0.01243} {"step": 6220, "loss": 1.6752, "grad_norm": "4.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.594e+00", "anc_loss": "1.651e+00", "dlm_acc": "4.960e-01", "anc_acc": "4.864e-01", "epoch": 0.01244} {"step": 6225, "loss": 1.4308, "grad_norm": "3.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.448e+00", "anc_loss": "1.509e+00", "dlm_acc": "4.925e-01", "anc_acc": "4.805e-01", "epoch": 0.01245} {"step": 6230, "loss": 1.5873, "grad_norm": "3.657e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.214e+00", "anc_loss": "1.267e+00", "dlm_acc": "6.311e-01", "anc_acc": "6.216e-01", "epoch": 0.01246} {"step": 6235, "loss": 1.5056, "grad_norm": "4.280e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.191e-01", "anc_acc": "5.085e-01", "epoch": 0.01247} {"step": 6240, "loss": 1.7387, "grad_norm": "3.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.049e+00", "anc_loss": "1.101e+00", "dlm_acc": "6.696e-01", "anc_acc": "6.598e-01", "epoch": 0.01248} {"step": 6245, "loss": 1.7353, "grad_norm": "2.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.102e+00", "dlm_acc": "5.596e-01", "anc_acc": "5.504e-01", "epoch": 0.01249} {"step": 6250, "loss": 1.1092, "grad_norm": "3.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.595e-01", "anc_acc": "5.484e-01", "epoch": 0.0125} {"step": 6255, "loss": 1.1855, "grad_norm": "3.761e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.133e+00", "dlm_acc": "5.716e-01", "anc_acc": "5.605e-01", "epoch": 0.01251} {"step": 6260, "loss": 1.4205, "grad_norm": "3.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.014e-01", "anc_acc": "4.881e-01", "epoch": 0.01252} {"step": 6265, "loss": 1.3488, "grad_norm": "2.740e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "9.281e-01", "dlm_acc": "3.184e-01", "anc_acc": "3.155e-01", "epoch": 0.01253} {"step": 6270, "loss": 1.315, "grad_norm": "2.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.053e+00", "dlm_acc": "3.840e-01", "anc_acc": "3.799e-01", "epoch": 0.01254} {"step": 6275, "loss": 1.3424, "grad_norm": "5.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.229e+00", "dlm_acc": "5.508e-01", "anc_acc": "5.427e-01", "epoch": 0.01255} {"step": 6280, "loss": 1.6511, "grad_norm": "3.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.467e+00", "anc_loss": "1.553e+00", "dlm_acc": "5.335e-01", "anc_acc": "5.208e-01", "epoch": 0.01256} {"step": 6285, "loss": 1.4827, "grad_norm": "3.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.558e-01", "anc_acc": "5.470e-01", "epoch": 0.01257} {"step": 6290, "loss": 1.2513, "grad_norm": "2.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.342e-01", "epoch": 0.01258} {"step": 6295, "loss": 1.4212, "grad_norm": "4.222e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.240e+00", "dlm_acc": "6.125e-01", "anc_acc": "6.016e-01", "epoch": 0.01259} {"step": 6300, "loss": 2.0491, "grad_norm": "9.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.703e+00", "anc_loss": "1.767e+00", "dlm_acc": "5.287e-01", "anc_acc": "5.180e-01", "epoch": 0.0126} {"step": 6305, "loss": 1.5052, "grad_norm": "2.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.215e+00", "anc_loss": "1.269e+00", "dlm_acc": "5.726e-01", "anc_acc": "5.628e-01", "epoch": 0.01261} {"step": 6310, "loss": 1.7271, "grad_norm": "3.472e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.691e+00", "dlm_acc": "4.946e-01", "anc_acc": "4.822e-01", "epoch": 0.01262} {"step": 6315, "loss": 1.6663, "grad_norm": "4.149e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.684e+00", "anc_loss": "1.755e+00", "dlm_acc": "4.971e-01", "anc_acc": "4.852e-01", "epoch": 0.01263} {"step": 6320, "loss": 1.4478, "grad_norm": "9.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.279e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.432e-01", "anc_acc": "5.306e-01", "epoch": 0.01264} {"step": 6325, "loss": 1.9591, "grad_norm": "1.757e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.808e+00", "anc_loss": "1.866e+00", "dlm_acc": "4.707e-01", "anc_acc": "4.632e-01", "epoch": 0.01265} {"step": 6330, "loss": 1.5472, "grad_norm": "3.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.268e-01", "anc_acc": "5.170e-01", "epoch": 0.01266} {"step": 6335, "loss": 1.3833, "grad_norm": "3.971e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.172e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.932e-01", "epoch": 0.01267} {"step": 6340, "loss": 1.6289, "grad_norm": "5.156e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.783e+00", "anc_loss": "1.861e+00", "dlm_acc": "4.579e-01", "anc_acc": "4.435e-01", "epoch": 0.01268} {"step": 6345, "loss": 1.3767, "grad_norm": "3.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.310e-01", "anc_acc": "5.174e-01", "epoch": 0.01269} {"step": 6350, "loss": 1.4637, "grad_norm": "3.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.598e+00", "dlm_acc": "5.510e-01", "anc_acc": "5.381e-01", "epoch": 0.0127} {"step": 6355, "loss": 1.2827, "grad_norm": "4.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.296e+00", "dlm_acc": "5.359e-01", "anc_acc": "5.226e-01", "epoch": 0.01271} {"step": 6360, "loss": 1.4946, "grad_norm": "4.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.639e+00", "dlm_acc": "4.803e-01", "anc_acc": "4.690e-01", "epoch": 0.01272} {"step": 6365, "loss": 1.3163, "grad_norm": "3.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.311e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.342e-01", "epoch": 0.01273} {"step": 6370, "loss": 1.1904, "grad_norm": "3.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.508e-01", "anc_loss": "9.973e-01", "dlm_acc": "6.404e-01", "anc_acc": "6.294e-01", "epoch": 0.01274} {"step": 6375, "loss": 1.1476, "grad_norm": "2.782e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.644e-01", "anc_acc": "5.514e-01", "epoch": 0.01275} {"step": 6380, "loss": 1.3104, "grad_norm": "2.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.148e+00", "dlm_acc": "6.386e-01", "anc_acc": "6.286e-01", "epoch": 0.01276} {"step": 6385, "loss": 1.1623, "grad_norm": "3.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.246e+00", "dlm_acc": "5.544e-01", "anc_acc": "5.424e-01", "epoch": 0.01277} {"step": 6390, "loss": 1.1475, "grad_norm": "2.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.064e+00", "dlm_acc": "6.208e-01", "anc_acc": "6.085e-01", "epoch": 0.01278} {"step": 6395, "loss": 1.2043, "grad_norm": "2.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.169e+00", "dlm_acc": "6.097e-01", "anc_acc": "5.971e-01", "epoch": 0.01279} {"step": 6400, "loss": 1.8834, "grad_norm": "5.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.775e+00", "anc_loss": "1.841e+00", "dlm_acc": "4.715e-01", "anc_acc": "4.616e-01", "epoch": 0.0128} {"step": 6405, "loss": 1.4327, "grad_norm": "3.774e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.465e+00", "dlm_acc": "5.368e-01", "anc_acc": "5.280e-01", "epoch": 0.01281} {"step": 6410, "loss": 0.9309, "grad_norm": "1.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.197e-01", "anc_loss": "9.684e-01", "dlm_acc": "6.236e-01", "anc_acc": "6.114e-01", "epoch": 0.01282} {"step": 6415, "loss": 1.6599, "grad_norm": "4.568e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.847e+00", "anc_loss": "1.919e+00", "dlm_acc": "4.390e-01", "anc_acc": "4.288e-01", "epoch": 0.01283} {"step": 6420, "loss": 0.8909, "grad_norm": "1.836e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.633e-01", "anc_loss": "9.187e-01", "dlm_acc": "6.369e-01", "anc_acc": "6.218e-01", "epoch": 0.01284} {"step": 6425, "loss": 1.7717, "grad_norm": "4.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.675e+00", "anc_loss": "1.753e+00", "dlm_acc": "4.944e-01", "anc_acc": "4.825e-01", "epoch": 0.01285} {"step": 6430, "loss": 1.1959, "grad_norm": "2.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.232e-01", "anc_acc": "5.119e-01", "epoch": 0.01286} {"step": 6435, "loss": 2.0746, "grad_norm": "3.836e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.579e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.738e-01", "anc_acc": "4.643e-01", "epoch": 0.01287} {"step": 6440, "loss": 1.4536, "grad_norm": "2.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.052e-01", "anc_acc": "4.935e-01", "epoch": 0.01288} {"step": 6445, "loss": 1.2012, "grad_norm": "5.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.051e+00", "anc_loss": "1.112e+00", "dlm_acc": "5.954e-01", "anc_acc": "5.840e-01", "epoch": 0.01289} {"step": 6450, "loss": 1.1829, "grad_norm": "4.167e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.403e+00", "dlm_acc": "5.436e-01", "anc_acc": "5.321e-01", "epoch": 0.0129} {"step": 6455, "loss": 0.8763, "grad_norm": "2.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.059e+00", "dlm_acc": "6.204e-01", "anc_acc": "6.096e-01", "epoch": 0.01291} {"step": 6460, "loss": 1.1216, "grad_norm": "3.325e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.618e+00", "anc_loss": "1.686e+00", "dlm_acc": "5.222e-01", "anc_acc": "5.105e-01", "epoch": 0.01292} {"step": 6465, "loss": 1.0921, "grad_norm": "2.338e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.249e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.555e-01", "anc_acc": "5.434e-01", "epoch": 0.01293} {"step": 6470, "loss": 1.2119, "grad_norm": "2.636e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.398e+00", "anc_loss": "1.463e+00", "dlm_acc": "5.213e-01", "anc_acc": "5.097e-01", "epoch": 0.01294} {"step": 6475, "loss": 1.1336, "grad_norm": "5.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.458e+00", "anc_loss": "1.523e+00", "dlm_acc": "5.100e-01", "anc_acc": "5.008e-01", "epoch": 0.01295} {"step": 6480, "loss": 0.8238, "grad_norm": "4.506e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.819e-01", "anc_acc": "5.696e-01", "epoch": 0.01296} {"step": 6485, "loss": 1.2019, "grad_norm": "3.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.756e+00", "anc_loss": "1.827e+00", "dlm_acc": "4.555e-01", "anc_acc": "4.431e-01", "epoch": 0.01297} {"step": 6490, "loss": 1.1482, "grad_norm": "1.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.258e+00", "dlm_acc": "5.599e-01", "anc_acc": "5.469e-01", "epoch": 0.01298} {"step": 6495, "loss": 1.3655, "grad_norm": "5.437e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.573e+00", "dlm_acc": "4.927e-01", "anc_acc": "4.793e-01", "epoch": 0.01299} {"step": 6500, "loss": 1.1841, "grad_norm": "5.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.497e-01", "anc_acc": "5.384e-01", "epoch": 0.013} {"step": 6505, "loss": 1.272, "grad_norm": "6.003e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.464e+00", "anc_loss": "1.525e+00", "dlm_acc": "5.168e-01", "anc_acc": "5.045e-01", "epoch": 0.01301} {"step": 6510, "loss": 0.9198, "grad_norm": "4.884e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.242e-01", "anc_loss": "9.789e-01", "dlm_acc": "6.744e-01", "anc_acc": "6.629e-01", "epoch": 0.01302} {"step": 6515, "loss": 1.0737, "grad_norm": "3.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.222e+00", "dlm_acc": "5.883e-01", "anc_acc": "5.744e-01", "epoch": 0.01303} {"step": 6520, "loss": 1.4036, "grad_norm": "4.041e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.663e+00", "anc_loss": "1.744e+00", "dlm_acc": "5.010e-01", "anc_acc": "4.871e-01", "epoch": 0.01304} {"step": 6525, "loss": 0.9316, "grad_norm": "3.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.406e-01", "anc_loss": "8.938e-01", "dlm_acc": "6.374e-01", "anc_acc": "6.257e-01", "epoch": 0.01305} {"step": 6530, "loss": 1.6526, "grad_norm": "8.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.895e+00", "anc_loss": "1.966e+00", "dlm_acc": "4.542e-01", "anc_acc": "4.444e-01", "epoch": 0.01306} {"step": 6535, "loss": 0.9507, "grad_norm": "2.259e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.065e+00", "dlm_acc": "6.165e-01", "anc_acc": "6.055e-01", "epoch": 0.01307} {"step": 6540, "loss": 1.0046, "grad_norm": "5.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.148e+00", "dlm_acc": "5.801e-01", "anc_acc": "5.679e-01", "epoch": 0.01308} {"step": 6545, "loss": 1.1563, "grad_norm": "3.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.258e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.668e-01", "anc_acc": "5.539e-01", "epoch": 0.01309} {"step": 6550, "loss": 1.3799, "grad_norm": "3.596e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.497e+00", "dlm_acc": "5.335e-01", "anc_acc": "5.217e-01", "epoch": 0.0131} {"step": 6555, "loss": 1.2998, "grad_norm": "3.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.368e+00", "anc_loss": "1.432e+00", "dlm_acc": "5.090e-01", "anc_acc": "4.977e-01", "epoch": 0.01311} {"step": 6560, "loss": 1.1967, "grad_norm": "3.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.104e+00", "dlm_acc": "5.431e-01", "anc_acc": "5.402e-01", "epoch": 0.01312} {"step": 6565, "loss": 1.6996, "grad_norm": "3.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.675e+00", "anc_loss": "1.742e+00", "dlm_acc": "4.825e-01", "anc_acc": "4.716e-01", "epoch": 0.01313} {"step": 6570, "loss": 1.3922, "grad_norm": "4.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.501e+00", "dlm_acc": "5.411e-01", "anc_acc": "5.272e-01", "epoch": 0.01314} {"step": 6575, "loss": 1.2318, "grad_norm": "3.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.194e+00", "dlm_acc": "5.760e-01", "anc_acc": "5.618e-01", "epoch": 0.01315} {"step": 6580, "loss": 1.6751, "grad_norm": "4.626e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.661e+00", "dlm_acc": "4.983e-01", "anc_acc": "4.873e-01", "epoch": 0.01316} {"step": 6585, "loss": 1.6877, "grad_norm": "4.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.382e+00", "anc_loss": "1.460e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.468e-01", "epoch": 0.01317} {"step": 6590, "loss": 1.6323, "grad_norm": "4.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.722e+00", "anc_loss": "1.805e+00", "dlm_acc": "4.793e-01", "anc_acc": "4.657e-01", "epoch": 0.01318} {"step": 6595, "loss": 1.4325, "grad_norm": "6.109e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.191e+00", "dlm_acc": "5.607e-01", "anc_acc": "5.476e-01", "epoch": 0.01319} {"step": 6600, "loss": 1.5964, "grad_norm": "3.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.558e+00", "dlm_acc": "4.913e-01", "anc_acc": "4.810e-01", "epoch": 0.0132} {"step": 6605, "loss": 1.3474, "grad_norm": "5.348e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.142e-01", "anc_acc": "5.029e-01", "epoch": 0.01321} {"step": 6610, "loss": 1.9878, "grad_norm": "3.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.825e+00", "anc_loss": "1.903e+00", "dlm_acc": "4.471e-01", "anc_acc": "4.364e-01", "epoch": 0.01322} {"step": 6615, "loss": 1.1538, "grad_norm": "2.444e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.072e+00", "anc_loss": "1.136e+00", "dlm_acc": "5.676e-01", "anc_acc": "5.530e-01", "epoch": 0.01323} {"step": 6620, "loss": 1.385, "grad_norm": "3.217e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.347e+00", "dlm_acc": "5.394e-01", "anc_acc": "5.275e-01", "epoch": 0.01324} {"step": 6625, "loss": 1.2956, "grad_norm": "1.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.215e-01", "anc_acc": "5.088e-01", "epoch": 0.01325} {"step": 6630, "loss": 1.5767, "grad_norm": "3.019e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.346e+00", "dlm_acc": "4.295e-01", "anc_acc": "4.229e-01", "epoch": 0.01326} {"step": 6635, "loss": 1.7177, "grad_norm": "3.157e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.025e+00", "dlm_acc": "3.105e-01", "anc_acc": "3.095e-01", "epoch": 0.01327} {"step": 6640, "loss": 1.6707, "grad_norm": "5.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.080e+00", "dlm_acc": "2.190e-01", "anc_acc": "2.183e-01", "epoch": 0.01328} {"step": 6645, "loss": 1.3746, "grad_norm": "2.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.015e+00", "anc_loss": "1.019e+00", "dlm_acc": "2.346e-01", "anc_acc": "2.331e-01", "epoch": 0.01329} {"step": 6650, "loss": 1.4575, "grad_norm": "3.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.456e+00", "anc_loss": "1.506e+00", "dlm_acc": "5.293e-01", "anc_acc": "5.199e-01", "epoch": 0.0133} {"step": 6655, "loss": 1.3271, "grad_norm": "3.785e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.047e-01", "anc_acc": "4.930e-01", "epoch": 0.01331} {"step": 6660, "loss": 1.5061, "grad_norm": "2.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.788e+00", "anc_loss": "1.861e+00", "dlm_acc": "4.734e-01", "anc_acc": "4.605e-01", "epoch": 0.01332} {"step": 6665, "loss": 1.5621, "grad_norm": "4.061e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.478e+00", "dlm_acc": "5.496e-01", "anc_acc": "5.353e-01", "epoch": 0.01333} {"step": 6670, "loss": 1.2745, "grad_norm": "4.896e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.411e+00", "dlm_acc": "5.083e-01", "anc_acc": "4.961e-01", "epoch": 0.01334} {"step": 6675, "loss": 1.4474, "grad_norm": "1.178e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.583e-01", "anc_acc": "5.458e-01", "epoch": 0.01335} {"step": 6680, "loss": 1.3054, "grad_norm": "2.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.170e+00", "dlm_acc": "5.841e-01", "anc_acc": "5.811e-01", "epoch": 0.01336} {"step": 6685, "loss": 0.9224, "grad_norm": "2.015e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.240e-01", "anc_loss": "1.257e-01", "dlm_acc": "9.292e-01", "anc_acc": "9.289e-01", "epoch": 0.01337} {"step": 6690, "loss": 1.3359, "grad_norm": "5.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.684e+00", "dlm_acc": "5.255e-01", "anc_acc": "5.203e-01", "epoch": 0.01338} {"step": 6695, "loss": 1.1248, "grad_norm": "3.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.443e+00", "anc_loss": "1.518e+00", "dlm_acc": "5.212e-01", "anc_acc": "5.088e-01", "epoch": 0.01339} {"step": 6700, "loss": 1.2779, "grad_norm": "4.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.458e+00", "dlm_acc": "5.307e-01", "anc_acc": "5.178e-01", "epoch": 0.0134} {"step": 6705, "loss": 1.4667, "grad_norm": "4.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.608e+00", "anc_loss": "1.678e+00", "dlm_acc": "4.921e-01", "anc_acc": "4.814e-01", "epoch": 0.01341} {"step": 6710, "loss": 1.3519, "grad_norm": "3.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.400e+00", "anc_loss": "1.467e+00", "dlm_acc": "5.483e-01", "anc_acc": "5.348e-01", "epoch": 0.01342} {"step": 6715, "loss": 2.0515, "grad_norm": "5.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.064e+00", "anc_loss": "2.148e+00", "dlm_acc": "4.529e-01", "anc_acc": "4.424e-01", "epoch": 0.01343} {"step": 6720, "loss": 1.4889, "grad_norm": "4.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.541e-01", "anc_acc": "5.432e-01", "epoch": 0.01344} {"step": 6725, "loss": 1.1827, "grad_norm": "1.395e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.590e-01", "anc_acc": "5.473e-01", "epoch": 0.01345} {"step": 6730, "loss": 1.6608, "grad_norm": "7.239e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.683e+00", "anc_loss": "1.752e+00", "dlm_acc": "4.686e-01", "anc_acc": "4.589e-01", "epoch": 0.01346} {"step": 6735, "loss": 1.8587, "grad_norm": "4.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.659e+00", "anc_loss": "1.736e+00", "dlm_acc": "4.931e-01", "anc_acc": "4.815e-01", "epoch": 0.01347} {"step": 6740, "loss": 1.6299, "grad_norm": "6.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.634e+00", "anc_loss": "1.702e+00", "dlm_acc": "4.801e-01", "anc_acc": "4.690e-01", "epoch": 0.01348} {"step": 6745, "loss": 1.3085, "grad_norm": "4.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.360e+00", "anc_loss": "1.424e+00", "dlm_acc": "5.553e-01", "anc_acc": "5.419e-01", "epoch": 0.01349} {"step": 6750, "loss": 1.1494, "grad_norm": "2.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.108e+00", "dlm_acc": "6.024e-01", "anc_acc": "5.925e-01", "epoch": 0.0135} {"step": 6755, "loss": 1.5232, "grad_norm": "3.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.794e+00", "anc_loss": "1.861e+00", "dlm_acc": "4.322e-01", "anc_acc": "4.220e-01", "epoch": 0.01351} {"step": 6760, "loss": 1.656, "grad_norm": "3.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.820e+00", "anc_loss": "1.902e+00", "dlm_acc": "4.609e-01", "anc_acc": "4.489e-01", "epoch": 0.01352} {"step": 6765, "loss": 0.8889, "grad_norm": "2.048e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.453e-01", "anc_loss": "1.012e+00", "dlm_acc": "6.310e-01", "anc_acc": "6.145e-01", "epoch": 0.01353} {"step": 6770, "loss": 1.3236, "grad_norm": "2.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.634e+00", "anc_loss": "1.683e+00", "dlm_acc": "4.131e-01", "anc_acc": "4.027e-01", "epoch": 0.01354} {"step": 6775, "loss": 1.3633, "grad_norm": "3.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.332e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.095e-01", "anc_acc": "4.962e-01", "epoch": 0.01355} {"step": 6780, "loss": 1.4001, "grad_norm": "3.274e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.370e+00", "anc_loss": "1.427e+00", "dlm_acc": "4.640e-01", "anc_acc": "4.538e-01", "epoch": 0.01356} {"step": 6785, "loss": 1.2737, "grad_norm": "1.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.645e-01", "anc_loss": "7.816e-01", "dlm_acc": "5.422e-01", "anc_acc": "5.380e-01", "epoch": 0.01357} {"step": 6790, "loss": 1.0177, "grad_norm": "2.963e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.758e-01", "anc_loss": "8.008e-01", "dlm_acc": "5.223e-01", "anc_acc": "5.174e-01", "epoch": 0.01358} {"step": 6795, "loss": 1.3551, "grad_norm": "5.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.284e+00", "dlm_acc": "5.574e-01", "anc_acc": "5.437e-01", "epoch": 0.01359} {"step": 6800, "loss": 1.3325, "grad_norm": "3.740e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.207e+00", "anc_loss": "1.255e+00", "dlm_acc": "5.645e-01", "anc_acc": "5.550e-01", "epoch": 0.0136} {"step": 6805, "loss": 1.0836, "grad_norm": "3.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.422e-01", "anc_loss": "7.863e-01", "dlm_acc": "6.654e-01", "anc_acc": "6.527e-01", "epoch": 0.01361} {"step": 6810, "loss": 1.0387, "grad_norm": "2.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.109e-01", "anc_loss": "9.750e-01", "dlm_acc": "6.327e-01", "anc_acc": "6.202e-01", "epoch": 0.01362} {"step": 6815, "loss": 1.0753, "grad_norm": "3.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.121e-01", "anc_loss": "9.602e-01", "dlm_acc": "6.495e-01", "anc_acc": "6.388e-01", "epoch": 0.01363} {"step": 6820, "loss": 1.4436, "grad_norm": "3.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.526e+00", "dlm_acc": "5.066e-01", "anc_acc": "4.955e-01", "epoch": 0.01364} {"step": 6825, "loss": 1.2998, "grad_norm": "3.450e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.633e-01", "anc_loss": "1.009e+00", "dlm_acc": "6.093e-01", "anc_acc": "5.976e-01", "epoch": 0.01365} {"step": 6830, "loss": 1.5306, "grad_norm": "4.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.703e+00", "anc_loss": "1.778e+00", "dlm_acc": "4.447e-01", "anc_acc": "4.310e-01", "epoch": 0.01366} {"step": 6835, "loss": 1.4284, "grad_norm": "6.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.878e-01", "anc_acc": "5.768e-01", "epoch": 0.01367} {"step": 6840, "loss": 1.8445, "grad_norm": "7.267e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.588e+00", "anc_loss": "1.646e+00", "dlm_acc": "5.251e-01", "anc_acc": "5.161e-01", "epoch": 0.01368} {"step": 6845, "loss": 1.4394, "grad_norm": "2.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.617e-01", "anc_acc": "5.485e-01", "epoch": 0.01369} {"step": 6850, "loss": 1.2856, "grad_norm": "2.337e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.366e+00", "dlm_acc": "4.900e-01", "anc_acc": "4.751e-01", "epoch": 0.0137} {"step": 6855, "loss": 1.1287, "grad_norm": "3.587e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.080e-01", "anc_loss": "6.438e-01", "dlm_acc": "7.164e-01", "anc_acc": "7.082e-01", "epoch": 0.01371} {"step": 6860, "loss": 1.8157, "grad_norm": "5.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.536e+00", "anc_loss": "1.602e+00", "dlm_acc": "5.010e-01", "anc_acc": "4.893e-01", "epoch": 0.01372} {"step": 6865, "loss": 0.8654, "grad_norm": "3.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.064e+00", "anc_loss": "1.127e+00", "dlm_acc": "5.626e-01", "anc_acc": "5.476e-01", "epoch": 0.01373} {"step": 6870, "loss": 1.2836, "grad_norm": "4.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.539e+00", "dlm_acc": "4.590e-01", "anc_acc": "4.477e-01", "epoch": 0.01374} {"step": 6875, "loss": 1.5004, "grad_norm": "4.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.306e+00", "anc_loss": "2.342e+00", "dlm_acc": "1.838e-01", "anc_acc": "1.787e-01", "epoch": 0.01375} {"step": 6880, "loss": 1.0286, "grad_norm": "6.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.436e+00", "dlm_acc": "4.780e-01", "anc_acc": "4.694e-01", "epoch": 0.01376} {"step": 6885, "loss": 1.7082, "grad_norm": "4.125e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.031e+00", "anc_loss": "2.092e+00", "dlm_acc": "2.898e-01", "anc_acc": "2.787e-01", "epoch": 0.01377} {"step": 6890, "loss": 1.5655, "grad_norm": "4.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.428e+00", "dlm_acc": "5.553e-01", "anc_acc": "5.455e-01", "epoch": 0.01378} {"step": 6895, "loss": 1.495, "grad_norm": "4.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.335e+00", "dlm_acc": "4.855e-01", "anc_acc": "4.764e-01", "epoch": 0.01379} {"step": 6900, "loss": 1.0727, "grad_norm": "4.325e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.814e-01", "anc_acc": "5.702e-01", "epoch": 0.0138} {"step": 6905, "loss": 1.3208, "grad_norm": "4.771e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.533e+00", "dlm_acc": "4.847e-01", "anc_acc": "4.714e-01", "epoch": 0.01381} {"step": 6910, "loss": 1.5593, "grad_norm": "4.170e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.092e+00", "dlm_acc": "2.990e-01", "anc_acc": "2.953e-01", "epoch": 0.01382} {"step": 6915, "loss": 0.8982, "grad_norm": "3.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.805e-01", "anc_loss": "9.453e-01", "dlm_acc": "6.468e-01", "anc_acc": "6.305e-01", "epoch": 0.01383} {"step": 6920, "loss": 1.1027, "grad_norm": "4.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.082e-01", "anc_acc": "5.010e-01", "epoch": 0.01384} {"step": 6925, "loss": 1.4755, "grad_norm": "3.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.265e+00", "dlm_acc": "6.224e-01", "anc_acc": "6.123e-01", "epoch": 0.01385} {"step": 6930, "loss": 1.3047, "grad_norm": "5.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.264e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.243e-01", "anc_acc": "5.118e-01", "epoch": 0.01386} {"step": 6935, "loss": 1.5344, "grad_norm": "9.352e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.677e+00", "anc_loss": "1.752e+00", "dlm_acc": "4.654e-01", "anc_acc": "4.511e-01", "epoch": 0.01387} {"step": 6940, "loss": 1.7462, "grad_norm": "2.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.487e+00", "anc_loss": "1.538e+00", "dlm_acc": "4.848e-01", "anc_acc": "4.749e-01", "epoch": 0.01388} {"step": 6945, "loss": 1.1156, "grad_norm": "3.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.352e-01", "anc_acc": "5.226e-01", "epoch": 0.01389} {"step": 6950, "loss": 1.223, "grad_norm": "7.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.556e+00", "anc_loss": "1.623e+00", "dlm_acc": "4.895e-01", "anc_acc": "4.762e-01", "epoch": 0.0139} {"step": 6955, "loss": 1.0402, "grad_norm": "3.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.475e+00", "dlm_acc": "5.194e-01", "anc_acc": "5.073e-01", "epoch": 0.01391} {"step": 6960, "loss": 0.8136, "grad_norm": "2.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.922e-01", "anc_loss": "1.048e+00", "dlm_acc": "5.715e-01", "anc_acc": "5.598e-01", "epoch": 0.01392} {"step": 6965, "loss": 1.5017, "grad_norm": "7.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.470e-01", "anc_acc": "5.341e-01", "epoch": 0.01393} {"step": 6970, "loss": 1.3316, "grad_norm": "5.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.237e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.738e-01", "anc_acc": "5.619e-01", "epoch": 0.01394} {"step": 6975, "loss": 1.7388, "grad_norm": "4.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.819e+00", "anc_loss": "1.891e+00", "dlm_acc": "4.606e-01", "anc_acc": "4.501e-01", "epoch": 0.01395} {"step": 6980, "loss": 1.4112, "grad_norm": "5.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.656e+00", "anc_loss": "1.727e+00", "dlm_acc": "4.873e-01", "anc_acc": "4.748e-01", "epoch": 0.01396} {"step": 6985, "loss": 0.9581, "grad_norm": "5.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.719e-01", "anc_loss": "8.160e-01", "dlm_acc": "6.835e-01", "anc_acc": "6.737e-01", "epoch": 0.01397} {"step": 6990, "loss": 1.3635, "grad_norm": "4.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.922e-01", "anc_loss": "5.418e-01", "dlm_acc": "7.600e-01", "anc_acc": "7.464e-01", "epoch": 0.01398} {"step": 6995, "loss": 1.7035, "grad_norm": "5.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.145e+00", "dlm_acc": "5.563e-01", "anc_acc": "5.458e-01", "epoch": 0.01399} {"step": 7000, "loss": 1.8426, "grad_norm": "4.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.938e+00", "anc_loss": "2.966e+00", "dlm_acc": "2.099e-02", "anc_acc": "2.007e-02", "epoch": 0.014} {"step": 7005, "loss": 1.647, "grad_norm": "9.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.483e+00", "anc_loss": "2.528e+00", "dlm_acc": "2.325e-01", "anc_acc": "2.301e-01", "epoch": 0.01401} {"step": 7010, "loss": 1.225, "grad_norm": "4.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.192e+00", "dlm_acc": "6.176e-01", "anc_acc": "6.059e-01", "epoch": 0.01402} {"step": 7015, "loss": 2.0335, "grad_norm": "4.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.078e+00", "anc_loss": "2.140e+00", "dlm_acc": "4.164e-01", "anc_acc": "4.082e-01", "epoch": 0.01403} {"step": 7020, "loss": 1.2454, "grad_norm": "4.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.411e+00", "dlm_acc": "5.114e-01", "anc_acc": "4.979e-01", "epoch": 0.01404} {"step": 7025, "loss": 1.5995, "grad_norm": "2.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.564e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.876e-01", "anc_acc": "4.755e-01", "epoch": 0.01405} {"step": 7030, "loss": 1.2328, "grad_norm": "2.568e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.506e-01", "anc_acc": "5.377e-01", "epoch": 0.01406} {"step": 7035, "loss": 1.4469, "grad_norm": "3.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.520e+00", "dlm_acc": "4.842e-01", "anc_acc": "4.599e-01", "epoch": 0.01407} {"step": 7040, "loss": 1.5539, "grad_norm": "7.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.483e+00", "anc_loss": "1.546e+00", "dlm_acc": "4.139e-01", "anc_acc": "3.902e-01", "epoch": 0.01408} {"step": 7045, "loss": 1.7415, "grad_norm": "4.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.356e+00", "anc_loss": "2.372e+00", "dlm_acc": "6.688e-02", "anc_acc": "6.472e-02", "epoch": 0.01409} {"step": 7050, "loss": 1.5191, "grad_norm": "3.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.873e+00", "anc_loss": "1.920e+00", "dlm_acc": "3.439e-01", "anc_acc": "3.348e-01", "epoch": 0.0141} {"step": 7055, "loss": 1.3174, "grad_norm": "5.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.348e+00", "anc_loss": "2.383e+00", "dlm_acc": "2.602e-01", "anc_acc": "2.542e-01", "epoch": 0.01411} {"step": 7060, "loss": 1.4354, "grad_norm": "4.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.650e+00", "anc_loss": "2.666e+00", "dlm_acc": "9.634e-02", "anc_acc": "9.427e-02", "epoch": 0.01412} {"step": 7065, "loss": 1.1203, "grad_norm": "7.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.580e+00", "dlm_acc": "4.977e-01", "anc_acc": "4.849e-01", "epoch": 0.01413} {"step": 7070, "loss": 1.5255, "grad_norm": "4.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.546e-01", "anc_acc": "5.408e-01", "epoch": 0.01414} {"step": 7075, "loss": 1.2207, "grad_norm": "5.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.641e+00", "anc_loss": "1.694e+00", "dlm_acc": "3.368e-01", "anc_acc": "3.190e-01", "epoch": 0.01415} {"step": 7080, "loss": 1.2683, "grad_norm": "5.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.613e+00", "anc_loss": "1.670e+00", "dlm_acc": "4.538e-01", "anc_acc": "4.439e-01", "epoch": 0.01416} {"step": 7085, "loss": 0.8954, "grad_norm": "2.832e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.051e-01", "anc_loss": "8.520e-01", "dlm_acc": "6.627e-01", "anc_acc": "6.527e-01", "epoch": 0.01417} {"step": 7090, "loss": 0.9498, "grad_norm": "2.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.078e+00", "anc_loss": "1.136e+00", "dlm_acc": "5.986e-01", "anc_acc": "5.858e-01", "epoch": 0.01418} {"step": 7095, "loss": 1.8544, "grad_norm": "3.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.237e-01", "anc_acc": "5.081e-01", "epoch": 0.01419} {"step": 7100, "loss": 1.9555, "grad_norm": "6.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.072e-01", "anc_acc": "4.954e-01", "epoch": 0.0142} {"step": 7105, "loss": 1.0264, "grad_norm": "2.945e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.247e-01", "anc_acc": "5.107e-01", "epoch": 0.01421} {"step": 7110, "loss": 0.9563, "grad_norm": "3.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.253e+00", "dlm_acc": "5.235e-01", "anc_acc": "5.120e-01", "epoch": 0.01422} {"step": 7115, "loss": 0.8804, "grad_norm": "2.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.310e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.313e-01", "anc_acc": "5.202e-01", "epoch": 0.01423} {"step": 7120, "loss": 0.8044, "grad_norm": "5.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.297e-01", "anc_loss": "9.836e-01", "dlm_acc": "6.184e-01", "anc_acc": "6.081e-01", "epoch": 0.01424} {"step": 7125, "loss": 1.3242, "grad_norm": "4.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.336e-01", "anc_loss": "9.734e-01", "dlm_acc": "6.271e-01", "anc_acc": "6.192e-01", "epoch": 0.01425} {"step": 7130, "loss": 1.2441, "grad_norm": "4.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.990e-01", "anc_loss": "7.256e-01", "dlm_acc": "7.192e-01", "anc_acc": "7.159e-01", "epoch": 0.01426} {"step": 7135, "loss": 1.0854, "grad_norm": "2.305e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.766e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.043e-01", "anc_acc": "5.906e-01", "epoch": 0.01427} {"step": 7140, "loss": 0.9225, "grad_norm": "3.385e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.773e-01", "anc_loss": "9.340e-01", "dlm_acc": "5.929e-01", "anc_acc": "5.773e-01", "epoch": 0.01428} {"step": 7145, "loss": 1.6596, "grad_norm": "6.588e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.489e+00", "anc_loss": "1.511e+00", "dlm_acc": "4.733e-01", "anc_acc": "4.705e-01", "epoch": 0.01429} {"step": 7150, "loss": 1.0864, "grad_norm": "2.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.322e-01", "anc_loss": "8.689e-01", "dlm_acc": "5.907e-01", "anc_acc": "5.833e-01", "epoch": 0.0143} {"step": 7155, "loss": 1.3864, "grad_norm": "4.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.206e-01", "anc_acc": "5.057e-01", "epoch": 0.01431} {"step": 7160, "loss": 1.4208, "grad_norm": "4.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.835e-01", "anc_loss": "1.041e+00", "dlm_acc": "7.076e-01", "anc_acc": "6.988e-01", "epoch": 0.01432} {"step": 7165, "loss": 1.1392, "grad_norm": "4.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.604e-01", "anc_loss": "1.001e+00", "dlm_acc": "6.114e-01", "anc_acc": "6.022e-01", "epoch": 0.01433} {"step": 7170, "loss": 1.1887, "grad_norm": "3.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.104e+00", "dlm_acc": "4.121e-01", "anc_acc": "4.008e-01", "epoch": 0.01434} {"step": 7175, "loss": 0.9658, "grad_norm": "1.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.218e+00", "dlm_acc": "5.384e-01", "anc_acc": "5.249e-01", "epoch": 0.01435} {"step": 7180, "loss": 1.5985, "grad_norm": "3.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.484e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.245e-01", "anc_acc": "5.129e-01", "epoch": 0.01436} {"step": 7185, "loss": 1.849, "grad_norm": "4.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.916e+00", "anc_loss": "1.984e+00", "dlm_acc": "4.042e-01", "anc_acc": "3.920e-01", "epoch": 0.01437} {"step": 7190, "loss": 1.0663, "grad_norm": "3.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.707e-01", "anc_loss": "8.187e-01", "dlm_acc": "6.776e-01", "anc_acc": "6.640e-01", "epoch": 0.01438} {"step": 7195, "loss": 1.5695, "grad_norm": "5.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.266e-01", "anc_acc": "5.152e-01", "epoch": 0.01439} {"step": 7200, "loss": 1.3877, "grad_norm": "3.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.215e+00", "dlm_acc": "5.456e-01", "anc_acc": "5.359e-01", "epoch": 0.0144} {"step": 7205, "loss": 1.0349, "grad_norm": "2.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.086e-01", "anc_loss": "9.418e-01", "dlm_acc": "5.145e-01", "anc_acc": "5.068e-01", "epoch": 0.01441} {"step": 7210, "loss": 1.3804, "grad_norm": "3.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.870e+00", "anc_loss": "1.965e+00", "dlm_acc": "3.327e-01", "anc_acc": "3.295e-01", "epoch": 0.01442} {"step": 7215, "loss": 1.1163, "grad_norm": "3.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.191e+00", "dlm_acc": "4.794e-01", "anc_acc": "4.670e-01", "epoch": 0.01443} {"step": 7220, "loss": 1.1743, "grad_norm": "6.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.396e+00", "dlm_acc": "4.641e-01", "anc_acc": "4.545e-01", "epoch": 0.01444} {"step": 7225, "loss": 1.4467, "grad_norm": "1.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.165e+00", "dlm_acc": "6.071e-01", "anc_acc": "5.915e-01", "epoch": 0.01445} {"step": 7230, "loss": 1.532, "grad_norm": "3.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.661e+00", "anc_loss": "1.731e+00", "dlm_acc": "4.790e-01", "anc_acc": "4.685e-01", "epoch": 0.01446} {"step": 7235, "loss": 1.2696, "grad_norm": "5.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.328e+00", "dlm_acc": "5.156e-01", "anc_acc": "5.120e-01", "epoch": 0.01447} {"step": 7240, "loss": 1.3776, "grad_norm": "5.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.479e+00", "anc_loss": "1.542e+00", "dlm_acc": "4.787e-01", "anc_acc": "4.704e-01", "epoch": 0.01448} {"step": 7245, "loss": 1.7627, "grad_norm": "3.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.734e+00", "anc_loss": "2.784e+00", "dlm_acc": "4.403e-02", "anc_acc": "3.779e-02", "epoch": 0.01449} {"step": 7250, "loss": 1.5452, "grad_norm": "4.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.759e+00", "anc_loss": "1.805e+00", "dlm_acc": "3.998e-01", "anc_acc": "3.883e-01", "epoch": 0.0145} {"step": 7255, "loss": 1.4357, "grad_norm": "2.848e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.614e+00", "anc_loss": "1.670e+00", "dlm_acc": "4.431e-01", "anc_acc": "4.329e-01", "epoch": 0.01451} {"step": 7260, "loss": 1.257, "grad_norm": "4.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.622e+00", "anc_loss": "1.698e+00", "dlm_acc": "5.078e-01", "anc_acc": "4.982e-01", "epoch": 0.01452} {"step": 7265, "loss": 1.2824, "grad_norm": "1.726e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.037e+00", "anc_loss": "1.093e+00", "dlm_acc": "6.027e-01", "anc_acc": "5.929e-01", "epoch": 0.01453} {"step": 7270, "loss": 1.2626, "grad_norm": "2.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.624e-01", "anc_acc": "5.484e-01", "epoch": 0.01454} {"step": 7275, "loss": 1.5889, "grad_norm": "6.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.852e+00", "anc_loss": "1.915e+00", "dlm_acc": "3.755e-01", "anc_acc": "3.678e-01", "epoch": 0.01455} {"step": 7280, "loss": 1.3966, "grad_norm": "3.403e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.228e-01", "anc_acc": "5.095e-01", "epoch": 0.01456} {"step": 7285, "loss": 1.7188, "grad_norm": "3.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.301e+00", "anc_loss": "1.347e+00", "dlm_acc": "5.031e-01", "anc_acc": "4.959e-01", "epoch": 0.01457} {"step": 7290, "loss": 1.6513, "grad_norm": "6.220e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.243e+00", "dlm_acc": "5.691e-01", "anc_acc": "5.580e-01", "epoch": 0.01458} {"step": 7295, "loss": 2.0801, "grad_norm": "5.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.690e+00", "anc_loss": "1.751e+00", "dlm_acc": "5.072e-01", "anc_acc": "4.952e-01", "epoch": 0.01459} {"step": 7300, "loss": 1.7782, "grad_norm": "3.896e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.677e+00", "anc_loss": "1.748e+00", "dlm_acc": "4.639e-01", "anc_acc": "4.516e-01", "epoch": 0.0146} {"step": 7305, "loss": 1.3124, "grad_norm": "3.537e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.315e-01", "anc_acc": "5.229e-01", "epoch": 0.01461} {"step": 7310, "loss": 1.2991, "grad_norm": "3.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.543e-01", "anc_loss": "1.029e+00", "dlm_acc": "6.671e-01", "anc_acc": "6.514e-01", "epoch": 0.01462} {"step": 7315, "loss": 1.3147, "grad_norm": "3.908e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.527e+00", "dlm_acc": "4.189e-01", "anc_acc": "4.069e-01", "epoch": 0.01463} {"step": 7320, "loss": 1.3888, "grad_norm": "3.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.961e-01", "anc_loss": "9.621e-01", "dlm_acc": "6.652e-01", "anc_acc": "6.508e-01", "epoch": 0.01464} {"step": 7325, "loss": 1.531, "grad_norm": "6.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.891e-01", "anc_acc": "5.700e-01", "epoch": 0.01465} {"step": 7330, "loss": 1.302, "grad_norm": "4.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.586e-01", "anc_loss": "1.009e+00", "dlm_acc": "5.868e-01", "anc_acc": "5.717e-01", "epoch": 0.01466} {"step": 7335, "loss": 1.4012, "grad_norm": "1.087e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.028e+00", "anc_loss": "1.076e+00", "dlm_acc": "5.530e-01", "anc_acc": "5.421e-01", "epoch": 0.01467} {"step": 7340, "loss": 1.2361, "grad_norm": "4.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.727e-01", "anc_loss": "6.996e-01", "dlm_acc": "6.015e-01", "anc_acc": "5.947e-01", "epoch": 0.01468} {"step": 7345, "loss": 1.6061, "grad_norm": "3.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.364e-01", "anc_acc": "5.241e-01", "epoch": 0.01469} {"step": 7350, "loss": 1.2255, "grad_norm": "3.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.227e-01", "anc_acc": "6.092e-01", "epoch": 0.0147} {"step": 7355, "loss": 1.4768, "grad_norm": "6.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e+00", "anc_loss": "1.463e+00", "dlm_acc": "5.378e-01", "anc_acc": "5.256e-01", "epoch": 0.01471} {"step": 7360, "loss": 1.2548, "grad_norm": "2.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.615e+00", "anc_loss": "1.676e+00", "dlm_acc": "4.604e-01", "anc_acc": "4.482e-01", "epoch": 0.01472} {"step": 7365, "loss": 1.1985, "grad_norm": "5.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.199e+00", "dlm_acc": "5.401e-01", "anc_acc": "5.326e-01", "epoch": 0.01473} {"step": 7370, "loss": 1.3968, "grad_norm": "5.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.425e-01", "anc_acc": "5.361e-01", "epoch": 0.01474} {"step": 7375, "loss": 1.2359, "grad_norm": "3.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.196e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.272e-01", "anc_acc": "5.137e-01", "epoch": 0.01475} {"step": 7380, "loss": 1.0042, "grad_norm": "1.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.601e-01", "anc_loss": "2.743e-01", "dlm_acc": "8.750e-01", "anc_acc": "8.703e-01", "epoch": 0.01476} {"step": 7385, "loss": 1.3475, "grad_norm": "2.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.123e+00", "dlm_acc": "6.048e-01", "anc_acc": "5.939e-01", "epoch": 0.01477} {"step": 7390, "loss": 1.5838, "grad_norm": "2.804e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.156e+00", "dlm_acc": "6.023e-01", "anc_acc": "5.872e-01", "epoch": 0.01478} {"step": 7395, "loss": 1.7745, "grad_norm": "3.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.598e-01", "anc_loss": "7.973e-01", "dlm_acc": "6.249e-01", "anc_acc": "6.104e-01", "epoch": 0.01479} {"step": 7400, "loss": 0.9898, "grad_norm": "2.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.719e-01", "anc_loss": "7.008e-01", "dlm_acc": "6.220e-01", "anc_acc": "6.099e-01", "epoch": 0.0148} {"step": 7405, "loss": 0.609, "grad_norm": "4.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.318e-01", "anc_loss": "4.520e-01", "dlm_acc": "6.843e-01", "anc_acc": "6.736e-01", "epoch": 0.01481} {"step": 7410, "loss": 1.5026, "grad_norm": "4.884e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.542e+00", "anc_loss": "1.593e+00", "dlm_acc": "4.965e-01", "anc_acc": "4.884e-01", "epoch": 0.01482} {"step": 7415, "loss": 1.287, "grad_norm": "6.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.262e-01", "anc_loss": "6.367e-01", "dlm_acc": "5.999e-01", "anc_acc": "5.966e-01", "epoch": 0.01483} {"step": 7420, "loss": 1.289, "grad_norm": "4.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.797e-01", "anc_loss": "1.013e+00", "dlm_acc": "5.318e-01", "anc_acc": "5.264e-01", "epoch": 0.01484} {"step": 7425, "loss": 1.1531, "grad_norm": "3.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.750e-01", "anc_loss": "6.797e-01", "dlm_acc": "5.557e-01", "anc_acc": "5.543e-01", "epoch": 0.01485} {"step": 7430, "loss": 1.3139, "grad_norm": "1.430e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.016e-01", "anc_loss": "7.063e-01", "dlm_acc": "5.435e-01", "anc_acc": "5.416e-01", "epoch": 0.01486} {"step": 7435, "loss": 1.6877, "grad_norm": "8.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.016e-01", "anc_loss": "7.055e-01", "dlm_acc": "5.461e-01", "anc_acc": "5.436e-01", "epoch": 0.01487} {"step": 7440, "loss": 1.6832, "grad_norm": "4.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.648e-01", "anc_loss": "6.695e-01", "dlm_acc": "5.432e-01", "anc_acc": "5.439e-01", "epoch": 0.01488} {"step": 7445, "loss": 1.365, "grad_norm": "3.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.172e-01", "anc_loss": "7.211e-01", "dlm_acc": "5.446e-01", "anc_acc": "5.438e-01", "epoch": 0.01489} {"step": 7450, "loss": 1.1809, "grad_norm": "1.042e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.711e-01", "anc_loss": "6.750e-01", "dlm_acc": "5.520e-01", "anc_acc": "5.516e-01", "epoch": 0.0149} {"step": 7455, "loss": 1.4716, "grad_norm": "3.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.136e+00", "dlm_acc": "5.517e-01", "anc_acc": "5.448e-01", "epoch": 0.01491} {"step": 7460, "loss": 1.3394, "grad_norm": "5.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.435e-01", "anc_acc": "5.312e-01", "epoch": 0.01492} {"step": 7465, "loss": 1.0964, "grad_norm": "6.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.310e+00", "dlm_acc": "5.718e-01", "anc_acc": "5.605e-01", "epoch": 0.01493} {"step": 7470, "loss": 1.3467, "grad_norm": "4.716e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.094e+00", "dlm_acc": "3.918e-01", "anc_acc": "3.865e-01", "epoch": 0.01494} {"step": 7475, "loss": 1.0902, "grad_norm": "3.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.797e-01", "anc_loss": "1.012e+00", "dlm_acc": "4.582e-01", "anc_acc": "4.542e-01", "epoch": 0.01495} {"step": 7480, "loss": 1.1657, "grad_norm": "2.511e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.152e-01", "anc_loss": "5.375e-01", "dlm_acc": "6.348e-01", "anc_acc": "6.187e-01", "epoch": 0.01496} {"step": 7485, "loss": 1.0895, "grad_norm": "1.847e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.660e-01", "anc_loss": "9.008e-01", "dlm_acc": "5.447e-01", "anc_acc": "5.344e-01", "epoch": 0.01497} {"step": 7490, "loss": 1.5676, "grad_norm": "2.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.891e-01", "anc_loss": "8.141e-01", "dlm_acc": "5.405e-01", "anc_acc": "5.304e-01", "epoch": 0.01498} {"step": 7495, "loss": 1.04, "grad_norm": "2.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.609e-01", "anc_loss": "7.977e-01", "dlm_acc": "5.363e-01", "anc_acc": "5.232e-01", "epoch": 0.01499} {"step": 7500, "loss": 1.6555, "grad_norm": "9.362e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.381e-01", "anc_loss": "9.836e-01", "dlm_acc": "5.780e-01", "anc_acc": "5.677e-01", "epoch": 0.015} {"step": 7505, "loss": 1.4108, "grad_norm": "4.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.949e-01", "anc_loss": "8.320e-01", "dlm_acc": "6.245e-01", "anc_acc": "6.158e-01", "epoch": 0.01501} {"step": 7510, "loss": 0.9124, "grad_norm": "2.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.102e-01", "anc_loss": "9.516e-01", "dlm_acc": "5.470e-01", "anc_acc": "5.354e-01", "epoch": 0.01502} {"step": 7515, "loss": 1.2385, "grad_norm": "5.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.238e-01", "anc_loss": "9.602e-01", "dlm_acc": "6.062e-01", "anc_acc": "5.971e-01", "epoch": 0.01503} {"step": 7520, "loss": 1.5343, "grad_norm": "4.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.334e+00", "dlm_acc": "6.005e-01", "anc_acc": "5.871e-01", "epoch": 0.01504} {"step": 7525, "loss": 1.6213, "grad_norm": "2.518e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.368e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.244e-01", "anc_acc": "5.127e-01", "epoch": 0.01505} {"step": 7530, "loss": 1.2575, "grad_norm": "5.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.184e+00", "dlm_acc": "5.777e-01", "anc_acc": "5.666e-01", "epoch": 0.01506} {"step": 7535, "loss": 1.3018, "grad_norm": "6.141e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.991e-01", "anc_loss": "1.034e+00", "dlm_acc": "6.017e-01", "anc_acc": "5.942e-01", "epoch": 0.01507} {"step": 7540, "loss": 0.9922, "grad_norm": "4.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.168e-01", "anc_loss": "6.262e-01", "dlm_acc": "6.427e-01", "anc_acc": "6.394e-01", "epoch": 0.01508} {"step": 7545, "loss": 0.8329, "grad_norm": "3.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.427e-01", "anc_loss": "4.467e-01", "dlm_acc": "6.746e-01", "anc_acc": "6.726e-01", "epoch": 0.01509} {"step": 7550, "loss": 1.7866, "grad_norm": "4.856e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.515e+00", "anc_loss": "1.569e+00", "dlm_acc": "5.255e-01", "anc_acc": "5.163e-01", "epoch": 0.0151} {"step": 7555, "loss": 1.5049, "grad_norm": "2.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.324e+00", "dlm_acc": "5.885e-01", "anc_acc": "5.755e-01", "epoch": 0.01511} {"step": 7560, "loss": 1.1629, "grad_norm": "4.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.965e-01", "anc_loss": "1.048e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.636e-01", "epoch": 0.01512} {"step": 7565, "loss": 1.0749, "grad_norm": "2.785e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.699e-01", "anc_loss": "9.211e-01", "dlm_acc": "5.876e-01", "anc_acc": "5.747e-01", "epoch": 0.01513} {"step": 7570, "loss": 1.2308, "grad_norm": "2.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.820e-01", "anc_loss": "1.015e+00", "dlm_acc": "5.661e-01", "anc_acc": "5.561e-01", "epoch": 0.01514} {"step": 7575, "loss": 1.089, "grad_norm": "2.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.117e-01", "anc_loss": "7.398e-01", "dlm_acc": "5.821e-01", "anc_acc": "5.738e-01", "epoch": 0.01515} {"step": 7580, "loss": 1.3581, "grad_norm": "3.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.973e-01", "anc_loss": "9.437e-01", "dlm_acc": "6.515e-01", "anc_acc": "6.397e-01", "epoch": 0.01516} {"step": 7585, "loss": 2.0306, "grad_norm": "3.331e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.709e+00", "anc_loss": "1.789e+00", "dlm_acc": "4.767e-01", "anc_acc": "4.644e-01", "epoch": 0.01517} {"step": 7590, "loss": 1.3757, "grad_norm": "3.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.520e-01", "anc_loss": "7.816e-01", "dlm_acc": "6.212e-01", "anc_acc": "6.130e-01", "epoch": 0.01518} {"step": 7595, "loss": 1.9664, "grad_norm": "2.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.393e+00", "anc_loss": "1.451e+00", "dlm_acc": "5.409e-01", "anc_acc": "5.296e-01", "epoch": 0.01519} {"step": 7600, "loss": 1.2706, "grad_norm": "3.576e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.367e+00", "anc_loss": "1.418e+00", "dlm_acc": "4.902e-01", "anc_acc": "4.796e-01", "epoch": 0.0152} {"step": 7605, "loss": 1.2244, "grad_norm": "3.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.249e+00", "dlm_acc": "5.185e-01", "anc_acc": "5.065e-01", "epoch": 0.01521} {"step": 7610, "loss": 1.1449, "grad_norm": "3.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.031e+00", "anc_loss": "1.099e+00", "dlm_acc": "6.046e-01", "anc_acc": "5.877e-01", "epoch": 0.01522} {"step": 7615, "loss": 1.3009, "grad_norm": "3.351e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.000e-01", "anc_loss": "9.422e-01", "dlm_acc": "5.521e-01", "anc_acc": "5.405e-01", "epoch": 0.01523} {"step": 7620, "loss": 1.5162, "grad_norm": "4.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.497e+00", "anc_loss": "1.531e+00", "dlm_acc": "4.016e-01", "anc_acc": "3.927e-01", "epoch": 0.01524} {"step": 7625, "loss": 1.5638, "grad_norm": "1.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.463e+00", "anc_loss": "1.523e+00", "dlm_acc": "4.819e-01", "anc_acc": "4.710e-01", "epoch": 0.01525} {"step": 7630, "loss": 1.5582, "grad_norm": "3.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.237e+00", "dlm_acc": "5.404e-01", "anc_acc": "5.282e-01", "epoch": 0.01526} {"step": 7635, "loss": 1.3199, "grad_norm": "2.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.980e-01", "anc_loss": "9.592e-01", "dlm_acc": "6.114e-01", "anc_acc": "5.946e-01", "epoch": 0.01527} {"step": 7640, "loss": 1.4796, "grad_norm": "3.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.852e-01", "anc_loss": "1.047e+00", "dlm_acc": "5.584e-01", "anc_acc": "5.416e-01", "epoch": 0.01528} {"step": 7645, "loss": 1.824, "grad_norm": "3.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.512e-01", "epoch": 0.01529} {"step": 7650, "loss": 1.6494, "grad_norm": "5.879e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.973e+00", "anc_loss": "2.061e+00", "dlm_acc": "4.079e-01", "anc_acc": "3.957e-01", "epoch": 0.0153} {"step": 7655, "loss": 0.9781, "grad_norm": "7.698e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.695e-01", "anc_loss": "7.031e-01", "dlm_acc": "6.294e-01", "anc_acc": "6.173e-01", "epoch": 0.01531} {"step": 7660, "loss": 1.3732, "grad_norm": "4.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.800e+00", "anc_loss": "1.877e+00", "dlm_acc": "4.600e-01", "anc_acc": "4.474e-01", "epoch": 0.01532} {"step": 7665, "loss": 1.2456, "grad_norm": "1.225e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.080e-01", "anc_acc": "4.969e-01", "epoch": 0.01533} {"step": 7670, "loss": 1.6788, "grad_norm": "7.758e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.392e+00", "anc_loss": "2.420e+00", "dlm_acc": "1.922e-01", "anc_acc": "1.865e-01", "epoch": 0.01534} {"step": 7675, "loss": 1.2053, "grad_norm": "7.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.193e+00", "dlm_acc": "5.406e-01", "anc_acc": "5.257e-01", "epoch": 0.01535} {"step": 7680, "loss": 1.3744, "grad_norm": "3.563e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.181e+00", "anc_loss": "1.255e+00", "dlm_acc": "6.668e-01", "anc_acc": "6.541e-01", "epoch": 0.01536} {"step": 7685, "loss": 1.2471, "grad_norm": "5.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.411e+00", "dlm_acc": "5.330e-01", "anc_acc": "5.233e-01", "epoch": 0.01537} {"step": 7690, "loss": 1.3923, "grad_norm": "2.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.211e+00", "dlm_acc": "5.533e-01", "anc_acc": "5.405e-01", "epoch": 0.01538} {"step": 7695, "loss": 1.187, "grad_norm": "3.315e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.936e-01", "anc_loss": "9.359e-01", "dlm_acc": "6.473e-01", "anc_acc": "6.382e-01", "epoch": 0.01539} {"step": 7700, "loss": 1.0642, "grad_norm": "3.034e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.043e-01", "anc_loss": "7.461e-01", "dlm_acc": "7.014e-01", "anc_acc": "6.945e-01", "epoch": 0.0154} {"step": 7705, "loss": 1.4514, "grad_norm": "7.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.167e+00", "dlm_acc": "6.127e-01", "anc_acc": "6.008e-01", "epoch": 0.01541} {"step": 7710, "loss": 1.1877, "grad_norm": "2.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.517e+00", "anc_loss": "1.592e+00", "dlm_acc": "4.745e-01", "anc_acc": "4.608e-01", "epoch": 0.01542} {"step": 7715, "loss": 0.8864, "grad_norm": "6.239e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.104e+00", "dlm_acc": "5.767e-01", "anc_acc": "5.639e-01", "epoch": 0.01543} {"step": 7720, "loss": 0.9776, "grad_norm": "3.161e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.125e-01", "anc_loss": "9.602e-01", "dlm_acc": "6.318e-01", "anc_acc": "6.201e-01", "epoch": 0.01544} {"step": 7725, "loss": 1.1195, "grad_norm": "6.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.186e+00", "anc_loss": "1.243e+00", "dlm_acc": "5.688e-01", "anc_acc": "5.592e-01", "epoch": 0.01545} {"step": 7730, "loss": 1.0121, "grad_norm": "3.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.587e+00", "anc_loss": "1.637e+00", "dlm_acc": "4.441e-01", "anc_acc": "4.337e-01", "epoch": 0.01546} {"step": 7735, "loss": 0.9359, "grad_norm": "3.899e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.910e-01", "anc_loss": "7.422e-01", "dlm_acc": "6.941e-01", "anc_acc": "6.814e-01", "epoch": 0.01547} {"step": 7740, "loss": 0.9373, "grad_norm": "3.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.279e+00", "dlm_acc": "5.197e-01", "anc_acc": "5.036e-01", "epoch": 0.01548} {"step": 7745, "loss": 1.0895, "grad_norm": "3.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.504e+00", "anc_loss": "1.561e+00", "dlm_acc": "4.888e-01", "anc_acc": "4.762e-01", "epoch": 0.01549} {"step": 7750, "loss": 1.2095, "grad_norm": "3.039e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.575e+00", "dlm_acc": "5.027e-01", "anc_acc": "4.911e-01", "epoch": 0.0155} {"step": 7755, "loss": 1.1377, "grad_norm": "7.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.704e+00", "anc_loss": "1.757e+00", "dlm_acc": "3.937e-01", "anc_acc": "3.843e-01", "epoch": 0.01551} {"step": 7760, "loss": 1.5884, "grad_norm": "3.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.933e+00", "anc_loss": "1.994e+00", "dlm_acc": "3.530e-01", "anc_acc": "3.433e-01", "epoch": 0.01552} {"step": 7765, "loss": 1.305, "grad_norm": "4.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.682e+00", "anc_loss": "1.766e+00", "dlm_acc": "4.678e-01", "anc_acc": "4.523e-01", "epoch": 0.01553} {"step": 7770, "loss": 0.9933, "grad_norm": "4.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.192e+00", "dlm_acc": "5.238e-01", "anc_acc": "5.103e-01", "epoch": 0.01554} {"step": 7775, "loss": 1.0806, "grad_norm": "5.238e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.581e+00", "anc_loss": "1.647e+00", "dlm_acc": "4.902e-01", "anc_acc": "4.767e-01", "epoch": 0.01555} {"step": 7780, "loss": 0.7823, "grad_norm": "2.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.326e-01", "anc_acc": "5.189e-01", "epoch": 0.01556} {"step": 7785, "loss": 1.0692, "grad_norm": "3.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.575e+00", "dlm_acc": "5.069e-01", "anc_acc": "4.945e-01", "epoch": 0.01557} {"step": 7790, "loss": 0.8588, "grad_norm": "4.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.914e-01", "anc_loss": "1.029e+00", "dlm_acc": "5.590e-01", "anc_acc": "5.492e-01", "epoch": 0.01558} {"step": 7795, "loss": 1.1842, "grad_norm": "4.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.780e+00", "anc_loss": "1.852e+00", "dlm_acc": "4.257e-01", "anc_acc": "4.153e-01", "epoch": 0.01559} {"step": 7800, "loss": 1.1331, "grad_norm": "4.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.533e-01", "anc_acc": "5.389e-01", "epoch": 0.0156} {"step": 7805, "loss": 1.0152, "grad_norm": "3.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.105e+00", "dlm_acc": "5.106e-01", "anc_acc": "4.912e-01", "epoch": 0.01561} {"step": 7810, "loss": 1.2101, "grad_norm": "3.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.720e+00", "anc_loss": "1.794e+00", "dlm_acc": "4.616e-01", "anc_acc": "4.468e-01", "epoch": 0.01562} {"step": 7815, "loss": 0.72, "grad_norm": "3.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.594e-01", "anc_loss": "7.879e-01", "dlm_acc": "5.866e-01", "anc_acc": "5.731e-01", "epoch": 0.01563} {"step": 7820, "loss": 0.8702, "grad_norm": "4.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.087e+00", "dlm_acc": "5.936e-01", "anc_acc": "5.821e-01", "epoch": 0.01564} {"step": 7825, "loss": 0.9208, "grad_norm": "1.884e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.125e-01", "anc_loss": "9.656e-01", "dlm_acc": "6.234e-01", "anc_acc": "6.129e-01", "epoch": 0.01565} {"step": 7830, "loss": 0.4771, "grad_norm": "4.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.950e-01", "anc_loss": "4.253e-01", "dlm_acc": "7.548e-01", "anc_acc": "7.452e-01", "epoch": 0.01566} {"step": 7835, "loss": 1.0827, "grad_norm": "4.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.961e-01", "anc_loss": "5.109e-01", "dlm_acc": "6.476e-01", "anc_acc": "6.385e-01", "epoch": 0.01567} {"step": 7840, "loss": 1.0451, "grad_norm": "5.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.988e-01", "anc_loss": "6.133e-01", "dlm_acc": "5.879e-01", "anc_acc": "5.829e-01", "epoch": 0.01568} {"step": 7845, "loss": 0.9955, "grad_norm": "1.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.449e-01", "anc_loss": "8.725e-01", "dlm_acc": "5.994e-01", "anc_acc": "5.921e-01", "epoch": 0.01569} {"step": 7850, "loss": 0.8338, "grad_norm": "3.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.973e-01", "anc_loss": "9.453e-01", "dlm_acc": "6.834e-01", "anc_acc": "6.755e-01", "epoch": 0.0157} {"step": 7855, "loss": 1.1635, "grad_norm": "3.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.596e-01", "anc_loss": "1.004e+00", "dlm_acc": "6.624e-01", "anc_acc": "6.513e-01", "epoch": 0.01571} {"step": 7860, "loss": 1.1284, "grad_norm": "3.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.428e-01", "anc_loss": "9.949e-01", "dlm_acc": "6.633e-01", "anc_acc": "6.516e-01", "epoch": 0.01572} {"step": 7865, "loss": 1.2023, "grad_norm": "5.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.178e-01", "anc_loss": "2.282e-01", "dlm_acc": "8.930e-01", "anc_acc": "8.898e-01", "epoch": 0.01573} {"step": 7870, "loss": 1.1781, "grad_norm": "4.880e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.836e-01", "anc_loss": "8.221e-01", "dlm_acc": "7.564e-01", "anc_acc": "7.487e-01", "epoch": 0.01574} {"step": 7875, "loss": 1.4223, "grad_norm": "8.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.191e+00", "dlm_acc": "4.210e-01", "anc_acc": "4.114e-01", "epoch": 0.01575} {"step": 7880, "loss": 1.2137, "grad_norm": "1.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.883e-01", "anc_loss": "9.180e-01", "dlm_acc": "5.803e-01", "anc_acc": "5.734e-01", "epoch": 0.01576} {"step": 7885, "loss": 1.2319, "grad_norm": "5.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.477e-01", "anc_loss": "7.068e-01", "dlm_acc": "7.529e-01", "anc_acc": "7.374e-01", "epoch": 0.01577} {"step": 7890, "loss": 1.1973, "grad_norm": "2.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.188e+00", "dlm_acc": "5.876e-01", "anc_acc": "5.781e-01", "epoch": 0.01578} {"step": 7895, "loss": 0.7555, "grad_norm": "3.473e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.668e-01", "anc_loss": "4.922e-01", "dlm_acc": "7.801e-01", "anc_acc": "7.712e-01", "epoch": 0.01579} {"step": 7900, "loss": 1.1649, "grad_norm": "2.875e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.068e+00", "dlm_acc": "6.583e-01", "anc_acc": "6.510e-01", "epoch": 0.0158} {"step": 7905, "loss": 0.8407, "grad_norm": "8.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.040e-01", "anc_loss": "8.465e-01", "dlm_acc": "7.142e-01", "anc_acc": "7.063e-01", "epoch": 0.01581} {"step": 7910, "loss": 1.0157, "grad_norm": "2.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.441e-01", "anc_loss": "9.855e-01", "dlm_acc": "6.270e-01", "anc_acc": "6.179e-01", "epoch": 0.01582} {"step": 7915, "loss": 1.3265, "grad_norm": "4.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.552e+00", "anc_loss": "1.621e+00", "dlm_acc": "5.686e-01", "anc_acc": "5.568e-01", "epoch": 0.01583} {"step": 7920, "loss": 1.1175, "grad_norm": "3.732e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.447e-01", "epoch": 0.01584} {"step": 7925, "loss": 1.1862, "grad_norm": "3.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.980e-01", "anc_loss": "8.538e-01", "dlm_acc": "7.342e-01", "anc_acc": "7.222e-01", "epoch": 0.01585} {"step": 7930, "loss": 1.2855, "grad_norm": "6.104e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.193e+00", "dlm_acc": "5.117e-01", "anc_acc": "5.051e-01", "epoch": 0.01586} {"step": 7935, "loss": 1.1262, "grad_norm": "5.712e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.398e-01", "anc_loss": "7.762e-01", "dlm_acc": "7.242e-01", "anc_acc": "7.134e-01", "epoch": 0.01587} {"step": 7940, "loss": 0.8974, "grad_norm": "3.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.117e-01", "anc_loss": "9.629e-01", "dlm_acc": "6.580e-01", "anc_acc": "6.461e-01", "epoch": 0.01588} {"step": 7945, "loss": 1.2193, "grad_norm": "6.325e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.097e+00", "anc_loss": "1.150e+00", "dlm_acc": "5.892e-01", "anc_acc": "5.779e-01", "epoch": 0.01589} {"step": 7950, "loss": 1.0566, "grad_norm": "3.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.185e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.916e-01", "epoch": 0.0159} {"step": 7955, "loss": 1.1321, "grad_norm": "3.059e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.680e-01", "anc_loss": "9.367e-01", "dlm_acc": "6.593e-01", "anc_acc": "6.423e-01", "epoch": 0.01591} {"step": 7960, "loss": 1.2122, "grad_norm": "3.632e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.233e+00", "dlm_acc": "6.160e-01", "anc_acc": "6.052e-01", "epoch": 0.01592} {"step": 7965, "loss": 1.0382, "grad_norm": "3.759e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.736e-01", "anc_loss": "7.090e-01", "dlm_acc": "7.198e-01", "anc_acc": "7.135e-01", "epoch": 0.01593} {"step": 7970, "loss": 1.0271, "grad_norm": "2.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.820e-01", "anc_loss": "1.031e+00", "dlm_acc": "6.055e-01", "anc_acc": "5.953e-01", "epoch": 0.01594} {"step": 7975, "loss": 1.3391, "grad_norm": "4.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.786e-01", "anc_loss": "9.236e-01", "dlm_acc": "6.783e-01", "anc_acc": "6.666e-01", "epoch": 0.01595} {"step": 7980, "loss": 1.1062, "grad_norm": "4.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.845e-01", "anc_loss": "9.214e-01", "dlm_acc": "6.258e-01", "anc_acc": "6.181e-01", "epoch": 0.01596} {"step": 7985, "loss": 0.8938, "grad_norm": "4.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.770e-01", "anc_loss": "7.008e-01", "dlm_acc": "5.748e-01", "anc_acc": "5.680e-01", "epoch": 0.01597} {"step": 7990, "loss": 1.1575, "grad_norm": "1.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.164e+00", "dlm_acc": "6.102e-01", "anc_acc": "5.979e-01", "epoch": 0.01598} {"step": 7995, "loss": 1.2149, "grad_norm": "2.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.546e+00", "dlm_acc": "4.440e-01", "anc_acc": "4.360e-01", "epoch": 0.01599} {"step": 8000, "loss": 0.824, "grad_norm": "2.523e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.212e-01", "anc_loss": "5.555e-01", "dlm_acc": "7.933e-01", "anc_acc": "7.850e-01", "epoch": 0.016} {"step": 8005, "loss": 1.0436, "grad_norm": "4.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.836e-01", "anc_loss": "9.258e-01", "dlm_acc": "5.832e-01", "anc_acc": "5.740e-01", "epoch": 0.01601} {"step": 8010, "loss": 1.1293, "grad_norm": "3.830e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.859e-01", "anc_loss": "1.034e+00", "dlm_acc": "5.773e-01", "anc_acc": "5.693e-01", "epoch": 0.01602} {"step": 8015, "loss": 0.9962, "grad_norm": "2.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.128e+00", "dlm_acc": "6.218e-01", "anc_acc": "6.125e-01", "epoch": 0.01603} {"step": 8020, "loss": 1.7496, "grad_norm": "6.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.061e+00", "anc_loss": "2.122e+00", "dlm_acc": "4.264e-01", "anc_acc": "4.179e-01", "epoch": 0.01604} {"step": 8025, "loss": 1.4143, "grad_norm": "3.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.261e+00", "dlm_acc": "5.795e-01", "anc_acc": "5.686e-01", "epoch": 0.01605} {"step": 8030, "loss": 1.471, "grad_norm": "2.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.479e+00", "dlm_acc": "5.645e-01", "anc_acc": "5.542e-01", "epoch": 0.01606} {"step": 8035, "loss": 1.5818, "grad_norm": "5.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.615e+00", "dlm_acc": "5.297e-01", "anc_acc": "5.176e-01", "epoch": 0.01607} {"step": 8040, "loss": 1.1592, "grad_norm": "3.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.567e-01", "anc_acc": "5.431e-01", "epoch": 0.01608} {"step": 8045, "loss": 1.3688, "grad_norm": "3.508e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.444e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.265e-01", "anc_acc": "5.119e-01", "epoch": 0.01609} {"step": 8050, "loss": 1.5472, "grad_norm": "3.478e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.866e+00", "anc_loss": "1.931e+00", "dlm_acc": "4.524e-01", "anc_acc": "4.407e-01", "epoch": 0.0161} {"step": 8055, "loss": 1.6666, "grad_norm": "8.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.794e+00", "anc_loss": "1.870e+00", "dlm_acc": "4.940e-01", "anc_acc": "4.825e-01", "epoch": 0.01611} {"step": 8060, "loss": 1.188, "grad_norm": "3.255e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.418e-01", "anc_acc": "5.299e-01", "epoch": 0.01612} {"step": 8065, "loss": 1.0523, "grad_norm": "2.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.732e+00", "anc_loss": "1.848e+00", "dlm_acc": "4.844e-01", "anc_acc": "4.663e-01", "epoch": 0.01613} {"step": 8070, "loss": 1.1219, "grad_norm": "3.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.565e+00", "anc_loss": "1.634e+00", "dlm_acc": "5.084e-01", "anc_acc": "4.953e-01", "epoch": 0.01614} {"step": 8075, "loss": 1.3698, "grad_norm": "1.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.582e+00", "anc_loss": "1.648e+00", "dlm_acc": "5.221e-01", "anc_acc": "5.097e-01", "epoch": 0.01615} {"step": 8080, "loss": 1.3996, "grad_norm": "3.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.728e+00", "anc_loss": "1.800e+00", "dlm_acc": "4.901e-01", "anc_acc": "4.787e-01", "epoch": 0.01616} {"step": 8085, "loss": 1.5614, "grad_norm": "3.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.625e+00", "dlm_acc": "4.869e-01", "anc_acc": "4.748e-01", "epoch": 0.01617} {"step": 8090, "loss": 1.4363, "grad_norm": "6.186e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.689e-01", "anc_acc": "5.573e-01", "epoch": 0.01618} {"step": 8095, "loss": 1.3139, "grad_norm": "3.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.432e-01", "anc_acc": "5.276e-01", "epoch": 0.01619} {"step": 8100, "loss": 1.5391, "grad_norm": "6.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.178e+00", "dlm_acc": "5.974e-01", "anc_acc": "5.830e-01", "epoch": 0.0162} {"step": 8105, "loss": 1.4021, "grad_norm": "3.211e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.066e-01", "anc_loss": "8.617e-01", "dlm_acc": "6.600e-01", "anc_acc": "6.446e-01", "epoch": 0.01621} {"step": 8110, "loss": 1.2606, "grad_norm": "2.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.703e-01", "anc_loss": "8.441e-01", "dlm_acc": "7.217e-01", "anc_acc": "7.034e-01", "epoch": 0.01622} {"step": 8115, "loss": 1.5066, "grad_norm": "2.347e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.097e+00", "dlm_acc": "6.446e-01", "anc_acc": "6.297e-01", "epoch": 0.01623} {"step": 8120, "loss": 1.0871, "grad_norm": "2.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.484e-01", "anc_loss": "9.113e-01", "dlm_acc": "6.754e-01", "anc_acc": "6.587e-01", "epoch": 0.01624} {"step": 8125, "loss": 1.3464, "grad_norm": "5.353e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.015e-01", "anc_acc": "5.866e-01", "epoch": 0.01625} {"step": 8130, "loss": 1.3375, "grad_norm": "2.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.079e+00", "anc_loss": "1.143e+00", "dlm_acc": "6.219e-01", "anc_acc": "6.070e-01", "epoch": 0.01626} {"step": 8135, "loss": 1.7064, "grad_norm": "3.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.511e+00", "dlm_acc": "5.349e-01", "anc_acc": "5.213e-01", "epoch": 0.01627} {"step": 8140, "loss": 1.4396, "grad_norm": "2.690e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.075e+00", "dlm_acc": "6.352e-01", "anc_acc": "6.221e-01", "epoch": 0.01628} {"step": 8145, "loss": 1.4281, "grad_norm": "2.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.316e+00", "dlm_acc": "6.093e-01", "anc_acc": "5.944e-01", "epoch": 0.01629} {"step": 8150, "loss": 1.2676, "grad_norm": "2.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.469e-01", "epoch": 0.0163} {"step": 8155, "loss": 1.3095, "grad_norm": "2.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.157e+00", "dlm_acc": "6.122e-01", "anc_acc": "5.990e-01", "epoch": 0.01631} {"step": 8160, "loss": 1.6947, "grad_norm": "7.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.723e+00", "anc_loss": "1.788e+00", "dlm_acc": "4.753e-01", "anc_acc": "4.649e-01", "epoch": 0.01632} {"step": 8165, "loss": 1.8854, "grad_norm": "5.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.808e+00", "anc_loss": "1.880e+00", "dlm_acc": "4.496e-01", "anc_acc": "4.385e-01", "epoch": 0.01633} {"step": 8170, "loss": 1.6623, "grad_norm": "4.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.087e+00", "dlm_acc": "6.258e-01", "anc_acc": "6.159e-01", "epoch": 0.01634} {"step": 8175, "loss": 1.4836, "grad_norm": "1.580e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.137e-01", "anc_acc": "4.998e-01", "epoch": 0.01635} {"step": 8180, "loss": 1.5304, "grad_norm": "4.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.798e+00", "anc_loss": "1.867e+00", "dlm_acc": "3.871e-01", "anc_acc": "3.740e-01", "epoch": 0.01636} {"step": 8185, "loss": 1.3181, "grad_norm": "3.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.196e+00", "dlm_acc": "5.650e-01", "anc_acc": "5.418e-01", "epoch": 0.01637} {"step": 8190, "loss": 1.3291, "grad_norm": "3.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.068e+00", "anc_loss": "1.124e+00", "dlm_acc": "5.968e-01", "anc_acc": "5.845e-01", "epoch": 0.01638} {"step": 8195, "loss": 1.1515, "grad_norm": "3.202e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.158e+00", "dlm_acc": "6.097e-01", "anc_acc": "5.956e-01", "epoch": 0.01639} {"step": 8200, "loss": 1.7166, "grad_norm": "4.619e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.626e+00", "anc_loss": "1.700e+00", "dlm_acc": "4.460e-01", "anc_acc": "4.332e-01", "epoch": 0.0164} {"step": 8205, "loss": 1.7715, "grad_norm": "3.257e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.694e+00", "anc_loss": "1.753e+00", "dlm_acc": "4.565e-01", "anc_acc": "4.450e-01", "epoch": 0.01641} {"step": 8210, "loss": 1.6853, "grad_norm": "3.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.481e+00", "anc_loss": "1.542e+00", "dlm_acc": "5.084e-01", "anc_acc": "5.013e-01", "epoch": 0.01642} {"step": 8215, "loss": 1.0563, "grad_norm": "1.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.914e-01", "anc_loss": "9.508e-01", "dlm_acc": "5.725e-01", "anc_acc": "5.531e-01", "epoch": 0.01643} {"step": 8220, "loss": 1.341, "grad_norm": "3.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.333e-01", "epoch": 0.01644} {"step": 8225, "loss": 0.9962, "grad_norm": "3.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.031e-01", "anc_loss": "5.454e-01", "dlm_acc": "7.802e-01", "anc_acc": "7.702e-01", "epoch": 0.01645} {"step": 8230, "loss": 1.2788, "grad_norm": "2.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.151e+00", "dlm_acc": "5.748e-01", "anc_acc": "5.582e-01", "epoch": 0.01646} {"step": 8235, "loss": 1.6328, "grad_norm": "4.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.762e+00", "anc_loss": "1.830e+00", "dlm_acc": "4.492e-01", "anc_acc": "4.379e-01", "epoch": 0.01647} {"step": 8240, "loss": 2.0232, "grad_norm": "4.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.188e+00", "anc_loss": "2.216e+00", "dlm_acc": "2.608e-01", "anc_acc": "2.567e-01", "epoch": 0.01648} {"step": 8245, "loss": 1.3712, "grad_norm": "3.943e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.258e+00", "dlm_acc": "5.524e-01", "anc_acc": "5.387e-01", "epoch": 0.01649} {"step": 8250, "loss": 1.2798, "grad_norm": "7.119e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.300e+00", "dlm_acc": "5.700e-01", "anc_acc": "5.569e-01", "epoch": 0.0165} {"step": 8255, "loss": 0.9434, "grad_norm": "3.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.992e-01", "anc_loss": "1.056e+00", "dlm_acc": "5.839e-01", "anc_acc": "5.697e-01", "epoch": 0.01651} {"step": 8260, "loss": 1.1968, "grad_norm": "3.193e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.191e+00", "dlm_acc": "5.539e-01", "anc_acc": "5.404e-01", "epoch": 0.01652} {"step": 8265, "loss": 1.3152, "grad_norm": "3.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.349e+00", "dlm_acc": "4.992e-01", "anc_acc": "4.883e-01", "epoch": 0.01653} {"step": 8270, "loss": 1.1599, "grad_norm": "3.908e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.404e+00", "dlm_acc": "5.260e-01", "anc_acc": "5.085e-01", "epoch": 0.01654} {"step": 8275, "loss": 1.293, "grad_norm": "3.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.125e-01", "anc_loss": "8.617e-01", "dlm_acc": "6.498e-01", "anc_acc": "6.424e-01", "epoch": 0.01655} {"step": 8280, "loss": 1.3149, "grad_norm": "5.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.236e+00", "dlm_acc": "6.149e-01", "anc_acc": "6.064e-01", "epoch": 0.01656} {"step": 8285, "loss": 1.5946, "grad_norm": "3.381e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.614e+00", "anc_loss": "1.678e+00", "dlm_acc": "4.833e-01", "anc_acc": "4.736e-01", "epoch": 0.01657} {"step": 8290, "loss": 1.5068, "grad_norm": "3.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.458e-01", "anc_acc": "4.329e-01", "epoch": 0.01658} {"step": 8295, "loss": 1.1624, "grad_norm": "2.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.133e-01", "anc_loss": "8.633e-01", "dlm_acc": "6.464e-01", "anc_acc": "6.339e-01", "epoch": 0.01659} {"step": 8300, "loss": 1.2257, "grad_norm": "2.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.070e-01", "anc_acc": "4.978e-01", "epoch": 0.0166} {"step": 8305, "loss": 1.2241, "grad_norm": "4.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.234e-01", "anc_loss": "8.734e-01", "dlm_acc": "6.357e-01", "anc_acc": "6.209e-01", "epoch": 0.01661} {"step": 8310, "loss": 1.5643, "grad_norm": "4.820e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.781e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.446e-01", "anc_acc": "6.328e-01", "epoch": 0.01662} {"step": 8315, "loss": 1.4236, "grad_norm": "5.438e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.453e+00", "dlm_acc": "4.196e-01", "anc_acc": "4.007e-01", "epoch": 0.01663} {"step": 8320, "loss": 1.344, "grad_norm": "3.171e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.201e+00", "anc_loss": "1.260e+00", "dlm_acc": "4.877e-01", "anc_acc": "4.738e-01", "epoch": 0.01664} {"step": 8325, "loss": 0.9182, "grad_norm": "2.341e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.199e-01", "anc_loss": "8.629e-01", "dlm_acc": "6.324e-01", "anc_acc": "6.218e-01", "epoch": 0.01665} {"step": 8330, "loss": 1.2979, "grad_norm": "2.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.836e-01", "anc_loss": "8.207e-01", "dlm_acc": "6.318e-01", "anc_acc": "6.226e-01", "epoch": 0.01666} {"step": 8335, "loss": 1.3531, "grad_norm": "3.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.470e+00", "dlm_acc": "5.121e-01", "anc_acc": "4.952e-01", "epoch": 0.01667} {"step": 8340, "loss": 1.4403, "grad_norm": "4.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.185e-01", "anc_acc": "5.050e-01", "epoch": 0.01668} {"step": 8345, "loss": 1.2267, "grad_norm": "6.491e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.684e-01", "anc_acc": "5.493e-01", "epoch": 0.01669} {"step": 8350, "loss": 1.1042, "grad_norm": "2.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.251e+00", "anc_loss": "1.347e+00", "dlm_acc": "5.338e-01", "anc_acc": "5.221e-01", "epoch": 0.0167} {"step": 8355, "loss": 1.1429, "grad_norm": "3.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.090e+00", "dlm_acc": "4.577e-01", "anc_acc": "4.507e-01", "epoch": 0.01671} {"step": 8360, "loss": 0.9806, "grad_norm": "3.172e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.953e-01", "anc_loss": "7.055e-01", "dlm_acc": "4.660e-01", "anc_acc": "4.613e-01", "epoch": 0.01672} {"step": 8365, "loss": 0.9185, "grad_norm": "2.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.801e-01", "anc_loss": "7.000e-01", "dlm_acc": "5.181e-01", "anc_acc": "5.128e-01", "epoch": 0.01673} {"step": 8370, "loss": 0.9925, "grad_norm": "4.469e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.219e-01", "anc_loss": "6.395e-01", "dlm_acc": "5.402e-01", "anc_acc": "5.317e-01", "epoch": 0.01674} {"step": 8375, "loss": 1.0813, "grad_norm": "4.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.152e+00", "dlm_acc": "5.639e-01", "anc_acc": "5.506e-01", "epoch": 0.01675} {"step": 8380, "loss": 1.4977, "grad_norm": "3.771e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.412e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.272e-01", "anc_acc": "5.122e-01", "epoch": 0.01676} {"step": 8385, "loss": 1.0558, "grad_norm": "2.362e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.189e+00", "dlm_acc": "5.228e-01", "anc_acc": "5.102e-01", "epoch": 0.01677} {"step": 8390, "loss": 1.4275, "grad_norm": "2.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.613e+00", "anc_loss": "1.686e+00", "dlm_acc": "4.918e-01", "anc_acc": "4.789e-01", "epoch": 0.01678} {"step": 8395, "loss": 1.7119, "grad_norm": "4.071e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.894e+00", "anc_loss": "1.959e+00", "dlm_acc": "4.411e-01", "anc_acc": "4.279e-01", "epoch": 0.01679} {"step": 8400, "loss": 1.5822, "grad_norm": "4.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.822e+00", "anc_loss": "1.889e+00", "dlm_acc": "4.555e-01", "anc_acc": "4.432e-01", "epoch": 0.0168} {"step": 8405, "loss": 1.5934, "grad_norm": "6.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.431e+00", "dlm_acc": "5.511e-01", "anc_acc": "5.376e-01", "epoch": 0.01681} {"step": 8410, "loss": 1.0325, "grad_norm": "3.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.102e+00", "dlm_acc": "5.430e-01", "anc_acc": "5.359e-01", "epoch": 0.01682} {"step": 8415, "loss": 1.0607, "grad_norm": "4.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.376e-01", "anc_loss": "3.548e-01", "dlm_acc": "8.981e-01", "anc_acc": "8.953e-01", "epoch": 0.01683} {"step": 8420, "loss": 1.4262, "grad_norm": "4.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.547e-01", "anc_acc": "5.457e-01", "epoch": 0.01684} {"step": 8425, "loss": 1.5711, "grad_norm": "4.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.741e+00", "anc_loss": "1.813e+00", "dlm_acc": "4.936e-01", "anc_acc": "4.813e-01", "epoch": 0.01685} {"step": 8430, "loss": 1.466, "grad_norm": "4.099e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.733e+00", "anc_loss": "1.797e+00", "dlm_acc": "4.385e-01", "anc_acc": "4.260e-01", "epoch": 0.01686} {"step": 8435, "loss": 1.2075, "grad_norm": "2.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.497e+00", "anc_loss": "1.572e+00", "dlm_acc": "5.002e-01", "anc_acc": "4.873e-01", "epoch": 0.01687} {"step": 8440, "loss": 1.2682, "grad_norm": "4.648e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.510e+00", "anc_loss": "1.580e+00", "dlm_acc": "5.316e-01", "anc_acc": "5.186e-01", "epoch": 0.01688} {"step": 8445, "loss": 1.5512, "grad_norm": "3.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.580e+00", "anc_loss": "1.653e+00", "dlm_acc": "4.956e-01", "anc_acc": "4.849e-01", "epoch": 0.01689} {"step": 8450, "loss": 1.4208, "grad_norm": "3.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.578e+00", "dlm_acc": "4.934e-01", "anc_acc": "4.813e-01", "epoch": 0.0169} {"step": 8455, "loss": 1.3161, "grad_norm": "3.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.449e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.172e-01", "anc_acc": "5.048e-01", "epoch": 0.01691} {"step": 8460, "loss": 1.453, "grad_norm": "3.532e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.681e+00", "anc_loss": "1.762e+00", "dlm_acc": "4.929e-01", "anc_acc": "4.786e-01", "epoch": 0.01692} {"step": 8465, "loss": 1.6421, "grad_norm": "8.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.367e+00", "dlm_acc": "5.902e-01", "anc_acc": "5.773e-01", "epoch": 0.01693} {"step": 8470, "loss": 1.5532, "grad_norm": "2.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.340e+00", "dlm_acc": "5.873e-01", "anc_acc": "5.738e-01", "epoch": 0.01694} {"step": 8475, "loss": 0.9294, "grad_norm": "2.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.201e+00", "dlm_acc": "5.681e-01", "anc_acc": "5.526e-01", "epoch": 0.01695} {"step": 8480, "loss": 1.2097, "grad_norm": "3.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.343e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.205e-01", "epoch": 0.01696} {"step": 8485, "loss": 1.1138, "grad_norm": "4.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.696e-01", "anc_acc": "5.542e-01", "epoch": 0.01697} {"step": 8490, "loss": 1.3925, "grad_norm": "4.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.445e+00", "anc_loss": "1.505e+00", "dlm_acc": "5.543e-01", "anc_acc": "5.414e-01", "epoch": 0.01698} {"step": 8495, "loss": 1.3047, "grad_norm": "3.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.561e+00", "anc_loss": "1.623e+00", "dlm_acc": "4.900e-01", "anc_acc": "4.786e-01", "epoch": 0.01699} {"step": 8500, "loss": 1.1613, "grad_norm": "2.010e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.650e+00", "anc_loss": "1.729e+00", "dlm_acc": "5.237e-01", "anc_acc": "5.088e-01", "epoch": 0.017} {"step": 8505, "loss": 0.922, "grad_norm": "2.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.875e-01", "anc_loss": "1.049e+00", "dlm_acc": "6.327e-01", "anc_acc": "6.200e-01", "epoch": 0.01701} {"step": 8510, "loss": 1.1923, "grad_norm": "3.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.694e-01", "anc_acc": "5.535e-01", "epoch": 0.01702} {"step": 8515, "loss": 1.1733, "grad_norm": "3.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.456e+00", "anc_loss": "1.536e+00", "dlm_acc": "5.303e-01", "anc_acc": "5.150e-01", "epoch": 0.01703} {"step": 8520, "loss": 1.1278, "grad_norm": "5.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.644e+00", "anc_loss": "1.709e+00", "dlm_acc": "4.457e-01", "anc_acc": "4.309e-01", "epoch": 0.01704} {"step": 8525, "loss": 0.9088, "grad_norm": "2.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.159e+00", "dlm_acc": "6.020e-01", "anc_acc": "5.886e-01", "epoch": 0.01705} {"step": 8530, "loss": 1.1938, "grad_norm": "4.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.243e-01", "anc_acc": "5.123e-01", "epoch": 0.01706} {"step": 8535, "loss": 0.8107, "grad_norm": "2.132e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.279e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.219e-01", "epoch": 0.01707} {"step": 8540, "loss": 1.1756, "grad_norm": "4.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.307e+00", "dlm_acc": "5.568e-01", "anc_acc": "5.442e-01", "epoch": 0.01708} {"step": 8545, "loss": 1.4362, "grad_norm": "2.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.238e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.453e-01", "epoch": 0.01709} {"step": 8550, "loss": 0.7768, "grad_norm": "6.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.235e+00", "dlm_acc": "5.877e-01", "anc_acc": "5.751e-01", "epoch": 0.0171} {"step": 8555, "loss": 0.7584, "grad_norm": "2.687e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.578e+00", "dlm_acc": "4.980e-01", "anc_acc": "4.846e-01", "epoch": 0.01711} {"step": 8560, "loss": 0.8306, "grad_norm": "2.896e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.492e-01", "epoch": 0.01712} {"step": 8565, "loss": 1.1023, "grad_norm": "3.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.216e+00", "dlm_acc": "5.737e-01", "anc_acc": "5.575e-01", "epoch": 0.01713} {"step": 8570, "loss": 1.1824, "grad_norm": "2.326e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.194e+00", "dlm_acc": "5.896e-01", "anc_acc": "5.742e-01", "epoch": 0.01714} {"step": 8575, "loss": 1.3715, "grad_norm": "3.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.856e-01", "anc_acc": "5.686e-01", "epoch": 0.01715} {"step": 8580, "loss": 1.017, "grad_norm": "2.873e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.205e+00", "dlm_acc": "5.754e-01", "anc_acc": "5.611e-01", "epoch": 0.01716} {"step": 8585, "loss": 1.0116, "grad_norm": "4.469e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.143e+00", "dlm_acc": "5.997e-01", "anc_acc": "5.862e-01", "epoch": 0.01717} {"step": 8590, "loss": 0.9453, "grad_norm": "2.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.117e+00", "dlm_acc": "6.043e-01", "anc_acc": "5.883e-01", "epoch": 0.01718} {"step": 8595, "loss": 1.3841, "grad_norm": "2.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.616e+00", "dlm_acc": "5.259e-01", "anc_acc": "5.111e-01", "epoch": 0.01719} {"step": 8600, "loss": 1.3579, "grad_norm": "2.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.640e+00", "anc_loss": "1.697e+00", "dlm_acc": "4.512e-01", "anc_acc": "4.413e-01", "epoch": 0.0172} {"step": 8605, "loss": 1.4035, "grad_norm": "3.230e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.089e+00", "anc_loss": "2.134e+00", "dlm_acc": "3.329e-01", "anc_acc": "3.255e-01", "epoch": 0.01721} {"step": 8610, "loss": 1.412, "grad_norm": "3.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.955e+00", "anc_loss": "2.030e+00", "dlm_acc": "4.178e-01", "anc_acc": "4.057e-01", "epoch": 0.01722} {"step": 8615, "loss": 1.3282, "grad_norm": "3.158e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.471e+00", "anc_loss": "1.533e+00", "dlm_acc": "4.996e-01", "anc_acc": "4.866e-01", "epoch": 0.01723} {"step": 8620, "loss": 1.2095, "grad_norm": "9.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.667e+00", "anc_loss": "1.758e+00", "dlm_acc": "4.798e-01", "anc_acc": "4.651e-01", "epoch": 0.01724} {"step": 8625, "loss": 1.2665, "grad_norm": "2.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.609e+00", "dlm_acc": "5.154e-01", "anc_acc": "5.008e-01", "epoch": 0.01725} {"step": 8630, "loss": 1.1312, "grad_norm": "2.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.080e+00", "dlm_acc": "5.647e-01", "anc_acc": "5.523e-01", "epoch": 0.01726} {"step": 8635, "loss": 1.2798, "grad_norm": "3.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.165e-01", "anc_acc": "5.034e-01", "epoch": 0.01727} {"step": 8640, "loss": 1.5777, "grad_norm": "4.362e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.578e+00", "anc_loss": "1.647e+00", "dlm_acc": "5.026e-01", "anc_acc": "4.902e-01", "epoch": 0.01728} {"step": 8645, "loss": 1.1651, "grad_norm": "4.094e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.081e-01", "anc_acc": "4.941e-01", "epoch": 0.01729} {"step": 8650, "loss": 1.3226, "grad_norm": "2.437e+01", "learning_rate": "1.000e-04", "dlm_loss": "1.741e+00", "anc_loss": "1.856e+00", "dlm_acc": "4.273e-01", "anc_acc": "4.175e-01", "epoch": 0.0173} {"step": 8655, "loss": 1.3824, "grad_norm": "4.907e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.464e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.095e-01", "anc_acc": "4.966e-01", "epoch": 0.01731} {"step": 8660, "loss": 1.1762, "grad_norm": "2.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.210e-01", "anc_acc": "5.085e-01", "epoch": 0.01732} {"step": 8665, "loss": 1.362, "grad_norm": "3.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.562e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.818e-01", "anc_acc": "4.687e-01", "epoch": 0.01733} {"step": 8670, "loss": 1.1352, "grad_norm": "3.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.062e+00", "dlm_acc": "6.197e-01", "anc_acc": "6.077e-01", "epoch": 0.01734} {"step": 8675, "loss": 0.9787, "grad_norm": "2.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.324e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.456e-01", "epoch": 0.01735} {"step": 8680, "loss": 1.1095, "grad_norm": "2.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.591e+00", "anc_loss": "1.653e+00", "dlm_acc": "4.506e-01", "anc_acc": "4.401e-01", "epoch": 0.01736} {"step": 8685, "loss": 1.1918, "grad_norm": "2.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.235e+00", "dlm_acc": "5.619e-01", "anc_acc": "5.439e-01", "epoch": 0.01737} {"step": 8690, "loss": 1.4122, "grad_norm": "3.131e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.649e+00", "anc_loss": "1.727e+00", "dlm_acc": "5.050e-01", "anc_acc": "4.906e-01", "epoch": 0.01738} {"step": 8695, "loss": 1.2472, "grad_norm": "5.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.415e+00", "anc_loss": "1.485e+00", "dlm_acc": "5.322e-01", "anc_acc": "5.193e-01", "epoch": 0.01739} {"step": 8700, "loss": 1.7431, "grad_norm": "4.172e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.733e+00", "anc_loss": "1.812e+00", "dlm_acc": "5.211e-01", "anc_acc": "5.072e-01", "epoch": 0.0174} {"step": 8705, "loss": 1.2712, "grad_norm": "4.787e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.608e-01", "anc_acc": "5.484e-01", "epoch": 0.01741} {"step": 8710, "loss": 1.5361, "grad_norm": "4.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.194e+00", "anc_loss": "1.252e+00", "dlm_acc": "6.374e-01", "anc_acc": "6.283e-01", "epoch": 0.01742} {"step": 8715, "loss": 1.0231, "grad_norm": "3.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.680e-01", "anc_loss": "3.883e-01", "dlm_acc": "8.705e-01", "anc_acc": "8.657e-01", "epoch": 0.01743} {"step": 8720, "loss": 1.9255, "grad_norm": "4.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.568e+00", "anc_loss": "1.630e+00", "dlm_acc": "4.920e-01", "anc_acc": "4.819e-01", "epoch": 0.01744} {"step": 8725, "loss": 1.1148, "grad_norm": "2.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.339e+00", "anc_loss": "1.411e+00", "dlm_acc": "5.461e-01", "anc_acc": "5.292e-01", "epoch": 0.01745} {"step": 8730, "loss": 1.0959, "grad_norm": "3.622e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.339e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.543e-01", "anc_acc": "5.383e-01", "epoch": 0.01746} {"step": 8735, "loss": 0.9778, "grad_norm": "2.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.467e-01", "anc_loss": "1.010e+00", "dlm_acc": "6.524e-01", "anc_acc": "6.387e-01", "epoch": 0.01747} {"step": 8740, "loss": 1.4608, "grad_norm": "2.894e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.181e+00", "dlm_acc": "6.006e-01", "anc_acc": "5.842e-01", "epoch": 0.01748} {"step": 8745, "loss": 1.6194, "grad_norm": "7.971e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.485e+00", "anc_loss": "1.571e+00", "dlm_acc": "5.315e-01", "anc_acc": "5.151e-01", "epoch": 0.01749} {"step": 8750, "loss": 1.3619, "grad_norm": "2.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.624e-01", "anc_acc": "5.478e-01", "epoch": 0.0175} {"step": 8755, "loss": 1.2354, "grad_norm": "5.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.467e-01", "anc_acc": "5.343e-01", "epoch": 0.01751} {"step": 8760, "loss": 1.3346, "grad_norm": "2.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.670e-01", "anc_acc": "5.523e-01", "epoch": 0.01752} {"step": 8765, "loss": 1.43, "grad_norm": "3.636e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.109e-01", "anc_acc": "4.962e-01", "epoch": 0.01753} {"step": 8770, "loss": 1.8687, "grad_norm": "3.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.681e+00", "anc_loss": "1.745e+00", "dlm_acc": "5.096e-01", "anc_acc": "4.981e-01", "epoch": 0.01754} {"step": 8775, "loss": 1.6452, "grad_norm": "3.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.493e+00", "anc_loss": "1.624e+00", "dlm_acc": "5.478e-01", "anc_acc": "5.344e-01", "epoch": 0.01755} {"step": 8780, "loss": 1.4748, "grad_norm": "3.452e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.457e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.221e-01", "anc_acc": "5.095e-01", "epoch": 0.01756} {"step": 8785, "loss": 1.5542, "grad_norm": "5.458e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.614e+00", "anc_loss": "1.677e+00", "dlm_acc": "4.418e-01", "anc_acc": "4.295e-01", "epoch": 0.01757} {"step": 8790, "loss": 1.1705, "grad_norm": "3.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.836e-01", "anc_loss": "1.051e+00", "dlm_acc": "6.250e-01", "anc_acc": "6.081e-01", "epoch": 0.01758} {"step": 8795, "loss": 1.4366, "grad_norm": "7.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.513e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.256e-01", "epoch": 0.01759} {"step": 8800, "loss": 1.4813, "grad_norm": "2.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.258e+00", "dlm_acc": "5.263e-01", "anc_acc": "5.129e-01", "epoch": 0.0176} {"step": 8805, "loss": 1.4984, "grad_norm": "3.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.460e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.213e-01", "anc_acc": "5.080e-01", "epoch": 0.01761} {"step": 8810, "loss": 1.1225, "grad_norm": "2.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.377e-01", "anc_loss": "9.801e-01", "dlm_acc": "5.875e-01", "anc_acc": "5.757e-01", "epoch": 0.01762} {"step": 8815, "loss": 1.1226, "grad_norm": "3.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.359e-01", "anc_loss": "7.879e-01", "dlm_acc": "6.401e-01", "anc_acc": "6.237e-01", "epoch": 0.01763} {"step": 8820, "loss": 1.6094, "grad_norm": "3.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.233e+00", "dlm_acc": "6.019e-01", "anc_acc": "5.890e-01", "epoch": 0.01764} {"step": 8825, "loss": 0.9069, "grad_norm": "2.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.352e-01", "anc_loss": "6.684e-01", "dlm_acc": "6.537e-01", "anc_acc": "6.444e-01", "epoch": 0.01765} {"step": 8830, "loss": 1.301, "grad_norm": "3.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.469e-01", "anc_loss": "5.684e-01", "dlm_acc": "6.052e-01", "anc_acc": "5.924e-01", "epoch": 0.01766} {"step": 8835, "loss": 0.8973, "grad_norm": "5.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.418e-01", "anc_loss": "4.652e-01", "dlm_acc": "6.376e-01", "anc_acc": "6.212e-01", "epoch": 0.01767} {"step": 8840, "loss": 1.0501, "grad_norm": "3.248e+00", "learning_rate": "1.000e-04", "dlm_loss": "5.180e-01", "anc_loss": "5.301e-01", "dlm_acc": "6.235e-01", "anc_acc": "6.182e-01", "epoch": 0.01768} {"step": 8845, "loss": 1.2433, "grad_norm": "3.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.487e-01", "anc_loss": "5.688e-01", "dlm_acc": "7.047e-01", "anc_acc": "6.978e-01", "epoch": 0.01769} {"step": 8850, "loss": 0.9113, "grad_norm": "8.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.185e-01", "anc_loss": "4.238e-01", "dlm_acc": "7.296e-01", "anc_acc": "7.263e-01", "epoch": 0.0177} {"step": 8855, "loss": 0.9691, "grad_norm": "4.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.460e-01", "anc_loss": "3.524e-01", "dlm_acc": "7.835e-01", "anc_acc": "7.793e-01", "epoch": 0.01771} {"step": 8860, "loss": 0.9005, "grad_norm": "2.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.830e-01", "anc_loss": "8.190e-01", "dlm_acc": "6.805e-01", "anc_acc": "6.735e-01", "epoch": 0.01772} {"step": 8865, "loss": 1.0116, "grad_norm": "2.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.944e-01", "anc_loss": "3.975e-01", "dlm_acc": "6.797e-01", "anc_acc": "6.784e-01", "epoch": 0.01773} {"step": 8870, "loss": 1.0817, "grad_norm": "2.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.992e-01", "anc_loss": "7.352e-01", "dlm_acc": "6.212e-01", "anc_acc": "6.069e-01", "epoch": 0.01774} {"step": 8875, "loss": 1.3047, "grad_norm": "5.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.188e-01", "anc_loss": "5.391e-01", "dlm_acc": "6.405e-01", "anc_acc": "6.276e-01", "epoch": 0.01775} {"step": 8880, "loss": 1.0811, "grad_norm": "3.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.768e-01", "anc_loss": "5.965e-01", "dlm_acc": "6.453e-01", "anc_acc": "6.407e-01", "epoch": 0.01776} {"step": 8885, "loss": 1.3008, "grad_norm": "4.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.039e-01", "anc_loss": "9.422e-01", "dlm_acc": "5.806e-01", "anc_acc": "5.698e-01", "epoch": 0.01777} {"step": 8890, "loss": 1.3862, "grad_norm": "2.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.447e-01", "anc_loss": "5.512e-01", "dlm_acc": "6.511e-01", "anc_acc": "6.494e-01", "epoch": 0.01778} {"step": 8895, "loss": 1.5935, "grad_norm": "3.622e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.871e-01", "anc_loss": "4.930e-01", "dlm_acc": "6.655e-01", "anc_acc": "6.637e-01", "epoch": 0.01779} {"step": 8900, "loss": 1.6463, "grad_norm": "4.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.188e-01", "anc_loss": "4.271e-01", "dlm_acc": "7.391e-01", "anc_acc": "7.363e-01", "epoch": 0.0178} {"step": 8905, "loss": 1.1277, "grad_norm": "2.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.258e-01", "anc_loss": "3.383e-01", "dlm_acc": "7.842e-01", "anc_acc": "7.780e-01", "epoch": 0.01781} {"step": 8910, "loss": 0.9523, "grad_norm": "4.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.344e-01", "anc_loss": "5.459e-01", "dlm_acc": "6.829e-01", "anc_acc": "6.780e-01", "epoch": 0.01782} {"step": 8915, "loss": 0.7035, "grad_norm": "3.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.660e-01", "anc_loss": "3.740e-01", "dlm_acc": "7.316e-01", "anc_acc": "7.268e-01", "epoch": 0.01783} {"step": 8920, "loss": 0.6501, "grad_norm": "3.104e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.656e-01", "anc_loss": "5.709e-01", "dlm_acc": "6.265e-01", "anc_acc": "6.225e-01", "epoch": 0.01784} {"step": 8925, "loss": 0.7203, "grad_norm": "4.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.234e-01", "anc_loss": "8.547e-01", "dlm_acc": "6.238e-01", "anc_acc": "6.164e-01", "epoch": 0.01785} {"step": 8930, "loss": 1.4945, "grad_norm": "8.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.047e+00", "dlm_acc": "5.905e-01", "anc_acc": "5.804e-01", "epoch": 0.01786} {"step": 8935, "loss": 1.2241, "grad_norm": "3.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.007e+00", "anc_loss": "1.038e+00", "dlm_acc": "5.313e-01", "anc_acc": "5.248e-01", "epoch": 0.01787} {"step": 8940, "loss": 1.2235, "grad_norm": "4.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.938e-01", "anc_loss": "1.033e+00", "dlm_acc": "5.331e-01", "anc_acc": "5.239e-01", "epoch": 0.01788} {"step": 8945, "loss": 1.2424, "grad_norm": "5.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.200e-01", "anc_acc": "5.072e-01", "epoch": 0.01789} {"step": 8950, "loss": 1.4034, "grad_norm": "5.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.109e-01", "anc_acc": "4.976e-01", "epoch": 0.0179} {"step": 8955, "loss": 1.2532, "grad_norm": "3.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.899e-01", "anc_acc": "5.751e-01", "epoch": 0.01791} {"step": 8960, "loss": 1.6392, "grad_norm": "4.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.695e-01", "anc_acc": "5.595e-01", "epoch": 0.01792} {"step": 8965, "loss": 1.2977, "grad_norm": "3.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.065e-01", "anc_loss": "6.301e-01", "dlm_acc": "6.769e-01", "anc_acc": "6.676e-01", "epoch": 0.01793} {"step": 8970, "loss": 1.1417, "grad_norm": "3.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.172e-01", "anc_loss": "4.391e-01", "dlm_acc": "7.042e-01", "anc_acc": "6.919e-01", "epoch": 0.01794} {"step": 8975, "loss": 1.0279, "grad_norm": "1.162e+00", "learning_rate": "1.000e-04", "dlm_loss": "4.266e-01", "anc_loss": "4.523e-01", "dlm_acc": "7.094e-01", "anc_acc": "6.954e-01", "epoch": 0.01795} {"step": 8980, "loss": 1.0597, "grad_norm": "3.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.781e-01", "anc_loss": "5.000e-01", "dlm_acc": "6.789e-01", "anc_acc": "6.657e-01", "epoch": 0.01796} {"step": 8985, "loss": 1.3544, "grad_norm": "4.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.117e-01", "anc_loss": "6.332e-01", "dlm_acc": "5.786e-01", "anc_acc": "5.668e-01", "epoch": 0.01797} {"step": 8990, "loss": 0.8601, "grad_norm": "5.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.775e-01", "anc_loss": "9.293e-01", "dlm_acc": "6.070e-01", "anc_acc": "5.908e-01", "epoch": 0.01798} {"step": 8995, "loss": 1.0181, "grad_norm": "3.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.898e-01", "anc_loss": "9.313e-01", "dlm_acc": "5.433e-01", "anc_acc": "5.310e-01", "epoch": 0.01799} {"step": 9000, "loss": 1.3536, "grad_norm": "8.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.136e+00", "dlm_acc": "4.739e-01", "anc_acc": "4.660e-01", "epoch": 0.018} {"step": 9005, "loss": 1.2839, "grad_norm": "3.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.117e-01", "anc_loss": "7.383e-01", "dlm_acc": "5.521e-01", "anc_acc": "5.397e-01", "epoch": 0.01801} {"step": 9010, "loss": 1.061, "grad_norm": "6.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.691e-01", "anc_loss": "9.027e-01", "dlm_acc": "5.514e-01", "anc_acc": "5.412e-01", "epoch": 0.01802} {"step": 9015, "loss": 1.4777, "grad_norm": "3.590e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.103e+00", "anc_loss": "1.159e+00", "dlm_acc": "5.649e-01", "anc_acc": "5.513e-01", "epoch": 0.01803} {"step": 9020, "loss": 0.9369, "grad_norm": "2.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.273e-01", "anc_loss": "5.500e-01", "dlm_acc": "6.162e-01", "anc_acc": "6.071e-01", "epoch": 0.01804} {"step": 9025, "loss": 1.2727, "grad_norm": "6.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.493e+00", "anc_loss": "1.566e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.317e-01", "epoch": 0.01805} {"step": 9030, "loss": 0.8013, "grad_norm": "4.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.312e-01", "anc_loss": "7.617e-01", "dlm_acc": "6.113e-01", "anc_acc": "6.002e-01", "epoch": 0.01806} {"step": 9035, "loss": 0.7098, "grad_norm": "3.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.703e-01", "anc_loss": "1.018e+00", "dlm_acc": "6.074e-01", "anc_acc": "5.971e-01", "epoch": 0.01807} {"step": 9040, "loss": 0.9744, "grad_norm": "3.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.103e+00", "dlm_acc": "5.998e-01", "anc_acc": "5.863e-01", "epoch": 0.01808} {"step": 9045, "loss": 1.1525, "grad_norm": "3.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.418e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.312e-01", "epoch": 0.01809} {"step": 9050, "loss": 0.9414, "grad_norm": "5.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.228e+00", "dlm_acc": "5.845e-01", "anc_acc": "5.714e-01", "epoch": 0.0181} {"step": 9055, "loss": 0.9205, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.992e-01", "anc_loss": "5.184e-01", "dlm_acc": "7.228e-01", "anc_acc": "7.151e-01", "epoch": 0.01811} {"step": 9060, "loss": 0.9546, "grad_norm": "3.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.201e+00", "dlm_acc": "5.888e-01", "anc_acc": "5.762e-01", "epoch": 0.01812} {"step": 9065, "loss": 1.0093, "grad_norm": "2.911e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.514e+00", "anc_loss": "1.584e+00", "dlm_acc": "5.202e-01", "anc_acc": "5.063e-01", "epoch": 0.01813} {"step": 9070, "loss": 1.1689, "grad_norm": "3.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.350e-01", "anc_acc": "5.219e-01", "epoch": 0.01814} {"step": 9075, "loss": 1.1268, "grad_norm": "3.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.789e-01", "anc_acc": "5.652e-01", "epoch": 0.01815} {"step": 9080, "loss": 1.2375, "grad_norm": "8.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.479e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.305e-01", "anc_acc": "5.163e-01", "epoch": 0.01816} {"step": 9085, "loss": 0.8088, "grad_norm": "2.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.236e+00", "dlm_acc": "6.158e-01", "anc_acc": "5.976e-01", "epoch": 0.01817} {"step": 9090, "loss": 1.2178, "grad_norm": "2.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.564e+00", "dlm_acc": "5.254e-01", "anc_acc": "5.111e-01", "epoch": 0.01818} {"step": 9095, "loss": 1.3846, "grad_norm": "5.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.701e-01", "anc_acc": "5.581e-01", "epoch": 0.01819} {"step": 9100, "loss": 0.913, "grad_norm": "2.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.208e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.672e-01", "anc_acc": "5.529e-01", "epoch": 0.0182} {"step": 9105, "loss": 1.5543, "grad_norm": "2.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.784e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.864e-01", "epoch": 0.01821} {"step": 9110, "loss": 1.1146, "grad_norm": "2.510e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.400e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.429e-01", "anc_acc": "5.277e-01", "epoch": 0.01822} {"step": 9115, "loss": 1.2307, "grad_norm": "5.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.655e+00", "anc_loss": "1.731e+00", "dlm_acc": "4.803e-01", "anc_acc": "4.675e-01", "epoch": 0.01823} {"step": 9120, "loss": 0.853, "grad_norm": "3.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.352e-01", "anc_acc": "5.188e-01", "epoch": 0.01824} {"step": 9125, "loss": 1.0106, "grad_norm": "4.171e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.339e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.686e-01", "anc_acc": "5.515e-01", "epoch": 0.01825} {"step": 9130, "loss": 1.2771, "grad_norm": "3.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.421e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.469e-01", "epoch": 0.01826} {"step": 9135, "loss": 1.5646, "grad_norm": "4.601e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.525e+00", "anc_loss": "1.590e+00", "dlm_acc": "5.221e-01", "anc_acc": "5.087e-01", "epoch": 0.01827} {"step": 9140, "loss": 1.4121, "grad_norm": "3.858e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.666e+00", "anc_loss": "1.748e+00", "dlm_acc": "4.912e-01", "anc_acc": "4.749e-01", "epoch": 0.01828} {"step": 9145, "loss": 1.0736, "grad_norm": "4.290e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.420e-01", "anc_acc": "5.288e-01", "epoch": 0.01829} {"step": 9150, "loss": 1.2149, "grad_norm": "2.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.486e-01", "anc_acc": "5.329e-01", "epoch": 0.0183} {"step": 9155, "loss": 1.4125, "grad_norm": "5.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.474e+00", "anc_loss": "1.548e+00", "dlm_acc": "5.134e-01", "anc_acc": "4.982e-01", "epoch": 0.01831} {"step": 9160, "loss": 1.114, "grad_norm": "4.444e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.355e+00", "dlm_acc": "6.008e-01", "anc_acc": "5.851e-01", "epoch": 0.01832} {"step": 9165, "loss": 1.0756, "grad_norm": "2.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.256e+00", "anc_loss": "1.324e+00", "dlm_acc": "5.727e-01", "anc_acc": "5.593e-01", "epoch": 0.01833} {"step": 9170, "loss": 1.7462, "grad_norm": "5.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.745e+00", "anc_loss": "1.819e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.961e-01", "epoch": 0.01834} {"step": 9175, "loss": 1.304, "grad_norm": "3.818e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.659e+00", "dlm_acc": "5.128e-01", "anc_acc": "5.001e-01", "epoch": 0.01835} {"step": 9180, "loss": 1.2042, "grad_norm": "3.938e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.399e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.092e-01", "anc_acc": "4.930e-01", "epoch": 0.01836} {"step": 9185, "loss": 1.1821, "grad_norm": "2.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.536e+00", "anc_loss": "1.599e+00", "dlm_acc": "5.115e-01", "anc_acc": "4.978e-01", "epoch": 0.01837} {"step": 9190, "loss": 1.2286, "grad_norm": "4.034e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.392e-01", "anc_acc": "5.238e-01", "epoch": 0.01838} {"step": 9195, "loss": 1.01, "grad_norm": "5.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.157e+00", "dlm_acc": "5.867e-01", "anc_acc": "5.745e-01", "epoch": 0.01839} {"step": 9200, "loss": 1.1086, "grad_norm": "3.171e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.570e+00", "dlm_acc": "4.821e-01", "anc_acc": "4.690e-01", "epoch": 0.0184} {"step": 9205, "loss": 1.1343, "grad_norm": "2.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.668e-01", "anc_acc": "5.545e-01", "epoch": 0.01841} {"step": 9210, "loss": 1.5832, "grad_norm": "5.544e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.618e+00", "anc_loss": "1.693e+00", "dlm_acc": "5.167e-01", "anc_acc": "5.043e-01", "epoch": 0.01842} {"step": 9215, "loss": 1.4256, "grad_norm": "4.731e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.698e+00", "dlm_acc": "4.688e-01", "anc_acc": "4.547e-01", "epoch": 0.01843} {"step": 9220, "loss": 1.2553, "grad_norm": "3.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.432e+00", "anc_loss": "1.498e+00", "dlm_acc": "4.921e-01", "anc_acc": "4.818e-01", "epoch": 0.01844} {"step": 9225, "loss": 1.2598, "grad_norm": "3.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.353e+00", "dlm_acc": "5.581e-01", "anc_acc": "5.465e-01", "epoch": 0.01845} {"step": 9230, "loss": 1.3744, "grad_norm": "4.185e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.568e+00", "anc_loss": "1.634e+00", "dlm_acc": "4.927e-01", "anc_acc": "4.812e-01", "epoch": 0.01846} {"step": 9235, "loss": 1.2974, "grad_norm": "7.748e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.683e+00", "anc_loss": "1.762e+00", "dlm_acc": "4.747e-01", "anc_acc": "4.611e-01", "epoch": 0.01847} {"step": 9240, "loss": 1.0538, "grad_norm": "4.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.224e+00", "dlm_acc": "5.718e-01", "anc_acc": "5.580e-01", "epoch": 0.01848} {"step": 9245, "loss": 1.0439, "grad_norm": "3.373e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.167e+00", "dlm_acc": "5.429e-01", "anc_acc": "5.261e-01", "epoch": 0.01849} {"step": 9250, "loss": 1.7122, "grad_norm": "9.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.803e+00", "anc_loss": "1.878e+00", "dlm_acc": "4.309e-01", "anc_acc": "4.187e-01", "epoch": 0.0185} {"step": 9255, "loss": 1.4775, "grad_norm": "4.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.689e+00", "anc_loss": "1.727e+00", "dlm_acc": "2.894e-01", "anc_acc": "2.858e-01", "epoch": 0.01851} {"step": 9260, "loss": 1.9778, "grad_norm": "3.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.691e+00", "anc_loss": "1.777e+00", "dlm_acc": "4.851e-01", "anc_acc": "4.703e-01", "epoch": 0.01852} {"step": 9265, "loss": 1.6056, "grad_norm": "5.596e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.248e+00", "dlm_acc": "5.828e-01", "anc_acc": "5.693e-01", "epoch": 0.01853} {"step": 9270, "loss": 1.6132, "grad_norm": "5.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.534e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.386e-01", "epoch": 0.01854} {"step": 9275, "loss": 1.2645, "grad_norm": "3.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.058e+00", "dlm_acc": "6.571e-01", "anc_acc": "6.465e-01", "epoch": 0.01855} {"step": 9280, "loss": 0.7958, "grad_norm": "2.339e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.410e-01", "anc_loss": "6.723e-01", "dlm_acc": "6.714e-01", "anc_acc": "6.641e-01", "epoch": 0.01856} {"step": 9285, "loss": 0.8815, "grad_norm": "3.462e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.178e+00", "anc_loss": "1.235e+00", "dlm_acc": "6.118e-01", "anc_acc": "6.026e-01", "epoch": 0.01857} {"step": 9290, "loss": 1.1998, "grad_norm": "6.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.418e-01", "anc_loss": "7.789e-01", "dlm_acc": "6.281e-01", "anc_acc": "6.201e-01", "epoch": 0.01858} {"step": 9295, "loss": 1.5396, "grad_norm": "3.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.124e+00", "anc_loss": "1.179e+00", "dlm_acc": "6.589e-01", "anc_acc": "6.499e-01", "epoch": 0.01859} {"step": 9300, "loss": 0.9013, "grad_norm": "1.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.701e-02", "anc_loss": "3.867e-02", "dlm_acc": "9.771e-01", "anc_acc": "9.767e-01", "epoch": 0.0186} {"step": 9305, "loss": 0.8625, "grad_norm": "3.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.088e-02", "anc_loss": "2.130e-02", "dlm_acc": "9.866e-01", "anc_acc": "9.859e-01", "epoch": 0.01861} {"step": 9310, "loss": 1.1117, "grad_norm": "5.088e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.343e-01", "anc_loss": "2.478e-01", "dlm_acc": "8.973e-01", "anc_acc": "8.930e-01", "epoch": 0.01862} {"step": 9315, "loss": 1.695, "grad_norm": "4.252e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.403e+00", "dlm_acc": "5.724e-01", "anc_acc": "5.564e-01", "epoch": 0.01863} {"step": 9320, "loss": 1.3877, "grad_norm": "4.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.643e-01", "anc_acc": "5.545e-01", "epoch": 0.01864} {"step": 9325, "loss": 1.3803, "grad_norm": "5.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.840e-01", "anc_loss": "8.242e-01", "dlm_acc": "6.907e-01", "anc_acc": "6.815e-01", "epoch": 0.01865} {"step": 9330, "loss": 1.7473, "grad_norm": "7.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.285e-01", "anc_loss": "8.672e-01", "dlm_acc": "6.651e-01", "anc_acc": "6.555e-01", "epoch": 0.01866} {"step": 9335, "loss": 1.1384, "grad_norm": "4.622e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.391e-01", "anc_loss": "3.575e-01", "dlm_acc": "8.386e-01", "anc_acc": "8.332e-01", "epoch": 0.01867} {"step": 9340, "loss": 1.0655, "grad_norm": "3.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.376e-01", "anc_loss": "5.786e-01", "dlm_acc": "7.779e-01", "anc_acc": "7.670e-01", "epoch": 0.01868} {"step": 9345, "loss": 1.5956, "grad_norm": "3.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.068e+00", "anc_loss": "1.102e+00", "dlm_acc": "4.922e-01", "anc_acc": "4.848e-01", "epoch": 0.01869} {"step": 9350, "loss": 1.3354, "grad_norm": "5.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.867e-01", "anc_loss": "7.012e-01", "dlm_acc": "7.023e-01", "anc_acc": "6.962e-01", "epoch": 0.0187} {"step": 9355, "loss": 0.8871, "grad_norm": "3.031e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.150e-01", "anc_loss": "8.631e-01", "dlm_acc": "6.914e-01", "anc_acc": "6.786e-01", "epoch": 0.01871} {"step": 9360, "loss": 1.3648, "grad_norm": "3.560e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.649e+00", "anc_loss": "1.704e+00", "dlm_acc": "4.721e-01", "anc_acc": "4.649e-01", "epoch": 0.01872} {"step": 9365, "loss": 1.5801, "grad_norm": "5.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.393e-01", "anc_loss": "8.805e-01", "dlm_acc": "7.014e-01", "anc_acc": "6.898e-01", "epoch": 0.01873} {"step": 9370, "loss": 1.1113, "grad_norm": "3.928e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.436e-01", "anc_loss": "9.920e-01", "dlm_acc": "6.468e-01", "anc_acc": "6.332e-01", "epoch": 0.01874} {"step": 9375, "loss": 1.3162, "grad_norm": "4.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.280e-01", "anc_acc": "5.157e-01", "epoch": 0.01875} {"step": 9380, "loss": 1.7541, "grad_norm": "4.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.017e+00", "anc_loss": "1.072e+00", "dlm_acc": "5.998e-01", "anc_acc": "5.873e-01", "epoch": 0.01876} {"step": 9385, "loss": 1.2049, "grad_norm": "3.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.395e-01", "anc_loss": "8.855e-01", "dlm_acc": "6.250e-01", "anc_acc": "6.136e-01", "epoch": 0.01877} {"step": 9390, "loss": 1.1234, "grad_norm": "3.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.592e-01", "anc_loss": "4.913e-01", "dlm_acc": "8.321e-01", "anc_acc": "8.195e-01", "epoch": 0.01878} {"step": 9395, "loss": 1.4704, "grad_norm": "6.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.186e+00", "dlm_acc": "5.981e-01", "anc_acc": "5.873e-01", "epoch": 0.01879} {"step": 9400, "loss": 1.9181, "grad_norm": "3.605e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.467e+00", "anc_loss": "1.555e+00", "dlm_acc": "5.118e-01", "anc_acc": "4.960e-01", "epoch": 0.0188} {"step": 9405, "loss": 2.155, "grad_norm": "3.780e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.188e+00", "dlm_acc": "5.578e-01", "anc_acc": "5.427e-01", "epoch": 0.01881} {"step": 9410, "loss": 1.1457, "grad_norm": "3.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.095e-01", "anc_loss": "6.489e-01", "dlm_acc": "7.471e-01", "anc_acc": "7.326e-01", "epoch": 0.01882} {"step": 9415, "loss": 1.0831, "grad_norm": "2.915e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.918e-01", "anc_loss": "7.391e-01", "dlm_acc": "7.202e-01", "anc_acc": "7.091e-01", "epoch": 0.01883} {"step": 9420, "loss": 1.3591, "grad_norm": "4.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.422e-01", "anc_loss": "9.688e-01", "dlm_acc": "4.684e-01", "anc_acc": "4.606e-01", "epoch": 0.01884} {"step": 9425, "loss": 1.3361, "grad_norm": "2.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.266e-01", "anc_loss": "7.785e-01", "dlm_acc": "6.893e-01", "anc_acc": "6.759e-01", "epoch": 0.01885} {"step": 9430, "loss": 1.195, "grad_norm": "6.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.299e-01", "anc_loss": "5.445e-01", "dlm_acc": "6.643e-01", "anc_acc": "6.596e-01", "epoch": 0.01886} {"step": 9435, "loss": 1.3198, "grad_norm": "3.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.406e-01", "anc_loss": "8.782e-01", "dlm_acc": "6.780e-01", "anc_acc": "6.709e-01", "epoch": 0.01887} {"step": 9440, "loss": 1.2286, "grad_norm": "6.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.912e-01", "anc_loss": "6.130e-01", "dlm_acc": "7.195e-01", "anc_acc": "7.177e-01", "epoch": 0.01888} {"step": 9445, "loss": 1.0803, "grad_norm": "6.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.199e-01", "anc_loss": "8.441e-01", "dlm_acc": "5.929e-01", "anc_acc": "5.863e-01", "epoch": 0.01889} {"step": 9450, "loss": 1.2246, "grad_norm": "4.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.920e-01", "anc_acc": "5.782e-01", "epoch": 0.0189} {"step": 9455, "loss": 1.2786, "grad_norm": "2.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.214e+00", "anc_loss": "1.293e+00", "dlm_acc": "5.794e-01", "anc_acc": "5.632e-01", "epoch": 0.01891} {"step": 9460, "loss": 1.2744, "grad_norm": "3.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.161e-01", "anc_acc": "5.018e-01", "epoch": 0.01892} {"step": 9465, "loss": 1.6835, "grad_norm": "6.211e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.428e+00", "dlm_acc": "5.968e-01", "anc_acc": "5.779e-01", "epoch": 0.01893} {"step": 9470, "loss": 1.3214, "grad_norm": "3.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.431e+00", "anc_loss": "1.498e+00", "dlm_acc": "4.883e-01", "anc_acc": "4.736e-01", "epoch": 0.01894} {"step": 9475, "loss": 1.5704, "grad_norm": "2.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.479e-01", "anc_acc": "5.333e-01", "epoch": 0.01895} {"step": 9480, "loss": 1.3332, "grad_norm": "6.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.216e+00", "dlm_acc": "5.570e-01", "anc_acc": "5.416e-01", "epoch": 0.01896} {"step": 9485, "loss": 1.3172, "grad_norm": "2.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.559e-01", "anc_acc": "5.381e-01", "epoch": 0.01897} {"step": 9490, "loss": 1.4144, "grad_norm": "2.623e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.682e-01", "anc_acc": "5.543e-01", "epoch": 0.01898} {"step": 9495, "loss": 1.7562, "grad_norm": "3.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.614e+00", "anc_loss": "1.695e+00", "dlm_acc": "4.913e-01", "anc_acc": "4.773e-01", "epoch": 0.01899} {"step": 9500, "loss": 1.5167, "grad_norm": "4.568e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.237e+00", "dlm_acc": "6.197e-01", "anc_acc": "6.052e-01", "epoch": 0.019} {"step": 9505, "loss": 1.3675, "grad_norm": "3.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.275e+00", "dlm_acc": "5.836e-01", "anc_acc": "5.689e-01", "epoch": 0.01901} {"step": 9510, "loss": 1.3972, "grad_norm": "6.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.210e-01", "anc_acc": "5.066e-01", "epoch": 0.01902} {"step": 9515, "loss": 1.2657, "grad_norm": "5.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.893e-01", "anc_loss": "1.044e+00", "dlm_acc": "6.356e-01", "anc_acc": "6.233e-01", "epoch": 0.01903} {"step": 9520, "loss": 1.1552, "grad_norm": "4.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.986e-01", "anc_loss": "8.491e-01", "dlm_acc": "7.023e-01", "anc_acc": "6.918e-01", "epoch": 0.01904} {"step": 9525, "loss": 1.1311, "grad_norm": "3.688e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.951e-01", "anc_loss": "3.998e-01", "dlm_acc": "7.544e-01", "anc_acc": "7.532e-01", "epoch": 0.01905} {"step": 9530, "loss": 1.1742, "grad_norm": "4.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.742e-01", "anc_loss": "6.754e-01", "dlm_acc": "5.639e-01", "anc_acc": "5.642e-01", "epoch": 0.01906} {"step": 9535, "loss": 1.4129, "grad_norm": "5.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.727e-01", "anc_loss": "7.750e-01", "dlm_acc": "5.449e-01", "anc_acc": "5.477e-01", "epoch": 0.01907} {"step": 9540, "loss": 1.2651, "grad_norm": "2.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.051e-01", "anc_loss": "7.098e-01", "dlm_acc": "5.741e-01", "anc_acc": "5.707e-01", "epoch": 0.01908} {"step": 9545, "loss": 1.2098, "grad_norm": "6.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.121e-01", "anc_loss": "4.290e-01", "dlm_acc": "8.093e-01", "anc_acc": "8.022e-01", "epoch": 0.01909} {"step": 9550, "loss": 1.1708, "grad_norm": "8.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.900e-01", "anc_loss": "4.160e-01", "dlm_acc": "8.110e-01", "anc_acc": "8.031e-01", "epoch": 0.0191} {"step": 9555, "loss": 0.9113, "grad_norm": "2.485e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.528e-02", "anc_loss": "6.670e-02", "dlm_acc": "9.672e-01", "anc_acc": "9.674e-01", "epoch": 0.01911} {"step": 9560, "loss": 1.4867, "grad_norm": "3.231e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.293e+00", "dlm_acc": "5.980e-01", "anc_acc": "5.890e-01", "epoch": 0.01912} {"step": 9565, "loss": 1.2695, "grad_norm": "3.874e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.218e+00", "dlm_acc": "4.730e-01", "anc_acc": "4.608e-01", "epoch": 0.01913} {"step": 9570, "loss": 1.486, "grad_norm": "3.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.236e-01", "anc_loss": "4.338e-01", "dlm_acc": "7.173e-01", "anc_acc": "7.148e-01", "epoch": 0.01914} {"step": 9575, "loss": 0.8181, "grad_norm": "2.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.121e-01", "anc_loss": "3.297e-01", "dlm_acc": "7.463e-01", "anc_acc": "7.328e-01", "epoch": 0.01915} {"step": 9580, "loss": 1.3521, "grad_norm": "4.263e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.672e-01", "anc_loss": "3.898e-01", "dlm_acc": "8.255e-01", "anc_acc": "8.163e-01", "epoch": 0.01916} {"step": 9585, "loss": 1.3481, "grad_norm": "5.367e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.178e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.578e-01", "epoch": 0.01917} {"step": 9590, "loss": 1.074, "grad_norm": "3.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.034e+00", "anc_loss": "1.059e+00", "dlm_acc": "3.380e-01", "anc_acc": "3.216e-01", "epoch": 0.01918} {"step": 9595, "loss": 1.777, "grad_norm": "6.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.448e+00", "dlm_acc": "3.136e-01", "anc_acc": "3.081e-01", "epoch": 0.01919} {"step": 9600, "loss": 1.2292, "grad_norm": "8.461e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.145e+00", "dlm_acc": "3.264e-01", "anc_acc": "3.245e-01", "epoch": 0.0192} {"step": 9605, "loss": 1.4202, "grad_norm": "2.905e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.220e+00", "dlm_acc": "3.284e-01", "anc_acc": "3.259e-01", "epoch": 0.01921} {"step": 9610, "loss": 1.3662, "grad_norm": "3.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.132e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.817e-01", "epoch": 0.01922} {"step": 9615, "loss": 1.2909, "grad_norm": "2.382e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.734e-01", "anc_loss": "4.840e-01", "dlm_acc": "7.283e-01", "anc_acc": "7.269e-01", "epoch": 0.01923} {"step": 9620, "loss": 1.4589, "grad_norm": "6.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.589e+00", "anc_loss": "1.650e+00", "dlm_acc": "5.677e-01", "anc_acc": "5.574e-01", "epoch": 0.01924} {"step": 9625, "loss": 1.0507, "grad_norm": "3.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.096e-01", "anc_loss": "3.363e-01", "dlm_acc": "8.232e-01", "anc_acc": "8.187e-01", "epoch": 0.01925} {"step": 9630, "loss": 1.0381, "grad_norm": "3.256e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.113e-01", "anc_loss": "7.465e-01", "dlm_acc": "6.690e-01", "anc_acc": "6.599e-01", "epoch": 0.01926} {"step": 9635, "loss": 1.1243, "grad_norm": "2.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.434e-01", "anc_loss": "6.629e-01", "dlm_acc": "6.539e-01", "anc_acc": "6.480e-01", "epoch": 0.01927} {"step": 9640, "loss": 1.3068, "grad_norm": "2.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.664e-01", "anc_loss": "1.023e+00", "dlm_acc": "5.970e-01", "anc_acc": "5.878e-01", "epoch": 0.01928} {"step": 9645, "loss": 1.2549, "grad_norm": "4.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.037e+00", "anc_loss": "1.106e+00", "dlm_acc": "6.661e-01", "anc_acc": "6.533e-01", "epoch": 0.01929} {"step": 9650, "loss": 1.1722, "grad_norm": "6.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.809e-01", "anc_loss": "7.174e-01", "dlm_acc": "6.715e-01", "anc_acc": "6.621e-01", "epoch": 0.0193} {"step": 9655, "loss": 1.0461, "grad_norm": "2.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.371e-01", "anc_loss": "9.600e-01", "dlm_acc": "5.634e-01", "anc_acc": "5.575e-01", "epoch": 0.01931} {"step": 9660, "loss": 1.1225, "grad_norm": "2.818e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.521e-01", "anc_loss": "7.826e-01", "dlm_acc": "6.825e-01", "anc_acc": "6.743e-01", "epoch": 0.01932} {"step": 9665, "loss": 1.304, "grad_norm": "6.110e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.231e-01", "anc_loss": "8.606e-01", "dlm_acc": "6.787e-01", "anc_acc": "6.701e-01", "epoch": 0.01933} {"step": 9670, "loss": 1.58, "grad_norm": "6.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.719e+00", "anc_loss": "1.789e+00", "dlm_acc": "4.250e-01", "anc_acc": "4.121e-01", "epoch": 0.01934} {"step": 9675, "loss": 1.0418, "grad_norm": "3.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.063e+00", "anc_loss": "1.121e+00", "dlm_acc": "6.153e-01", "anc_acc": "6.029e-01", "epoch": 0.01935} {"step": 9680, "loss": 1.2129, "grad_norm": "6.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.132e+00", "dlm_acc": "6.082e-01", "anc_acc": "5.937e-01", "epoch": 0.01936} {"step": 9685, "loss": 1.3989, "grad_norm": "3.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.041e+00", "anc_loss": "1.092e+00", "dlm_acc": "6.233e-01", "anc_acc": "6.123e-01", "epoch": 0.01937} {"step": 9690, "loss": 1.4006, "grad_norm": "5.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.327e-01", "anc_loss": "4.708e-01", "dlm_acc": "8.223e-01", "anc_acc": "8.094e-01", "epoch": 0.01938} {"step": 9695, "loss": 0.9526, "grad_norm": "4.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.951e-01", "anc_loss": "3.104e-01", "dlm_acc": "7.957e-01", "anc_acc": "7.881e-01", "epoch": 0.01939} {"step": 9700, "loss": 1.0178, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.449e-01", "anc_loss": "3.695e-01", "dlm_acc": "7.786e-01", "anc_acc": "7.666e-01", "epoch": 0.0194} {"step": 9705, "loss": 1.1762, "grad_norm": "4.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.451e-01", "anc_loss": "3.797e-01", "dlm_acc": "7.938e-01", "anc_acc": "7.775e-01", "epoch": 0.01941} {"step": 9710, "loss": 1.1035, "grad_norm": "2.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.789e-01", "anc_loss": "7.244e-01", "dlm_acc": "7.540e-01", "anc_acc": "7.407e-01", "epoch": 0.01942} {"step": 9715, "loss": 1.587, "grad_norm": "3.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.559e-01", "anc_loss": "6.824e-01", "dlm_acc": "7.183e-01", "anc_acc": "7.114e-01", "epoch": 0.01943} {"step": 9720, "loss": 1.3513, "grad_norm": "2.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.213e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.752e-01", "anc_acc": "5.599e-01", "epoch": 0.01944} {"step": 9725, "loss": 1.463, "grad_norm": "9.010e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.492e+00", "anc_loss": "1.547e+00", "dlm_acc": "4.352e-01", "anc_acc": "4.270e-01", "epoch": 0.01945} {"step": 9730, "loss": 1.5375, "grad_norm": "7.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e+00", "anc_loss": "1.671e+00", "dlm_acc": "4.544e-01", "anc_acc": "4.457e-01", "epoch": 0.01946} {"step": 9735, "loss": 1.1251, "grad_norm": "5.312e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.611e-01", "anc_loss": "5.962e-01", "dlm_acc": "7.712e-01", "anc_acc": "7.652e-01", "epoch": 0.01947} {"step": 9740, "loss": 0.9961, "grad_norm": "2.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.258e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.424e-01", "anc_acc": "5.280e-01", "epoch": 0.01948} {"step": 9745, "loss": 1.0104, "grad_norm": "4.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.688e-01", "anc_loss": "8.082e-01", "dlm_acc": "6.275e-01", "anc_acc": "6.199e-01", "epoch": 0.01949} {"step": 9750, "loss": 0.7712, "grad_norm": "3.338e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.532e-01", "anc_loss": "3.942e-01", "dlm_acc": "8.457e-01", "anc_acc": "8.342e-01", "epoch": 0.0195} {"step": 9755, "loss": 1.0613, "grad_norm": "8.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.914e-01", "anc_loss": "9.516e-01", "dlm_acc": "6.476e-01", "anc_acc": "6.364e-01", "epoch": 0.01951} {"step": 9760, "loss": 1.2122, "grad_norm": "5.563e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.805e-01", "anc_loss": "7.164e-01", "dlm_acc": "6.987e-01", "anc_acc": "6.920e-01", "epoch": 0.01952} {"step": 9765, "loss": 0.8532, "grad_norm": "4.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.880e-01", "anc_loss": "1.965e-01", "dlm_acc": "8.440e-01", "anc_acc": "8.378e-01", "epoch": 0.01953} {"step": 9770, "loss": 0.8742, "grad_norm": "4.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.125e-01", "anc_loss": "2.256e-01", "dlm_acc": "8.466e-01", "anc_acc": "8.402e-01", "epoch": 0.01954} {"step": 9775, "loss": 0.8972, "grad_norm": "3.780e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.043e-01", "anc_loss": "7.494e-01", "dlm_acc": "7.086e-01", "anc_acc": "6.989e-01", "epoch": 0.01955} {"step": 9780, "loss": 1.5105, "grad_norm": "6.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.134e+00", "dlm_acc": "5.206e-01", "anc_acc": "5.131e-01", "epoch": 0.01956} {"step": 9785, "loss": 1.2016, "grad_norm": "4.244e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.063e-01", "anc_loss": "8.242e-01", "dlm_acc": "4.970e-01", "anc_acc": "4.922e-01", "epoch": 0.01957} {"step": 9790, "loss": 1.22, "grad_norm": "5.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.764e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.595e-01", "anc_acc": "6.444e-01", "epoch": 0.01958} {"step": 9795, "loss": 1.1642, "grad_norm": "5.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.961e-01", "anc_loss": "3.100e-01", "dlm_acc": "7.808e-01", "anc_acc": "7.734e-01", "epoch": 0.01959} {"step": 9800, "loss": 1.563, "grad_norm": "5.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.367e+00", "dlm_acc": "5.711e-01", "anc_acc": "5.583e-01", "epoch": 0.0196} {"step": 9805, "loss": 1.3722, "grad_norm": "1.027e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.758e-01", "anc_loss": "1.017e+00", "dlm_acc": "5.393e-01", "anc_acc": "5.345e-01", "epoch": 0.01961} {"step": 9810, "loss": 1.2083, "grad_norm": "2.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.793e-01", "anc_loss": "7.136e-01", "dlm_acc": "7.236e-01", "anc_acc": "7.168e-01", "epoch": 0.01962} {"step": 9815, "loss": 1.0844, "grad_norm": "5.183e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.850e-01", "anc_loss": "6.153e-01", "dlm_acc": "7.223e-01", "anc_acc": "7.126e-01", "epoch": 0.01963} {"step": 9820, "loss": 1.1877, "grad_norm": "2.273e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.215e+00", "anc_loss": "1.276e+00", "dlm_acc": "5.886e-01", "anc_acc": "5.737e-01", "epoch": 0.01964} {"step": 9825, "loss": 1.6978, "grad_norm": "6.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.614e+00", "anc_loss": "1.703e+00", "dlm_acc": "4.941e-01", "anc_acc": "4.771e-01", "epoch": 0.01965} {"step": 9830, "loss": 1.0691, "grad_norm": "3.019e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.006e+00", "anc_loss": "1.072e+00", "dlm_acc": "5.875e-01", "anc_acc": "5.705e-01", "epoch": 0.01966} {"step": 9835, "loss": 1.2864, "grad_norm": "3.352e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.956e-01", "anc_acc": "5.807e-01", "epoch": 0.01967} {"step": 9840, "loss": 1.5302, "grad_norm": "6.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.272e-01", "anc_acc": "5.100e-01", "epoch": 0.01968} {"step": 9845, "loss": 1.7981, "grad_norm": "4.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.581e+00", "dlm_acc": "5.106e-01", "anc_acc": "4.937e-01", "epoch": 0.01969} {"step": 9850, "loss": 1.3985, "grad_norm": "3.450e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.575e+00", "dlm_acc": "4.932e-01", "anc_acc": "4.802e-01", "epoch": 0.0197} {"step": 9855, "loss": 1.1006, "grad_norm": "7.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.886e-01", "anc_acc": "5.704e-01", "epoch": 0.01971} {"step": 9860, "loss": 1.1407, "grad_norm": "4.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.492e-01", "anc_acc": "5.337e-01", "epoch": 0.01972} {"step": 9865, "loss": 1.062, "grad_norm": "2.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.239e+00", "dlm_acc": "5.626e-01", "anc_acc": "5.450e-01", "epoch": 0.01973} {"step": 9870, "loss": 1.1023, "grad_norm": "3.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.359e-01", "anc_loss": "1.013e+00", "dlm_acc": "6.852e-01", "anc_acc": "6.672e-01", "epoch": 0.01974} {"step": 9875, "loss": 1.3177, "grad_norm": "3.222e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.730e+00", "anc_loss": "1.814e+00", "dlm_acc": "4.644e-01", "anc_acc": "4.515e-01", "epoch": 0.01975} {"step": 9880, "loss": 1.2709, "grad_norm": "3.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.650e-01", "anc_acc": "5.495e-01", "epoch": 0.01976} {"step": 9885, "loss": 1.4456, "grad_norm": "3.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.563e-01", "anc_acc": "5.387e-01", "epoch": 0.01977} {"step": 9890, "loss": 1.4608, "grad_norm": "4.506e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.546e+00", "dlm_acc": "4.797e-01", "anc_acc": "4.635e-01", "epoch": 0.01978} {"step": 9895, "loss": 1.6249, "grad_norm": "4.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.284e+00", "anc_loss": "2.293e+00", "dlm_acc": "1.457e-01", "anc_acc": "1.429e-01", "epoch": 0.01979} {"step": 9900, "loss": 1.7855, "grad_norm": "3.795e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.231e+00", "anc_loss": "2.255e+00", "dlm_acc": "2.012e-01", "anc_acc": "1.970e-01", "epoch": 0.0198} {"step": 9905, "loss": 1.5272, "grad_norm": "3.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.688e+00", "anc_loss": "1.773e+00", "dlm_acc": "5.021e-01", "anc_acc": "4.871e-01", "epoch": 0.01981} {"step": 9910, "loss": 1.1567, "grad_norm": "2.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.824e-01", "anc_loss": "7.055e-01", "dlm_acc": "6.404e-01", "anc_acc": "6.315e-01", "epoch": 0.01982} {"step": 9915, "loss": 1.11, "grad_norm": "3.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.812e-01", "anc_loss": "3.949e-01", "dlm_acc": "7.395e-01", "anc_acc": "7.331e-01", "epoch": 0.01983} {"step": 9920, "loss": 1.6312, "grad_norm": "3.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.279e+00", "dlm_acc": "5.419e-01", "anc_acc": "5.238e-01", "epoch": 0.01984} {"step": 9925, "loss": 1.5404, "grad_norm": "2.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.803e-01", "anc_acc": "5.645e-01", "epoch": 0.01985} {"step": 9930, "loss": 1.285, "grad_norm": "3.576e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.438e-01", "anc_loss": "8.885e-01", "dlm_acc": "7.354e-01", "anc_acc": "7.253e-01", "epoch": 0.01986} {"step": 9935, "loss": 1.8182, "grad_norm": "4.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.334e+00", "anc_loss": "2.367e+00", "dlm_acc": "1.777e-01", "anc_acc": "1.730e-01", "epoch": 0.01987} {"step": 9940, "loss": 1.7624, "grad_norm": "2.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.747e+00", "anc_loss": "2.769e+00", "dlm_acc": "4.065e-02", "anc_acc": "3.908e-02", "epoch": 0.01988} {"step": 9945, "loss": 1.8572, "grad_norm": "4.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.475e+00", "anc_loss": "2.491e+00", "dlm_acc": "1.057e-01", "anc_acc": "1.047e-01", "epoch": 0.01989} {"step": 9950, "loss": 1.9979, "grad_norm": "3.172e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.009e+00", "anc_loss": "2.072e+00", "dlm_acc": "4.120e-01", "anc_acc": "4.035e-01", "epoch": 0.0199} {"step": 9955, "loss": 1.6227, "grad_norm": "3.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.466e+00", "dlm_acc": "4.696e-01", "anc_acc": "4.484e-01", "epoch": 0.01991} {"step": 9960, "loss": 1.452, "grad_norm": "2.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.206e+00", "dlm_acc": "5.430e-01", "anc_acc": "5.119e-01", "epoch": 0.01992} {"step": 9965, "loss": 1.3818, "grad_norm": "3.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.090e+00", "anc_loss": "1.164e+00", "dlm_acc": "5.428e-01", "anc_acc": "5.222e-01", "epoch": 0.01993} {"step": 9970, "loss": 1.2593, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.250e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.206e-01", "anc_acc": "4.987e-01", "epoch": 0.01994} {"step": 9975, "loss": 1.588, "grad_norm": "4.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.623e+00", "dlm_acc": "2.342e-01", "anc_acc": "2.268e-01", "epoch": 0.01995} {"step": 9980, "loss": 1.6351, "grad_norm": "4.719e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.566e+00", "dlm_acc": "1.457e-01", "anc_acc": "1.416e-01", "epoch": 0.01996} {"step": 9985, "loss": 1.3844, "grad_norm": "4.378e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.484e+00", "dlm_acc": "3.434e-01", "anc_acc": "3.296e-01", "epoch": 0.01997} {"step": 9990, "loss": 1.3846, "grad_norm": "2.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.490e+00", "dlm_acc": "5.042e-01", "anc_acc": "4.866e-01", "epoch": 0.01998} {"step": 9995, "loss": 1.6188, "grad_norm": "3.053e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.660e+00", "dlm_acc": "4.583e-01", "anc_acc": "4.453e-01", "epoch": 0.01999} {"step": 10000, "loss": 1.3248, "grad_norm": "2.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.855e-01", "anc_loss": "8.389e-01", "dlm_acc": "6.531e-01", "anc_acc": "6.390e-01", "epoch": 0.02} {"step": 10005, "loss": 1.7156, "grad_norm": "5.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.375e+00", "dlm_acc": "5.848e-01", "anc_acc": "5.746e-01", "epoch": 0.02001} {"step": 10010, "loss": 1.0176, "grad_norm": "5.718e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.838e-01", "anc_loss": "5.156e-01", "dlm_acc": "8.367e-01", "anc_acc": "8.319e-01", "epoch": 0.02002} {"step": 10015, "loss": 1.1735, "grad_norm": "3.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.471e+00", "anc_loss": "1.534e+00", "dlm_acc": "4.995e-01", "anc_acc": "4.827e-01", "epoch": 0.02003} {"step": 10020, "loss": 1.4083, "grad_norm": "6.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.243e+00", "dlm_acc": "4.532e-01", "anc_acc": "4.376e-01", "epoch": 0.02004} {"step": 10025, "loss": 1.308, "grad_norm": "2.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.238e+00", "dlm_acc": "5.628e-01", "anc_acc": "5.429e-01", "epoch": 0.02005} {"step": 10030, "loss": 1.3686, "grad_norm": "3.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.332e-01", "anc_acc": "5.215e-01", "epoch": 0.02006} {"step": 10035, "loss": 1.2037, "grad_norm": "3.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.131e+00", "dlm_acc": "5.764e-01", "anc_acc": "5.627e-01", "epoch": 0.02007} {"step": 10040, "loss": 1.2115, "grad_norm": "5.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.119e+00", "dlm_acc": "5.578e-01", "anc_acc": "5.477e-01", "epoch": 0.02008} {"step": 10045, "loss": 1.6221, "grad_norm": "4.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.047e-01", "anc_acc": "4.896e-01", "epoch": 0.02009} {"step": 10050, "loss": 1.3113, "grad_norm": "3.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.536e+00", "anc_loss": "1.631e+00", "dlm_acc": "4.976e-01", "anc_acc": "4.800e-01", "epoch": 0.0201} {"step": 10055, "loss": 1.0953, "grad_norm": "3.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.202e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.349e-01", "epoch": 0.02011} {"step": 10060, "loss": 1.5965, "grad_norm": "4.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.635e+00", "anc_loss": "1.727e+00", "dlm_acc": "5.015e-01", "anc_acc": "4.834e-01", "epoch": 0.02012} {"step": 10065, "loss": 1.4611, "grad_norm": "3.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.560e+00", "dlm_acc": "4.090e-01", "anc_acc": "3.973e-01", "epoch": 0.02013} {"step": 10070, "loss": 0.9554, "grad_norm": "2.626e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.613e-01", "anc_loss": "8.879e-01", "dlm_acc": "5.687e-01", "anc_acc": "5.570e-01", "epoch": 0.02014} {"step": 10075, "loss": 1.1172, "grad_norm": "3.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.766e-01", "anc_loss": "1.027e+00", "dlm_acc": "5.722e-01", "anc_acc": "5.604e-01", "epoch": 0.02015} {"step": 10080, "loss": 1.3939, "grad_norm": "6.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.627e+00", "dlm_acc": "5.195e-01", "anc_acc": "4.981e-01", "epoch": 0.02016} {"step": 10085, "loss": 1.19, "grad_norm": "2.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.664e+00", "dlm_acc": "4.900e-01", "anc_acc": "4.714e-01", "epoch": 0.02017} {"step": 10090, "loss": 1.7229, "grad_norm": "3.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.436e+00", "anc_loss": "2.459e+00", "dlm_acc": "1.640e-01", "anc_acc": "1.612e-01", "epoch": 0.02018} {"step": 10095, "loss": 1.3674, "grad_norm": "3.619e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.439e-01", "anc_acc": "5.317e-01", "epoch": 0.02019} {"step": 10100, "loss": 1.5884, "grad_norm": "3.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.311e+00", "dlm_acc": "6.286e-01", "anc_acc": "6.207e-01", "epoch": 0.0202} {"step": 10105, "loss": 1.5225, "grad_norm": "2.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.478e+00", "anc_loss": "1.568e+00", "dlm_acc": "5.479e-01", "anc_acc": "5.328e-01", "epoch": 0.02021} {"step": 10110, "loss": 1.2799, "grad_norm": "2.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.276e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.423e-01", "epoch": 0.02022} {"step": 10115, "loss": 1.1954, "grad_norm": "3.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.849e-01", "anc_loss": "9.357e-01", "dlm_acc": "6.710e-01", "anc_acc": "6.592e-01", "epoch": 0.02023} {"step": 10120, "loss": 1.3845, "grad_norm": "3.685e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.269e+00", "dlm_acc": "5.897e-01", "anc_acc": "5.682e-01", "epoch": 0.02024} {"step": 10125, "loss": 1.073, "grad_norm": "1.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.168e-01", "anc_loss": "9.777e-01", "dlm_acc": "6.055e-01", "anc_acc": "5.882e-01", "epoch": 0.02025} {"step": 10130, "loss": 1.4288, "grad_norm": "3.261e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.116e+00", "dlm_acc": "3.714e-01", "anc_acc": "3.660e-01", "epoch": 0.02026} {"step": 10135, "loss": 1.3413, "grad_norm": "5.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.149e+00", "dlm_acc": "5.822e-01", "anc_acc": "5.720e-01", "epoch": 0.02027} {"step": 10140, "loss": 1.3941, "grad_norm": "6.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.102e-01", "anc_loss": "8.836e-01", "dlm_acc": "6.329e-01", "anc_acc": "6.112e-01", "epoch": 0.02028} {"step": 10145, "loss": 0.9245, "grad_norm": "4.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.146e-01", "anc_loss": "4.453e-01", "dlm_acc": "8.286e-01", "anc_acc": "8.170e-01", "epoch": 0.02029} {"step": 10150, "loss": 1.3518, "grad_norm": "5.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.010e+00", "anc_loss": "1.052e+00", "dlm_acc": "5.342e-01", "anc_acc": "5.232e-01", "epoch": 0.0203} {"step": 10155, "loss": 1.4329, "grad_norm": "3.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.571e-01", "anc_acc": "5.453e-01", "epoch": 0.02031} {"step": 10160, "loss": 1.1608, "grad_norm": "3.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.422e-01", "anc_loss": "6.602e-01", "dlm_acc": "5.869e-01", "anc_acc": "5.799e-01", "epoch": 0.02032} {"step": 10165, "loss": 1.5094, "grad_norm": "4.719e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.694e+00", "anc_loss": "1.780e+00", "dlm_acc": "4.900e-01", "anc_acc": "4.733e-01", "epoch": 0.02033} {"step": 10170, "loss": 1.5025, "grad_norm": "3.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.542e+00", "dlm_acc": "5.666e-01", "anc_acc": "5.518e-01", "epoch": 0.02034} {"step": 10175, "loss": 1.2296, "grad_norm": "2.540e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.141e-01", "anc_loss": "8.445e-01", "dlm_acc": "5.977e-01", "anc_acc": "5.880e-01", "epoch": 0.02035} {"step": 10180, "loss": 1.0887, "grad_norm": "4.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.625e-01", "anc_loss": "6.852e-01", "dlm_acc": "5.894e-01", "anc_acc": "5.762e-01", "epoch": 0.02036} {"step": 10185, "loss": 1.1663, "grad_norm": "3.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.087e+00", "dlm_acc": "6.189e-01", "anc_acc": "5.981e-01", "epoch": 0.02037} {"step": 10190, "loss": 1.4509, "grad_norm": "3.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.422e+00", "dlm_acc": "4.872e-01", "anc_acc": "4.755e-01", "epoch": 0.02038} {"step": 10195, "loss": 0.9942, "grad_norm": "1.114e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.234e-01", "anc_loss": "6.707e-01", "dlm_acc": "6.807e-01", "anc_acc": "6.660e-01", "epoch": 0.02039} {"step": 10200, "loss": 1.2551, "grad_norm": "3.320e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.639e-01", "anc_loss": "2.834e-01", "dlm_acc": "8.730e-01", "anc_acc": "8.654e-01", "epoch": 0.0204} {"step": 10205, "loss": 1.213, "grad_norm": "3.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.145e-01", "anc_loss": "6.535e-01", "dlm_acc": "6.506e-01", "anc_acc": "6.319e-01", "epoch": 0.02041} {"step": 10210, "loss": 0.9981, "grad_norm": "2.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.297e-01", "anc_loss": "8.809e-01", "dlm_acc": "6.445e-01", "anc_acc": "6.317e-01", "epoch": 0.02042} {"step": 10215, "loss": 1.0925, "grad_norm": "4.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.945e-01", "anc_loss": "5.184e-01", "dlm_acc": "7.767e-01", "anc_acc": "7.678e-01", "epoch": 0.02043} {"step": 10220, "loss": 1.2606, "grad_norm": "2.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.779e-01", "anc_loss": "1.031e+00", "dlm_acc": "6.283e-01", "anc_acc": "6.140e-01", "epoch": 0.02044} {"step": 10225, "loss": 1.258, "grad_norm": "4.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.393e-01", "anc_loss": "8.759e-01", "dlm_acc": "6.215e-01", "anc_acc": "6.091e-01", "epoch": 0.02045} {"step": 10230, "loss": 1.2123, "grad_norm": "1.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.191e-01", "anc_loss": "9.750e-01", "dlm_acc": "6.144e-01", "anc_acc": "6.014e-01", "epoch": 0.02046} {"step": 10235, "loss": 1.2964, "grad_norm": "5.159e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.105e+00", "dlm_acc": "5.759e-01", "anc_acc": "5.633e-01", "epoch": 0.02047} {"step": 10240, "loss": 1.3325, "grad_norm": "3.208e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.111e-01", "anc_acc": "4.971e-01", "epoch": 0.02048} {"step": 10245, "loss": 1.0854, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.992e-01", "anc_loss": "7.336e-01", "dlm_acc": "6.045e-01", "anc_acc": "5.944e-01", "epoch": 0.02049} {"step": 10250, "loss": 1.4011, "grad_norm": "3.061e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.202e+00", "dlm_acc": "5.668e-01", "anc_acc": "5.536e-01", "epoch": 0.0205} {"step": 10255, "loss": 1.0152, "grad_norm": "1.894e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.354e-01", "anc_loss": "5.687e-01", "dlm_acc": "7.134e-01", "anc_acc": "6.972e-01", "epoch": 0.02051} {"step": 10260, "loss": 1.2775, "grad_norm": "4.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.926e-01", "anc_loss": "8.461e-01", "dlm_acc": "6.483e-01", "anc_acc": "6.343e-01", "epoch": 0.02052} {"step": 10265, "loss": 1.4785, "grad_norm": "4.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.984e-01", "anc_loss": "8.203e-01", "dlm_acc": "4.802e-01", "anc_acc": "4.731e-01", "epoch": 0.02053} {"step": 10270, "loss": 1.5033, "grad_norm": "4.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.146e+00", "dlm_acc": "5.788e-01", "anc_acc": "5.643e-01", "epoch": 0.02054} {"step": 10275, "loss": 1.2054, "grad_norm": "3.676e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.609e-01", "anc_acc": "5.491e-01", "epoch": 0.02055} {"step": 10280, "loss": 0.9516, "grad_norm": "3.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.169e+00", "anc_loss": "1.233e+00", "dlm_acc": "5.375e-01", "anc_acc": "5.234e-01", "epoch": 0.02056} {"step": 10285, "loss": 1.2859, "grad_norm": "4.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e+00", "anc_loss": "1.540e+00", "dlm_acc": "5.027e-01", "anc_acc": "4.900e-01", "epoch": 0.02057} {"step": 10290, "loss": 1.1223, "grad_norm": "4.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.553e+00", "dlm_acc": "5.045e-01", "anc_acc": "4.890e-01", "epoch": 0.02058} {"step": 10295, "loss": 1.1892, "grad_norm": "1.952e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.484e+00", "anc_loss": "1.564e+00", "dlm_acc": "5.096e-01", "anc_acc": "4.919e-01", "epoch": 0.02059} {"step": 10300, "loss": 1.0974, "grad_norm": "4.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.222e+00", "dlm_acc": "5.877e-01", "anc_acc": "5.701e-01", "epoch": 0.0206} {"step": 10305, "loss": 1.4512, "grad_norm": "3.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.181e+00", "anc_loss": "1.247e+00", "dlm_acc": "5.381e-01", "anc_acc": "5.233e-01", "epoch": 0.02061} {"step": 10310, "loss": 1.5316, "grad_norm": "4.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.791e+00", "anc_loss": "1.856e+00", "dlm_acc": "4.174e-01", "anc_acc": "4.052e-01", "epoch": 0.02062} {"step": 10315, "loss": 1.2279, "grad_norm": "2.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.356e+00", "anc_loss": "1.421e+00", "dlm_acc": "5.242e-01", "anc_acc": "5.106e-01", "epoch": 0.02063} {"step": 10320, "loss": 1.1397, "grad_norm": "2.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.850e-01", "anc_acc": "5.690e-01", "epoch": 0.02064} {"step": 10325, "loss": 0.9142, "grad_norm": "2.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.580e-01", "anc_acc": "5.431e-01", "epoch": 0.02065} {"step": 10330, "loss": 0.696, "grad_norm": "2.252e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.166e+00", "dlm_acc": "5.782e-01", "anc_acc": "5.619e-01", "epoch": 0.02066} {"step": 10335, "loss": 1.2403, "grad_norm": "4.101e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.680e+00", "anc_loss": "1.753e+00", "dlm_acc": "4.633e-01", "anc_acc": "4.499e-01", "epoch": 0.02067} {"step": 10340, "loss": 0.9607, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.201e+00", "dlm_acc": "6.047e-01", "anc_acc": "5.885e-01", "epoch": 0.02068} {"step": 10345, "loss": 1.1666, "grad_norm": "3.873e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.425e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.864e-01", "epoch": 0.02069} {"step": 10350, "loss": 1.6201, "grad_norm": "3.321e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.524e+00", "dlm_acc": "5.644e-01", "anc_acc": "5.487e-01", "epoch": 0.0207} {"step": 10355, "loss": 0.9869, "grad_norm": "2.956e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.855e-01", "anc_loss": "1.058e+00", "dlm_acc": "6.266e-01", "anc_acc": "6.072e-01", "epoch": 0.02071} {"step": 10360, "loss": 0.9823, "grad_norm": "2.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.957e-01", "anc_acc": "5.780e-01", "epoch": 0.02072} {"step": 10365, "loss": 0.9706, "grad_norm": "3.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.383e+00", "dlm_acc": "5.762e-01", "anc_acc": "5.612e-01", "epoch": 0.02073} {"step": 10370, "loss": 0.9283, "grad_norm": "2.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.256e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.694e-01", "anc_acc": "5.534e-01", "epoch": 0.02074} {"step": 10375, "loss": 0.9344, "grad_norm": "2.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.166e+00", "dlm_acc": "5.865e-01", "anc_acc": "5.698e-01", "epoch": 0.02075} {"step": 10380, "loss": 1.0444, "grad_norm": "4.583e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.273e-01", "anc_loss": "8.812e-01", "dlm_acc": "6.520e-01", "anc_acc": "6.386e-01", "epoch": 0.02076} {"step": 10385, "loss": 1.4283, "grad_norm": "3.761e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.332e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.629e-01", "anc_acc": "5.462e-01", "epoch": 0.02077} {"step": 10390, "loss": 1.3913, "grad_norm": "3.737e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.294e+00", "anc_loss": "1.371e+00", "dlm_acc": "5.795e-01", "anc_acc": "5.656e-01", "epoch": 0.02078} {"step": 10395, "loss": 1.2623, "grad_norm": "2.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.207e+00", "anc_loss": "1.276e+00", "dlm_acc": "5.651e-01", "anc_acc": "5.504e-01", "epoch": 0.02079} {"step": 10400, "loss": 1.3757, "grad_norm": "3.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.356e+00", "dlm_acc": "5.526e-01", "anc_acc": "5.379e-01", "epoch": 0.0208} {"step": 10405, "loss": 1.4239, "grad_norm": "5.757e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.173e-01", "anc_acc": "5.031e-01", "epoch": 0.02081} {"step": 10410, "loss": 1.1149, "grad_norm": "3.877e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.180e+00", "dlm_acc": "5.320e-01", "anc_acc": "5.173e-01", "epoch": 0.02082} {"step": 10415, "loss": 1.2247, "grad_norm": "1.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.318e-01", "anc_acc": "5.161e-01", "epoch": 0.02083} {"step": 10420, "loss": 1.5666, "grad_norm": "3.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.566e+00", "anc_loss": "1.637e+00", "dlm_acc": "4.692e-01", "anc_acc": "4.576e-01", "epoch": 0.02084} {"step": 10425, "loss": 1.3, "grad_norm": "4.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.947e-01", "anc_loss": "7.549e-01", "dlm_acc": "7.477e-01", "anc_acc": "7.376e-01", "epoch": 0.02085} {"step": 10430, "loss": 1.5706, "grad_norm": "4.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.850e+00", "anc_loss": "1.916e+00", "dlm_acc": "4.135e-01", "anc_acc": "4.015e-01", "epoch": 0.02086} {"step": 10435, "loss": 1.6297, "grad_norm": "5.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.444e+00", "anc_loss": "1.481e+00", "dlm_acc": "5.473e-01", "anc_acc": "5.376e-01", "epoch": 0.02087} {"step": 10440, "loss": 1.0887, "grad_norm": "3.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.215e-01", "anc_loss": "7.677e-01", "dlm_acc": "7.290e-01", "anc_acc": "7.147e-01", "epoch": 0.02088} {"step": 10445, "loss": 1.063, "grad_norm": "4.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.248e+00", "dlm_acc": "6.054e-01", "anc_acc": "5.894e-01", "epoch": 0.02089} {"step": 10450, "loss": 1.3004, "grad_norm": "3.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.428e+00", "dlm_acc": "5.113e-01", "anc_acc": "4.973e-01", "epoch": 0.0209} {"step": 10455, "loss": 1.3522, "grad_norm": "3.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.390e+00", "dlm_acc": "5.246e-01", "anc_acc": "5.115e-01", "epoch": 0.02091} {"step": 10460, "loss": 1.4277, "grad_norm": "3.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.459e+00", "anc_loss": "1.536e+00", "dlm_acc": "5.203e-01", "anc_acc": "5.054e-01", "epoch": 0.02092} {"step": 10465, "loss": 1.3078, "grad_norm": "2.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.520e+00", "anc_loss": "1.600e+00", "dlm_acc": "4.442e-01", "anc_acc": "4.299e-01", "epoch": 0.02093} {"step": 10470, "loss": 1.5488, "grad_norm": "3.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.856e-01", "anc_acc": "5.710e-01", "epoch": 0.02094} {"step": 10475, "loss": 1.5019, "grad_norm": "1.509e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.645e+00", "dlm_acc": "4.666e-01", "anc_acc": "4.505e-01", "epoch": 0.02095} {"step": 10480, "loss": 1.3861, "grad_norm": "3.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.272e-01", "anc_acc": "5.150e-01", "epoch": 0.02096} {"step": 10485, "loss": 2.1396, "grad_norm": "5.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.983e+00", "anc_loss": "2.070e+00", "dlm_acc": "4.275e-01", "anc_acc": "4.124e-01", "epoch": 0.02097} {"step": 10490, "loss": 1.3851, "grad_norm": "1.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.315e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.547e-01", "anc_acc": "5.384e-01", "epoch": 0.02098} {"step": 10495, "loss": 1.4533, "grad_norm": "4.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.250e+00", "dlm_acc": "5.525e-01", "anc_acc": "5.389e-01", "epoch": 0.02099} {"step": 10500, "loss": 1.5255, "grad_norm": "8.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.900e-01", "anc_acc": "5.722e-01", "epoch": 0.021} {"step": 10505, "loss": 1.3675, "grad_norm": "2.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.169e+00", "anc_loss": "1.247e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.718e-01", "epoch": 0.02101} {"step": 10510, "loss": 1.3432, "grad_norm": "2.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.196e+00", "dlm_acc": "6.085e-01", "anc_acc": "5.914e-01", "epoch": 0.02102} {"step": 10515, "loss": 1.5613, "grad_norm": "2.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.360e+00", "anc_loss": "1.436e+00", "dlm_acc": "5.864e-01", "anc_acc": "5.680e-01", "epoch": 0.02103} {"step": 10520, "loss": 1.3252, "grad_norm": "3.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.533e+00", "anc_loss": "1.606e+00", "dlm_acc": "5.066e-01", "anc_acc": "4.928e-01", "epoch": 0.02104} {"step": 10525, "loss": 1.1962, "grad_norm": "1.003e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.018e+00", "anc_loss": "1.063e+00", "dlm_acc": "5.953e-01", "anc_acc": "5.860e-01", "epoch": 0.02105} {"step": 10530, "loss": 1.2501, "grad_norm": "4.491e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.965e-01", "anc_loss": "1.079e+00", "dlm_acc": "6.469e-01", "anc_acc": "6.270e-01", "epoch": 0.02106} {"step": 10535, "loss": 1.3594, "grad_norm": "4.202e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.726e-01", "anc_acc": "5.532e-01", "epoch": 0.02107} {"step": 10540, "loss": 1.1361, "grad_norm": "3.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.034e+00", "anc_loss": "1.108e+00", "dlm_acc": "6.515e-01", "anc_acc": "6.340e-01", "epoch": 0.02108} {"step": 10545, "loss": 0.9553, "grad_norm": "3.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.211e-01", "anc_loss": "9.805e-01", "dlm_acc": "6.453e-01", "anc_acc": "6.295e-01", "epoch": 0.02109} {"step": 10550, "loss": 0.7308, "grad_norm": "2.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.112e+00", "dlm_acc": "5.972e-01", "anc_acc": "5.810e-01", "epoch": 0.0211} {"step": 10555, "loss": 0.9539, "grad_norm": "3.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e+00", "anc_loss": "1.239e+00", "dlm_acc": "6.144e-01", "anc_acc": "5.966e-01", "epoch": 0.02111} {"step": 10560, "loss": 0.8642, "grad_norm": "2.159e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.051e+00", "anc_loss": "1.114e+00", "dlm_acc": "5.937e-01", "anc_acc": "5.786e-01", "epoch": 0.02112} {"step": 10565, "loss": 1.0837, "grad_norm": "3.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.170e+00", "dlm_acc": "6.296e-01", "anc_acc": "6.159e-01", "epoch": 0.02113} {"step": 10570, "loss": 1.2815, "grad_norm": "7.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.090e+00", "anc_loss": "1.172e+00", "dlm_acc": "6.373e-01", "anc_acc": "6.188e-01", "epoch": 0.02114} {"step": 10575, "loss": 1.3994, "grad_norm": "4.201e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.379e+00", "dlm_acc": "5.670e-01", "anc_acc": "5.535e-01", "epoch": 0.02115} {"step": 10580, "loss": 1.3216, "grad_norm": "8.818e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.424e-01", "anc_acc": "5.288e-01", "epoch": 0.02116} {"step": 10585, "loss": 1.0613, "grad_norm": "4.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.673e+00", "anc_loss": "1.748e+00", "dlm_acc": "4.610e-01", "anc_acc": "4.462e-01", "epoch": 0.02117} {"step": 10590, "loss": 1.1288, "grad_norm": "4.848e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.867e+00", "anc_loss": "1.958e+00", "dlm_acc": "4.661e-01", "anc_acc": "4.514e-01", "epoch": 0.02118} {"step": 10595, "loss": 1.4998, "grad_norm": "4.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.891e+00", "anc_loss": "1.966e+00", "dlm_acc": "4.548e-01", "anc_acc": "4.426e-01", "epoch": 0.02119} {"step": 10600, "loss": 1.248, "grad_norm": "2.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.681e+00", "dlm_acc": "4.926e-01", "anc_acc": "4.772e-01", "epoch": 0.0212} {"step": 10605, "loss": 1.1134, "grad_norm": "2.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.321e+00", "dlm_acc": "5.897e-01", "anc_acc": "5.711e-01", "epoch": 0.02121} {"step": 10610, "loss": 1.2327, "grad_norm": "3.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.124e+00", "anc_loss": "1.201e+00", "dlm_acc": "6.093e-01", "anc_acc": "5.912e-01", "epoch": 0.02122} {"step": 10615, "loss": 1.2039, "grad_norm": "2.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.138e+00", "dlm_acc": "5.939e-01", "anc_acc": "5.757e-01", "epoch": 0.02123} {"step": 10620, "loss": 1.2204, "grad_norm": "3.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.650e+00", "dlm_acc": "4.766e-01", "anc_acc": "4.593e-01", "epoch": 0.02124} {"step": 10625, "loss": 1.55, "grad_norm": "3.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.623e+00", "dlm_acc": "4.822e-01", "anc_acc": "4.698e-01", "epoch": 0.02125} {"step": 10630, "loss": 1.45, "grad_norm": "8.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.398e+00", "anc_loss": "1.467e+00", "dlm_acc": "5.180e-01", "anc_acc": "5.038e-01", "epoch": 0.02126} {"step": 10635, "loss": 1.2012, "grad_norm": "2.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.459e+00", "anc_loss": "1.525e+00", "dlm_acc": "4.980e-01", "anc_acc": "4.831e-01", "epoch": 0.02127} {"step": 10640, "loss": 1.4552, "grad_norm": "3.294e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.891e+00", "anc_loss": "1.944e+00", "dlm_acc": "3.448e-01", "anc_acc": "3.345e-01", "epoch": 0.02128} {"step": 10645, "loss": 1.1926, "grad_norm": "6.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.672e-01", "anc_loss": "7.125e-01", "dlm_acc": "7.284e-01", "anc_acc": "7.199e-01", "epoch": 0.02129} {"step": 10650, "loss": 1.4659, "grad_norm": "3.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.249e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.844e-01", "anc_acc": "5.682e-01", "epoch": 0.0213} {"step": 10655, "loss": 1.2675, "grad_norm": "3.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.529e-01", "anc_loss": "1.013e+00", "dlm_acc": "6.283e-01", "anc_acc": "6.170e-01", "epoch": 0.02131} {"step": 10660, "loss": 1.0843, "grad_norm": "3.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.865e-01", "anc_loss": "9.377e-01", "dlm_acc": "6.477e-01", "anc_acc": "6.377e-01", "epoch": 0.02132} {"step": 10665, "loss": 1.0023, "grad_norm": "1.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.277e-01", "anc_loss": "5.434e-01", "dlm_acc": "6.195e-01", "anc_acc": "6.097e-01", "epoch": 0.02133} {"step": 10670, "loss": 1.2674, "grad_norm": "5.560e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.742e-01", "anc_loss": "9.180e-01", "dlm_acc": "6.324e-01", "anc_acc": "6.277e-01", "epoch": 0.02134} {"step": 10675, "loss": 0.9648, "grad_norm": "4.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.481e+00", "dlm_acc": "3.736e-01", "anc_acc": "3.680e-01", "epoch": 0.02135} {"step": 10680, "loss": 1.324, "grad_norm": "4.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.179e+00", "dlm_acc": "5.210e-01", "anc_acc": "5.047e-01", "epoch": 0.02136} {"step": 10685, "loss": 1.3545, "grad_norm": "4.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.236e+00", "dlm_acc": "5.452e-01", "anc_acc": "5.228e-01", "epoch": 0.02137} {"step": 10690, "loss": 1.1726, "grad_norm": "3.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.089e+00", "anc_loss": "1.159e+00", "dlm_acc": "4.984e-01", "anc_acc": "4.783e-01", "epoch": 0.02138} {"step": 10695, "loss": 1.6435, "grad_norm": "7.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.666e+00", "dlm_acc": "3.650e-01", "anc_acc": "3.509e-01", "epoch": 0.02139} {"step": 10700, "loss": 1.4034, "grad_norm": "1.797e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.531e+00", "dlm_acc": "4.234e-01", "anc_acc": "4.027e-01", "epoch": 0.0214} {"step": 10705, "loss": 1.1258, "grad_norm": "3.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.323e+00", "dlm_acc": "4.786e-01", "anc_acc": "4.535e-01", "epoch": 0.02141} {"step": 10710, "loss": 1.0656, "grad_norm": "3.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.152e+00", "dlm_acc": "5.484e-01", "anc_acc": "5.189e-01", "epoch": 0.02142} {"step": 10715, "loss": 1.2322, "grad_norm": "2.778e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.439e-01", "anc_acc": "5.282e-01", "epoch": 0.02143} {"step": 10720, "loss": 1.1914, "grad_norm": "5.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.382e+00", "anc_loss": "1.457e+00", "dlm_acc": "4.626e-01", "anc_acc": "4.433e-01", "epoch": 0.02144} {"step": 10725, "loss": 1.1064, "grad_norm": "3.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.578e-01", "anc_loss": "1.012e+00", "dlm_acc": "5.981e-01", "anc_acc": "5.864e-01", "epoch": 0.02145} {"step": 10730, "loss": 1.374, "grad_norm": "6.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.660e+00", "anc_loss": "1.723e+00", "dlm_acc": "3.787e-01", "anc_acc": "3.661e-01", "epoch": 0.02146} {"step": 10735, "loss": 1.6016, "grad_norm": "3.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.376e+00", "anc_loss": "2.404e+00", "dlm_acc": "1.976e-01", "anc_acc": "1.871e-01", "epoch": 0.02147} {"step": 10740, "loss": 0.8496, "grad_norm": "3.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.460e+00", "dlm_acc": "5.119e-01", "anc_acc": "4.947e-01", "epoch": 0.02148} {"step": 10745, "loss": 1.0009, "grad_norm": "4.623e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.388e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.401e-01", "anc_acc": "5.263e-01", "epoch": 0.02149} {"step": 10750, "loss": 1.1072, "grad_norm": "2.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.145e+00", "dlm_acc": "6.461e-01", "anc_acc": "6.256e-01", "epoch": 0.0215} {"step": 10755, "loss": 1.1037, "grad_norm": "5.230e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.941e-01", "anc_loss": "7.625e-01", "dlm_acc": "6.999e-01", "anc_acc": "6.837e-01", "epoch": 0.02151} {"step": 10760, "loss": 1.0404, "grad_norm": "2.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.508e-01", "anc_loss": "1.007e+00", "dlm_acc": "6.059e-01", "anc_acc": "5.938e-01", "epoch": 0.02152} {"step": 10765, "loss": 1.2073, "grad_norm": "7.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.328e-01", "anc_loss": "7.814e-01", "dlm_acc": "7.692e-01", "anc_acc": "7.587e-01", "epoch": 0.02153} {"step": 10770, "loss": 1.1115, "grad_norm": "5.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.221e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.011e-01", "anc_acc": "4.865e-01", "epoch": 0.02154} {"step": 10775, "loss": 1.4311, "grad_norm": "6.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.263e-01", "epoch": 0.02155} {"step": 10780, "loss": 0.9742, "grad_norm": "4.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.000e-01", "anc_loss": "9.840e-01", "dlm_acc": "5.897e-01", "anc_acc": "5.613e-01", "epoch": 0.02156} {"step": 10785, "loss": 0.8767, "grad_norm": "4.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.250e-01", "anc_loss": "7.500e-01", "dlm_acc": "5.278e-01", "anc_acc": "5.168e-01", "epoch": 0.02157} {"step": 10790, "loss": 1.1931, "grad_norm": "4.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.163e+00", "dlm_acc": "4.129e-01", "anc_acc": "4.026e-01", "epoch": 0.02158} {"step": 10795, "loss": 1.276, "grad_norm": "4.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.667e-01", "anc_loss": "8.073e-01", "dlm_acc": "5.759e-01", "anc_acc": "5.669e-01", "epoch": 0.02159} {"step": 10800, "loss": 1.3503, "grad_norm": "4.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.299e+00", "anc_loss": "1.369e+00", "dlm_acc": "5.281e-01", "anc_acc": "5.159e-01", "epoch": 0.0216} {"step": 10805, "loss": 1.1427, "grad_norm": "3.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.097e+00", "dlm_acc": "5.793e-01", "anc_acc": "5.693e-01", "epoch": 0.02161} {"step": 10810, "loss": 1.2304, "grad_norm": "3.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.488e+00", "dlm_acc": "4.945e-01", "anc_acc": "4.811e-01", "epoch": 0.02162} {"step": 10815, "loss": 1.771, "grad_norm": "3.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.442e+00", "anc_loss": "1.499e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.407e-01", "epoch": 0.02163} {"step": 10820, "loss": 1.1644, "grad_norm": "4.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.247e+00", "dlm_acc": "5.664e-01", "anc_acc": "5.524e-01", "epoch": 0.02164} {"step": 10825, "loss": 1.5365, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.040e-01", "anc_acc": "4.805e-01", "epoch": 0.02165} {"step": 10830, "loss": 1.2247, "grad_norm": "7.161e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.248e+00", "dlm_acc": "5.356e-01", "anc_acc": "5.232e-01", "epoch": 0.02166} {"step": 10835, "loss": 1.2803, "grad_norm": "1.528e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.745e+00", "anc_loss": "1.817e+00", "dlm_acc": "4.230e-01", "anc_acc": "4.088e-01", "epoch": 0.02167} {"step": 10840, "loss": 1.2025, "grad_norm": "3.122e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.579e+00", "anc_loss": "1.635e+00", "dlm_acc": "4.384e-01", "anc_acc": "4.277e-01", "epoch": 0.02168} {"step": 10845, "loss": 1.3106, "grad_norm": "5.365e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.860e+00", "anc_loss": "1.891e+00", "dlm_acc": "3.233e-01", "anc_acc": "3.181e-01", "epoch": 0.02169} {"step": 10850, "loss": 1.3653, "grad_norm": "5.626e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.181e+00", "anc_loss": "2.239e+00", "dlm_acc": "2.980e-01", "anc_acc": "2.879e-01", "epoch": 0.0217} {"step": 10855, "loss": 1.0073, "grad_norm": "3.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.034e+00", "anc_loss": "1.078e+00", "dlm_acc": "5.936e-01", "anc_acc": "5.862e-01", "epoch": 0.02171} {"step": 10860, "loss": 0.986, "grad_norm": "5.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.418e-01", "anc_loss": "5.621e-01", "dlm_acc": "6.190e-01", "anc_acc": "6.068e-01", "epoch": 0.02172} {"step": 10865, "loss": 1.1257, "grad_norm": "9.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.483e-01", "anc_acc": "5.345e-01", "epoch": 0.02173} {"step": 10870, "loss": 1.2949, "grad_norm": "4.170e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.947e+00", "anc_loss": "1.995e+00", "dlm_acc": "3.408e-01", "anc_acc": "3.334e-01", "epoch": 0.02174} {"step": 10875, "loss": 1.4234, "grad_norm": "9.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.938e-01", "anc_loss": "9.777e-01", "dlm_acc": "6.541e-01", "anc_acc": "6.366e-01", "epoch": 0.02175} {"step": 10880, "loss": 0.7807, "grad_norm": "5.038e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.169e-01", "anc_loss": "1.303e-01", "dlm_acc": "9.405e-01", "anc_acc": "9.360e-01", "epoch": 0.02176} {"step": 10885, "loss": 1.2519, "grad_norm": "3.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.847e-01", "anc_acc": "5.749e-01", "epoch": 0.02177} {"step": 10890, "loss": 1.6229, "grad_norm": "3.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.392e+00", "anc_loss": "2.445e+00", "dlm_acc": "2.524e-01", "anc_acc": "2.433e-01", "epoch": 0.02178} {"step": 10895, "loss": 2.1444, "grad_norm": "5.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.847e+00", "anc_loss": "2.866e+00", "dlm_acc": "3.157e-02", "anc_acc": "3.084e-02", "epoch": 0.02179} {"step": 10900, "loss": 1.9195, "grad_norm": "5.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.769e+00", "anc_loss": "1.845e+00", "dlm_acc": "4.308e-01", "anc_acc": "4.149e-01", "epoch": 0.0218} {"step": 10905, "loss": 1.6895, "grad_norm": "2.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.109e-01", "anc_acc": "4.956e-01", "epoch": 0.02181} {"step": 10910, "loss": 1.7406, "grad_norm": "2.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.050e+00", "anc_loss": "2.080e+00", "dlm_acc": "2.140e-01", "anc_acc": "2.098e-01", "epoch": 0.02182} {"step": 10915, "loss": 1.4066, "grad_norm": "2.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.276e+00", "dlm_acc": "5.667e-01", "anc_acc": "5.512e-01", "epoch": 0.02183} {"step": 10920, "loss": 1.3805, "grad_norm": "2.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.108e+00", "dlm_acc": "6.017e-01", "anc_acc": "5.891e-01", "epoch": 0.02184} {"step": 10925, "loss": 1.3252, "grad_norm": "3.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.734e-01", "anc_loss": "1.023e+00", "dlm_acc": "5.695e-01", "anc_acc": "5.576e-01", "epoch": 0.02185} {"step": 10930, "loss": 1.3083, "grad_norm": "2.815e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.186e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.142e-01", "anc_acc": "5.025e-01", "epoch": 0.02186} {"step": 10935, "loss": 1.0239, "grad_norm": "7.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.187e+00", "dlm_acc": "5.767e-01", "anc_acc": "5.661e-01", "epoch": 0.02187} {"step": 10940, "loss": 1.3729, "grad_norm": "3.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.251e+00", "dlm_acc": "4.839e-01", "anc_acc": "4.746e-01", "epoch": 0.02188} {"step": 10945, "loss": 0.9058, "grad_norm": "2.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.789e-01", "anc_loss": "6.922e-01", "dlm_acc": "5.370e-01", "anc_acc": "5.300e-01", "epoch": 0.02189} {"step": 10950, "loss": 1.0805, "grad_norm": "3.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.023e-01", "anc_loss": "9.203e-01", "dlm_acc": "3.820e-01", "anc_acc": "3.748e-01", "epoch": 0.0219} {"step": 10955, "loss": 1.1915, "grad_norm": "4.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.385e+00", "anc_loss": "1.457e+00", "dlm_acc": "4.896e-01", "anc_acc": "4.779e-01", "epoch": 0.02191} {"step": 10960, "loss": 1.4062, "grad_norm": "3.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.622e+00", "dlm_acc": "4.805e-01", "anc_acc": "4.685e-01", "epoch": 0.02192} {"step": 10965, "loss": 0.9189, "grad_norm": "2.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.676e-01", "anc_loss": "9.301e-01", "dlm_acc": "6.398e-01", "anc_acc": "6.256e-01", "epoch": 0.02193} {"step": 10970, "loss": 0.9712, "grad_norm": "3.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.215e-01", "anc_loss": "6.305e-01", "dlm_acc": "5.329e-01", "anc_acc": "5.304e-01", "epoch": 0.02194} {"step": 10975, "loss": 0.7243, "grad_norm": "1.842e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.969e-01", "anc_loss": "6.059e-01", "dlm_acc": "5.116e-01", "anc_acc": "5.077e-01", "epoch": 0.02195} {"step": 10980, "loss": 0.5276, "grad_norm": "3.643e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.508e-01", "anc_loss": "6.617e-01", "dlm_acc": "5.258e-01", "anc_acc": "5.216e-01", "epoch": 0.02196} {"step": 10985, "loss": 0.7183, "grad_norm": "2.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.600e-01", "anc_acc": "5.445e-01", "epoch": 0.02197} {"step": 10990, "loss": 0.9951, "grad_norm": "5.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.255e-01", "anc_acc": "5.060e-01", "epoch": 0.02198} {"step": 10995, "loss": 1.0755, "grad_norm": "3.820e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.097e+00", "dlm_acc": "5.969e-01", "anc_acc": "5.808e-01", "epoch": 0.02199} {"step": 11000, "loss": 1.0789, "grad_norm": "6.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.394e-01", "anc_acc": "5.261e-01", "epoch": 0.022} {"step": 11005, "loss": 1.1206, "grad_norm": "3.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.570e+00", "dlm_acc": "4.708e-01", "anc_acc": "4.569e-01", "epoch": 0.02201} {"step": 11010, "loss": 1.0475, "grad_norm": "3.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.902e-01", "anc_loss": "9.430e-01", "dlm_acc": "6.623e-01", "anc_acc": "6.517e-01", "epoch": 0.02202} {"step": 11015, "loss": 1.0372, "grad_norm": "3.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.430e-01", "anc_loss": "8.875e-01", "dlm_acc": "5.829e-01", "anc_acc": "5.682e-01", "epoch": 0.02203} {"step": 11020, "loss": 1.4459, "grad_norm": "4.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.445e+00", "anc_loss": "1.510e+00", "dlm_acc": "5.634e-01", "anc_acc": "5.494e-01", "epoch": 0.02204} {"step": 11025, "loss": 0.9984, "grad_norm": "6.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.117e-01", "anc_loss": "9.539e-01", "dlm_acc": "4.540e-01", "anc_acc": "4.473e-01", "epoch": 0.02205} {"step": 11030, "loss": 1.0926, "grad_norm": "3.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.129e+00", "dlm_acc": "5.536e-01", "anc_acc": "5.383e-01", "epoch": 0.02206} {"step": 11035, "loss": 1.0585, "grad_norm": "3.587e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.400e-01", "anc_loss": "9.666e-01", "dlm_acc": "5.070e-01", "anc_acc": "4.996e-01", "epoch": 0.02207} {"step": 11040, "loss": 0.9966, "grad_norm": "4.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.270e-01", "anc_loss": "5.527e-01", "dlm_acc": "7.586e-01", "anc_acc": "7.499e-01", "epoch": 0.02208} {"step": 11045, "loss": 0.9984, "grad_norm": "4.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.244e-01", "anc_loss": "5.595e-01", "dlm_acc": "7.802e-01", "anc_acc": "7.732e-01", "epoch": 0.02209} {"step": 11050, "loss": 0.9905, "grad_norm": "3.109e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.055e-01", "anc_loss": "6.270e-01", "dlm_acc": "5.654e-01", "anc_acc": "5.540e-01", "epoch": 0.0221} {"step": 11055, "loss": 0.8088, "grad_norm": "1.403e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.504e-01", "anc_loss": "5.707e-01", "dlm_acc": "6.077e-01", "anc_acc": "5.958e-01", "epoch": 0.02211} {"step": 11060, "loss": 1.2285, "grad_norm": "3.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.061e+00", "anc_loss": "1.107e+00", "dlm_acc": "6.565e-01", "anc_acc": "6.475e-01", "epoch": 0.02212} {"step": 11065, "loss": 0.857, "grad_norm": "4.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.044e-01", "anc_loss": "6.574e-01", "dlm_acc": "7.342e-01", "anc_acc": "7.200e-01", "epoch": 0.02213} {"step": 11070, "loss": 1.0776, "grad_norm": "5.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.984e-01", "anc_loss": "1.022e+00", "dlm_acc": "4.718e-01", "anc_acc": "4.669e-01", "epoch": 0.02214} {"step": 11075, "loss": 1.1158, "grad_norm": "2.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.503e-01", "anc_acc": "5.341e-01", "epoch": 0.02215} {"step": 11080, "loss": 0.7645, "grad_norm": "2.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.633e-01", "anc_loss": "8.967e-01", "dlm_acc": "5.716e-01", "anc_acc": "5.630e-01", "epoch": 0.02216} {"step": 11085, "loss": 0.4601, "grad_norm": "1.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.304e-01", "anc_loss": "2.429e-01", "dlm_acc": "8.242e-01", "anc_acc": "8.175e-01", "epoch": 0.02217} {"step": 11090, "loss": 0.6347, "grad_norm": "3.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.490e-01", "anc_loss": "3.719e-01", "dlm_acc": "7.963e-01", "anc_acc": "7.853e-01", "epoch": 0.02218} {"step": 11095, "loss": 0.9003, "grad_norm": "2.596e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.978e-01", "anc_loss": "6.333e-01", "dlm_acc": "7.356e-01", "anc_acc": "7.237e-01", "epoch": 0.02219} {"step": 11100, "loss": 0.9117, "grad_norm": "3.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.094e-01", "anc_loss": "8.652e-01", "dlm_acc": "6.907e-01", "anc_acc": "6.781e-01", "epoch": 0.0222} {"step": 11105, "loss": 0.8859, "grad_norm": "2.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.785e-01", "anc_loss": "6.363e-01", "dlm_acc": "6.825e-01", "anc_acc": "6.589e-01", "epoch": 0.02221} {"step": 11110, "loss": 1.4721, "grad_norm": "5.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.591e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.319e-01", "epoch": 0.02222} {"step": 11115, "loss": 1.1232, "grad_norm": "4.759e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.925e+00", "anc_loss": "1.970e+00", "dlm_acc": "3.478e-01", "anc_acc": "3.377e-01", "epoch": 0.02223} {"step": 11120, "loss": 1.3885, "grad_norm": "1.210e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.931e+00", "anc_loss": "1.997e+00", "dlm_acc": "3.288e-01", "anc_acc": "3.193e-01", "epoch": 0.02224} {"step": 11125, "loss": 1.0889, "grad_norm": "2.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.404e-01", "anc_loss": "6.895e-01", "dlm_acc": "7.751e-01", "anc_acc": "7.606e-01", "epoch": 0.02225} {"step": 11130, "loss": 1.5229, "grad_norm": "4.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.124e+00", "dlm_acc": "6.106e-01", "anc_acc": "5.974e-01", "epoch": 0.02226} {"step": 11135, "loss": 1.4227, "grad_norm": "7.666e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.415e+00", "dlm_acc": "5.131e-01", "anc_acc": "4.948e-01", "epoch": 0.02227} {"step": 11140, "loss": 1.6239, "grad_norm": "5.601e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.594e+00", "anc_loss": "2.625e+00", "dlm_acc": "1.059e-01", "anc_acc": "1.012e-01", "epoch": 0.02228} {"step": 11145, "loss": 1.4968, "grad_norm": "4.532e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.271e+00", "anc_loss": "1.365e+00", "dlm_acc": "6.074e-01", "anc_acc": "5.895e-01", "epoch": 0.02229} {"step": 11150, "loss": 1.187, "grad_norm": "3.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.946e-01", "anc_acc": "5.703e-01", "epoch": 0.0223} {"step": 11155, "loss": 0.9443, "grad_norm": "2.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.012e-01", "anc_loss": "8.414e-01", "dlm_acc": "6.372e-01", "anc_acc": "6.229e-01", "epoch": 0.02231} {"step": 11160, "loss": 1.5976, "grad_norm": "1.609e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.610e+00", "anc_loss": "1.665e+00", "dlm_acc": "4.833e-01", "anc_acc": "4.688e-01", "epoch": 0.02232} {"step": 11165, "loss": 1.3507, "grad_norm": "9.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.292e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.658e-01", "anc_acc": "5.489e-01", "epoch": 0.02233} {"step": 11170, "loss": 1.2599, "grad_norm": "4.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.031e+00", "anc_loss": "1.117e+00", "dlm_acc": "6.108e-01", "anc_acc": "5.886e-01", "epoch": 0.02234} {"step": 11175, "loss": 1.4116, "grad_norm": "5.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.362e+00", "dlm_acc": "5.404e-01", "anc_acc": "5.252e-01", "epoch": 0.02235} {"step": 11180, "loss": 1.3034, "grad_norm": "3.650e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.467e+00", "dlm_acc": "4.594e-01", "anc_acc": "4.441e-01", "epoch": 0.02236} {"step": 11185, "loss": 0.9724, "grad_norm": "3.855e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.898e-01", "anc_loss": "1.052e+00", "dlm_acc": "5.944e-01", "anc_acc": "5.802e-01", "epoch": 0.02237} {"step": 11190, "loss": 1.1115, "grad_norm": "4.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.851e-01", "anc_acc": "5.650e-01", "epoch": 0.02238} {"step": 11195, "loss": 1.3027, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.650e+00", "dlm_acc": "5.431e-01", "anc_acc": "5.271e-01", "epoch": 0.02239} {"step": 11200, "loss": 1.3252, "grad_norm": "2.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.348e-01", "anc_loss": "9.820e-01", "dlm_acc": "5.258e-01", "anc_acc": "5.081e-01", "epoch": 0.0224} {"step": 11205, "loss": 1.6595, "grad_norm": "5.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.541e+00", "anc_loss": "1.637e+00", "dlm_acc": "4.714e-01", "anc_acc": "4.490e-01", "epoch": 0.02241} {"step": 11210, "loss": 1.1392, "grad_norm": "3.622e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.092e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.990e-01", "anc_acc": "5.727e-01", "epoch": 0.02242} {"step": 11215, "loss": 1.2375, "grad_norm": "3.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.191e+00", "dlm_acc": "5.713e-01", "anc_acc": "5.563e-01", "epoch": 0.02243} {"step": 11220, "loss": 0.8796, "grad_norm": "2.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.083e+00", "dlm_acc": "6.143e-01", "anc_acc": "5.982e-01", "epoch": 0.02244} {"step": 11225, "loss": 1.1102, "grad_norm": "2.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.562e+00", "anc_loss": "1.658e+00", "dlm_acc": "4.746e-01", "anc_acc": "4.532e-01", "epoch": 0.02245} {"step": 11230, "loss": 1.0699, "grad_norm": "4.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.222e+00", "dlm_acc": "6.129e-01", "anc_acc": "6.014e-01", "epoch": 0.02246} {"step": 11235, "loss": 1.1891, "grad_norm": "2.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.241e+00", "dlm_acc": "5.304e-01", "anc_acc": "5.099e-01", "epoch": 0.02247} {"step": 11240, "loss": 1.9328, "grad_norm": "4.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.659e+00", "anc_loss": "1.733e+00", "dlm_acc": "4.570e-01", "anc_acc": "4.439e-01", "epoch": 0.02248} {"step": 11245, "loss": 1.4117, "grad_norm": "4.071e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.706e+00", "anc_loss": "1.794e+00", "dlm_acc": "4.121e-01", "anc_acc": "3.975e-01", "epoch": 0.02249} {"step": 11250, "loss": 1.2545, "grad_norm": "3.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.233e+00", "dlm_acc": "5.589e-01", "anc_acc": "5.449e-01", "epoch": 0.0225} {"step": 11255, "loss": 1.1349, "grad_norm": "5.408e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.516e-01", "anc_loss": "1.038e+00", "dlm_acc": "6.135e-01", "anc_acc": "5.887e-01", "epoch": 0.02251} {"step": 11260, "loss": 1.4052, "grad_norm": "4.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.145e+00", "dlm_acc": "6.679e-01", "anc_acc": "6.475e-01", "epoch": 0.02252} {"step": 11265, "loss": 1.5658, "grad_norm": "6.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.071e+00", "anc_loss": "1.116e+00", "dlm_acc": "5.883e-01", "anc_acc": "5.793e-01", "epoch": 0.02253} {"step": 11270, "loss": 1.5652, "grad_norm": "2.306e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.290e+00", "dlm_acc": "6.009e-01", "anc_acc": "5.925e-01", "epoch": 0.02254} {"step": 11275, "loss": 1.4217, "grad_norm": "4.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.242e-01", "anc_acc": "4.962e-01", "epoch": 0.02255} {"step": 11280, "loss": 1.1446, "grad_norm": "5.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.744e-01", "anc_acc": "5.577e-01", "epoch": 0.02256} {"step": 11285, "loss": 1.1108, "grad_norm": "2.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.485e+00", "anc_loss": "1.551e+00", "dlm_acc": "4.867e-01", "anc_acc": "4.761e-01", "epoch": 0.02257} {"step": 11290, "loss": 1.2205, "grad_norm": "3.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.536e-01", "anc_loss": "6.771e-01", "dlm_acc": "6.645e-01", "anc_acc": "6.595e-01", "epoch": 0.02258} {"step": 11295, "loss": 1.3119, "grad_norm": "3.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.725e-01", "anc_loss": "7.142e-01", "dlm_acc": "7.168e-01", "anc_acc": "7.112e-01", "epoch": 0.02259} {"step": 11300, "loss": 1.0817, "grad_norm": "2.931e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.517e-01", "anc_loss": "5.873e-01", "dlm_acc": "7.473e-01", "anc_acc": "7.361e-01", "epoch": 0.0226} {"step": 11305, "loss": 1.4367, "grad_norm": "3.361e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.437e+00", "dlm_acc": "4.757e-01", "anc_acc": "4.633e-01", "epoch": 0.02261} {"step": 11310, "loss": 1.3969, "grad_norm": "3.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.567e-01", "anc_loss": "8.941e-01", "dlm_acc": "6.049e-01", "anc_acc": "5.960e-01", "epoch": 0.02262} {"step": 11315, "loss": 1.1271, "grad_norm": "2.237e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.213e-01", "anc_loss": "8.687e-01", "dlm_acc": "7.530e-01", "anc_acc": "7.434e-01", "epoch": 0.02263} {"step": 11320, "loss": 1.0784, "grad_norm": "6.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.277e-01", "anc_loss": "8.852e-01", "dlm_acc": "6.847e-01", "anc_acc": "6.723e-01", "epoch": 0.02264} {"step": 11325, "loss": 1.0287, "grad_norm": "2.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.699e-01", "anc_loss": "7.057e-01", "dlm_acc": "7.382e-01", "anc_acc": "7.272e-01", "epoch": 0.02265} {"step": 11330, "loss": 1.1685, "grad_norm": "3.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.052e+00", "dlm_acc": "6.826e-01", "anc_acc": "6.752e-01", "epoch": 0.02266} {"step": 11335, "loss": 1.5904, "grad_norm": "5.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.330e+00", "dlm_acc": "6.177e-01", "anc_acc": "6.045e-01", "epoch": 0.02267} {"step": 11340, "loss": 1.0107, "grad_norm": "2.472e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.521e-01", "anc_loss": "3.680e-01", "dlm_acc": "7.741e-01", "anc_acc": "7.690e-01", "epoch": 0.02268} {"step": 11345, "loss": 1.1805, "grad_norm": "3.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.317e-01", "anc_loss": "8.629e-01", "dlm_acc": "7.414e-01", "anc_acc": "7.340e-01", "epoch": 0.02269} {"step": 11350, "loss": 1.0069, "grad_norm": "3.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.006e-01", "anc_loss": "2.106e-01", "dlm_acc": "8.832e-01", "anc_acc": "8.799e-01", "epoch": 0.0227} {"step": 11355, "loss": 0.8831, "grad_norm": "3.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.753e-01", "anc_loss": "1.835e-01", "dlm_acc": "8.902e-01", "anc_acc": "8.863e-01", "epoch": 0.02271} {"step": 11360, "loss": 1.0281, "grad_norm": "4.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.635e-01", "anc_loss": "1.705e-01", "dlm_acc": "9.015e-01", "anc_acc": "8.993e-01", "epoch": 0.02272} {"step": 11365, "loss": 1.3276, "grad_norm": "6.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.076e+00", "anc_loss": "1.133e+00", "dlm_acc": "5.469e-01", "anc_acc": "5.349e-01", "epoch": 0.02273} {"step": 11370, "loss": 1.0582, "grad_norm": "4.138e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.488e-01", "anc_loss": "8.020e-01", "dlm_acc": "6.356e-01", "anc_acc": "6.211e-01", "epoch": 0.02274} {"step": 11375, "loss": 1.212, "grad_norm": "4.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.018e-01", "anc_loss": "7.568e-01", "dlm_acc": "7.435e-01", "anc_acc": "7.308e-01", "epoch": 0.02275} {"step": 11380, "loss": 1.3007, "grad_norm": "3.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.162e-01", "anc_acc": "4.998e-01", "epoch": 0.02276} {"step": 11385, "loss": 1.3877, "grad_norm": "2.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.552e+00", "anc_loss": "1.626e+00", "dlm_acc": "5.239e-01", "anc_acc": "5.112e-01", "epoch": 0.02277} {"step": 11390, "loss": 1.4417, "grad_norm": "3.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.488e-01", "anc_loss": "5.672e-01", "dlm_acc": "6.583e-01", "anc_acc": "6.512e-01", "epoch": 0.02278} {"step": 11395, "loss": 1.4029, "grad_norm": "2.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.179e-01", "anc_loss": "4.418e-01", "dlm_acc": "7.596e-01", "anc_acc": "7.510e-01", "epoch": 0.02279} {"step": 11400, "loss": 0.8705, "grad_norm": "5.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.742e-01", "anc_loss": "3.821e-01", "dlm_acc": "7.001e-01", "anc_acc": "6.940e-01", "epoch": 0.0228} {"step": 11405, "loss": 1.0036, "grad_norm": "5.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.367e-01", "anc_loss": "4.559e-01", "dlm_acc": "7.490e-01", "anc_acc": "7.417e-01", "epoch": 0.02281} {"step": 11410, "loss": 1.4312, "grad_norm": "6.322e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.082e-01", "anc_loss": "6.340e-01", "dlm_acc": "6.938e-01", "anc_acc": "6.836e-01", "epoch": 0.02282} {"step": 11415, "loss": 1.6052, "grad_norm": "7.587e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.485e-01", "anc_acc": "5.376e-01", "epoch": 0.02283} {"step": 11420, "loss": 1.4494, "grad_norm": "3.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.969e-01", "anc_loss": "1.033e+00", "dlm_acc": "3.914e-01", "anc_acc": "3.830e-01", "epoch": 0.02284} {"step": 11425, "loss": 1.4751, "grad_norm": "7.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.537e-01", "anc_loss": "1.020e+00", "dlm_acc": "6.822e-01", "anc_acc": "6.685e-01", "epoch": 0.02285} {"step": 11430, "loss": 1.4775, "grad_norm": "4.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.412e+00", "dlm_acc": "5.642e-01", "anc_acc": "5.474e-01", "epoch": 0.02286} {"step": 11435, "loss": 1.1829, "grad_norm": "3.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.426e-01", "anc_loss": "8.965e-01", "dlm_acc": "5.490e-01", "anc_acc": "5.289e-01", "epoch": 0.02287} {"step": 11440, "loss": 1.7566, "grad_norm": "4.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.178e+00", "anc_loss": "1.243e+00", "dlm_acc": "6.161e-01", "anc_acc": "6.029e-01", "epoch": 0.02288} {"step": 11445, "loss": 1.1491, "grad_norm": "3.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.043e+00", "dlm_acc": "4.470e-01", "anc_acc": "4.403e-01", "epoch": 0.02289} {"step": 11450, "loss": 1.4509, "grad_norm": "3.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.088e+00", "dlm_acc": "4.176e-01", "anc_acc": "4.060e-01", "epoch": 0.0229} {"step": 11455, "loss": 1.2388, "grad_norm": "3.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.891e-01", "anc_loss": "1.021e+00", "dlm_acc": "4.290e-01", "anc_acc": "4.186e-01", "epoch": 0.02291} {"step": 11460, "loss": 1.7536, "grad_norm": "3.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.210e+00", "dlm_acc": "4.004e-01", "anc_acc": "3.926e-01", "epoch": 0.02292} {"step": 11465, "loss": 1.1472, "grad_norm": "2.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.793e-01", "anc_loss": "1.016e+00", "dlm_acc": "4.318e-01", "anc_acc": "4.171e-01", "epoch": 0.02293} {"step": 11470, "loss": 1.6659, "grad_norm": "3.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.106e+00", "anc_loss": "1.145e+00", "dlm_acc": "4.291e-01", "anc_acc": "4.163e-01", "epoch": 0.02294} {"step": 11475, "loss": 1.2577, "grad_norm": "1.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.099e+00", "dlm_acc": "4.836e-01", "anc_acc": "4.694e-01", "epoch": 0.02295} {"step": 11480, "loss": 0.9634, "grad_norm": "3.410e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.098e-01", "anc_loss": "5.545e-01", "dlm_acc": "7.739e-01", "anc_acc": "7.623e-01", "epoch": 0.02296} {"step": 11485, "loss": 1.2314, "grad_norm": "3.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.049e+00", "anc_loss": "1.095e+00", "dlm_acc": "6.681e-01", "anc_acc": "6.572e-01", "epoch": 0.02297} {"step": 11490, "loss": 1.0048, "grad_norm": "4.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.129e-01", "anc_loss": "9.770e-01", "dlm_acc": "6.118e-01", "anc_acc": "5.963e-01", "epoch": 0.02298} {"step": 11495, "loss": 1.1332, "grad_norm": "2.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.854e-01", "anc_loss": "8.369e-01", "dlm_acc": "7.425e-01", "anc_acc": "7.326e-01", "epoch": 0.02299} {"step": 11500, "loss": 1.4455, "grad_norm": "5.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.518e+00", "anc_loss": "1.614e+00", "dlm_acc": "5.122e-01", "anc_acc": "5.020e-01", "epoch": 0.023} {"step": 11505, "loss": 1.1814, "grad_norm": "3.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.327e+00", "dlm_acc": "6.092e-01", "anc_acc": "5.935e-01", "epoch": 0.02301} {"step": 11510, "loss": 1.1516, "grad_norm": "4.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.152e-01", "anc_loss": "9.508e-01", "dlm_acc": "6.510e-01", "anc_acc": "6.446e-01", "epoch": 0.02302} {"step": 11515, "loss": 0.8309, "grad_norm": "3.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.765e-01", "anc_loss": "2.924e-01", "dlm_acc": "8.217e-01", "anc_acc": "8.161e-01", "epoch": 0.02303} {"step": 11520, "loss": 1.8063, "grad_norm": "5.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.815e-01", "anc_loss": "9.163e-01", "dlm_acc": "6.619e-01", "anc_acc": "6.540e-01", "epoch": 0.02304} {"step": 11525, "loss": 1.1684, "grad_norm": "3.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.079e+00", "anc_loss": "1.114e+00", "dlm_acc": "6.649e-01", "anc_acc": "6.561e-01", "epoch": 0.02305} {"step": 11530, "loss": 1.3495, "grad_norm": "6.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.081e-01", "anc_loss": "8.554e-01", "dlm_acc": "7.369e-01", "anc_acc": "7.279e-01", "epoch": 0.02306} {"step": 11535, "loss": 1.5122, "grad_norm": "4.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.544e-01", "anc_loss": "1.018e+00", "dlm_acc": "7.194e-01", "anc_acc": "7.049e-01", "epoch": 0.02307} {"step": 11540, "loss": 1.1563, "grad_norm": "2.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.430e-01", "anc_loss": "5.819e-01", "dlm_acc": "7.686e-01", "anc_acc": "7.550e-01", "epoch": 0.02308} {"step": 11545, "loss": 1.7134, "grad_norm": "3.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.611e+00", "anc_loss": "1.689e+00", "dlm_acc": "4.984e-01", "anc_acc": "4.818e-01", "epoch": 0.02309} {"step": 11550, "loss": 1.5367, "grad_norm": "2.587e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.335e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.610e-01", "anc_acc": "5.441e-01", "epoch": 0.0231} {"step": 11555, "loss": 1.2884, "grad_norm": "3.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.439e-01", "epoch": 0.02311} {"step": 11560, "loss": 1.3207, "grad_norm": "7.717e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.264e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.618e-01", "anc_acc": "5.439e-01", "epoch": 0.02312} {"step": 11565, "loss": 1.3962, "grad_norm": "3.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.507e+00", "dlm_acc": "5.335e-01", "anc_acc": "5.192e-01", "epoch": 0.02313} {"step": 11570, "loss": 1.3663, "grad_norm": "3.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.608e+00", "anc_loss": "1.692e+00", "dlm_acc": "4.684e-01", "anc_acc": "4.546e-01", "epoch": 0.02314} {"step": 11575, "loss": 1.8513, "grad_norm": "6.196e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.995e+00", "anc_loss": "2.071e+00", "dlm_acc": "3.539e-01", "anc_acc": "3.416e-01", "epoch": 0.02315} {"step": 11580, "loss": 1.2751, "grad_norm": "2.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.457e+00", "anc_loss": "1.522e+00", "dlm_acc": "4.957e-01", "anc_acc": "4.801e-01", "epoch": 0.02316} {"step": 11585, "loss": 1.2311, "grad_norm": "6.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.197e+00", "anc_loss": "1.276e+00", "dlm_acc": "5.785e-01", "anc_acc": "5.599e-01", "epoch": 0.02317} {"step": 11590, "loss": 1.9974, "grad_norm": "4.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.841e+00", "anc_loss": "1.930e+00", "dlm_acc": "4.536e-01", "anc_acc": "4.379e-01", "epoch": 0.02318} {"step": 11595, "loss": 1.7095, "grad_norm": "2.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.070e-01", "anc_loss": "9.844e-01", "dlm_acc": "6.471e-01", "anc_acc": "6.266e-01", "epoch": 0.02319} {"step": 11600, "loss": 1.5788, "grad_norm": "3.436e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.163e+00", "dlm_acc": "6.241e-01", "anc_acc": "6.068e-01", "epoch": 0.0232} {"step": 11605, "loss": 1.144, "grad_norm": "2.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.489e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.029e-01", "anc_acc": "4.866e-01", "epoch": 0.02321} {"step": 11610, "loss": 1.1564, "grad_norm": "4.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.489e+00", "anc_loss": "1.575e+00", "dlm_acc": "5.453e-01", "anc_acc": "5.287e-01", "epoch": 0.02322} {"step": 11615, "loss": 1.2091, "grad_norm": "3.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.436e+00", "dlm_acc": "5.368e-01", "anc_acc": "5.201e-01", "epoch": 0.02323} {"step": 11620, "loss": 1.208, "grad_norm": "2.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.143e+00", "dlm_acc": "6.375e-01", "anc_acc": "6.251e-01", "epoch": 0.02324} {"step": 11625, "loss": 0.8472, "grad_norm": "4.003e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.749e-01", "anc_loss": "3.927e-01", "dlm_acc": "8.233e-01", "anc_acc": "8.187e-01", "epoch": 0.02325} {"step": 11630, "loss": 1.312, "grad_norm": "3.713e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.369e-01", "anc_loss": "5.737e-01", "dlm_acc": "7.744e-01", "anc_acc": "7.662e-01", "epoch": 0.02326} {"step": 11635, "loss": 1.8619, "grad_norm": "3.640e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.711e-01", "anc_loss": "9.334e-01", "dlm_acc": "6.958e-01", "anc_acc": "6.851e-01", "epoch": 0.02327} {"step": 11640, "loss": 1.7904, "grad_norm": "5.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.789e-01", "anc_loss": "1.036e+00", "dlm_acc": "6.520e-01", "anc_acc": "6.365e-01", "epoch": 0.02328} {"step": 11645, "loss": 1.4955, "grad_norm": "4.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.979e-01", "anc_loss": "8.370e-01", "dlm_acc": "7.052e-01", "anc_acc": "6.957e-01", "epoch": 0.02329} {"step": 11650, "loss": 1.2753, "grad_norm": "2.137e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.932e-01", "anc_loss": "5.111e-01", "dlm_acc": "7.372e-01", "anc_acc": "7.307e-01", "epoch": 0.0233} {"step": 11655, "loss": 1.0589, "grad_norm": "2.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.920e-01", "anc_loss": "3.031e-01", "dlm_acc": "8.203e-01", "anc_acc": "8.146e-01", "epoch": 0.02331} {"step": 11660, "loss": 1.1475, "grad_norm": "2.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.953e-01", "anc_loss": "2.091e-01", "dlm_acc": "8.780e-01", "anc_acc": "8.729e-01", "epoch": 0.02332} {"step": 11665, "loss": 0.8965, "grad_norm": "4.804e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.917e-01", "anc_loss": "2.042e-01", "dlm_acc": "8.810e-01", "anc_acc": "8.749e-01", "epoch": 0.02333} {"step": 11670, "loss": 1.3903, "grad_norm": "7.538e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.385e-01", "anc_loss": "3.561e-01", "dlm_acc": "8.105e-01", "anc_acc": "8.030e-01", "epoch": 0.02334} {"step": 11675, "loss": 1.1469, "grad_norm": "3.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.482e-01", "anc_loss": "9.957e-01", "dlm_acc": "6.856e-01", "anc_acc": "6.749e-01", "epoch": 0.02335} {"step": 11680, "loss": 1.2563, "grad_norm": "2.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.037e+00", "anc_loss": "1.107e+00", "dlm_acc": "6.090e-01", "anc_acc": "5.932e-01", "epoch": 0.02336} {"step": 11685, "loss": 1.2962, "grad_norm": "5.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.052e-01", "anc_acc": "5.915e-01", "epoch": 0.02337} {"step": 11690, "loss": 1.0857, "grad_norm": "6.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.102e-01", "anc_loss": "8.852e-01", "dlm_acc": "6.198e-01", "anc_acc": "6.017e-01", "epoch": 0.02338} {"step": 11695, "loss": 1.0, "grad_norm": "3.997e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.223e-01", "anc_loss": "9.727e-01", "dlm_acc": "6.046e-01", "anc_acc": "5.954e-01", "epoch": 0.02339} {"step": 11700, "loss": 0.8933, "grad_norm": "1.519e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.129e-01", "anc_loss": "9.682e-01", "dlm_acc": "6.462e-01", "anc_acc": "6.336e-01", "epoch": 0.0234} {"step": 11705, "loss": 1.4985, "grad_norm": "5.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.090e-01", "anc_loss": "5.285e-01", "dlm_acc": "6.696e-01", "anc_acc": "6.612e-01", "epoch": 0.02341} {"step": 11710, "loss": 1.1807, "grad_norm": "2.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.938e-01", "anc_acc": "5.804e-01", "epoch": 0.02342} {"step": 11715, "loss": 0.7484, "grad_norm": "3.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.031e-01", "anc_loss": "7.277e-01", "dlm_acc": "6.336e-01", "anc_acc": "6.292e-01", "epoch": 0.02343} {"step": 11720, "loss": 1.476, "grad_norm": "3.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.352e-01", "anc_loss": "4.473e-01", "dlm_acc": "7.378e-01", "anc_acc": "7.360e-01", "epoch": 0.02344} {"step": 11725, "loss": 1.4831, "grad_norm": "5.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.364e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.498e-01", "anc_acc": "5.387e-01", "epoch": 0.02345} {"step": 11730, "loss": 1.3387, "grad_norm": "6.238e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.051e-01", "anc_loss": "9.492e-01", "dlm_acc": "6.281e-01", "anc_acc": "6.153e-01", "epoch": 0.02346} {"step": 11735, "loss": 1.3483, "grad_norm": "7.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.707e-01", "anc_acc": "5.556e-01", "epoch": 0.02347} {"step": 11740, "loss": 0.8722, "grad_norm": "5.283e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.607e-01", "anc_loss": "8.186e-01", "dlm_acc": "7.298e-01", "anc_acc": "7.132e-01", "epoch": 0.02348} {"step": 11745, "loss": 0.9587, "grad_norm": "3.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.076e-01", "anc_loss": "5.406e-01", "dlm_acc": "7.668e-01", "anc_acc": "7.602e-01", "epoch": 0.02349} {"step": 11750, "loss": 1.087, "grad_norm": "3.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.645e-01", "anc_loss": "7.055e-01", "dlm_acc": "7.736e-01", "anc_acc": "7.660e-01", "epoch": 0.0235} {"step": 11755, "loss": 1.0451, "grad_norm": "3.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.412e+00", "dlm_acc": "4.878e-01", "anc_acc": "4.775e-01", "epoch": 0.02351} {"step": 11760, "loss": 0.9167, "grad_norm": "4.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.209e-01", "anc_loss": "7.637e-01", "dlm_acc": "6.749e-01", "anc_acc": "6.639e-01", "epoch": 0.02352} {"step": 11765, "loss": 0.9064, "grad_norm": "3.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.082e-01", "anc_loss": "4.413e-01", "dlm_acc": "8.347e-01", "anc_acc": "8.238e-01", "epoch": 0.02353} {"step": 11770, "loss": 1.0613, "grad_norm": "2.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.643e-01", "anc_loss": "9.221e-01", "dlm_acc": "6.971e-01", "anc_acc": "6.854e-01", "epoch": 0.02354} {"step": 11775, "loss": 1.378, "grad_norm": "5.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.668e-01", "anc_loss": "5.180e-01", "dlm_acc": "8.030e-01", "anc_acc": "7.891e-01", "epoch": 0.02355} {"step": 11780, "loss": 1.3269, "grad_norm": "3.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.834e-01", "anc_loss": "3.967e-01", "dlm_acc": "7.610e-01", "anc_acc": "7.553e-01", "epoch": 0.02356} {"step": 11785, "loss": 0.8317, "grad_norm": "1.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.141e-01", "anc_loss": "5.467e-01", "dlm_acc": "7.558e-01", "anc_acc": "7.502e-01", "epoch": 0.02357} {"step": 11790, "loss": 1.2516, "grad_norm": "2.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.477e-01", "anc_loss": "6.844e-01", "dlm_acc": "7.083e-01", "anc_acc": "7.000e-01", "epoch": 0.02358} {"step": 11795, "loss": 1.0365, "grad_norm": "2.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.211e-01", "anc_loss": "8.718e-01", "dlm_acc": "7.243e-01", "anc_acc": "7.142e-01", "epoch": 0.02359} {"step": 11800, "loss": 1.0544, "grad_norm": "2.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.500e-01", "anc_loss": "6.945e-01", "dlm_acc": "7.068e-01", "anc_acc": "6.961e-01", "epoch": 0.0236} {"step": 11805, "loss": 1.285, "grad_norm": "4.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.582e-01", "anc_acc": "5.463e-01", "epoch": 0.02361} {"step": 11810, "loss": 1.0568, "grad_norm": "4.969e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.080e+00", "dlm_acc": "4.425e-01", "anc_acc": "4.357e-01", "epoch": 0.02362} {"step": 11815, "loss": 0.9736, "grad_norm": "3.437e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.805e-01", "anc_loss": "9.477e-01", "dlm_acc": "6.689e-01", "anc_acc": "6.552e-01", "epoch": 0.02363} {"step": 11820, "loss": 0.9951, "grad_norm": "5.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.063e-01", "anc_loss": "7.609e-01", "dlm_acc": "7.060e-01", "anc_acc": "6.945e-01", "epoch": 0.02364} {"step": 11825, "loss": 0.965, "grad_norm": "5.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.179e+00", "anc_loss": "1.256e+00", "dlm_acc": "5.967e-01", "anc_acc": "5.799e-01", "epoch": 0.02365} {"step": 11830, "loss": 0.776, "grad_norm": "9.481e+00", "learning_rate": "1.000e-04", "dlm_loss": "5.450e-01", "anc_loss": "5.687e-01", "dlm_acc": "7.892e-01", "anc_acc": "7.770e-01", "epoch": 0.02366} {"step": 11835, "loss": 0.9197, "grad_norm": "6.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.753e-01", "anc_loss": "8.247e-01", "dlm_acc": "7.193e-01", "anc_acc": "7.070e-01", "epoch": 0.02367} {"step": 11840, "loss": 1.3862, "grad_norm": "3.478e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.222e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.485e-01", "anc_acc": "5.414e-01", "epoch": 0.02368} {"step": 11845, "loss": 1.1806, "grad_norm": "2.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.241e+00", "dlm_acc": "5.740e-01", "anc_acc": "5.592e-01", "epoch": 0.02369} {"step": 11850, "loss": 0.9716, "grad_norm": "5.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.115e-01", "anc_loss": "5.361e-01", "dlm_acc": "7.669e-01", "anc_acc": "7.614e-01", "epoch": 0.0237} {"step": 11855, "loss": 0.9729, "grad_norm": "2.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.887e-01", "anc_loss": "8.500e-01", "dlm_acc": "6.499e-01", "anc_acc": "6.344e-01", "epoch": 0.02371} {"step": 11860, "loss": 1.2499, "grad_norm": "4.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.637e-01", "anc_loss": "4.896e-01", "dlm_acc": "8.546e-01", "anc_acc": "8.500e-01", "epoch": 0.02372} {"step": 11865, "loss": 1.3054, "grad_norm": "2.326e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.504e-01", "anc_loss": "3.746e-01", "dlm_acc": "8.365e-01", "anc_acc": "8.296e-01", "epoch": 0.02373} {"step": 11870, "loss": 1.2169, "grad_norm": "1.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.478e+00", "dlm_acc": "5.359e-01", "anc_acc": "5.216e-01", "epoch": 0.02374} {"step": 11875, "loss": 0.8815, "grad_norm": "2.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.234e-01", "anc_loss": "9.945e-01", "dlm_acc": "6.470e-01", "anc_acc": "6.293e-01", "epoch": 0.02375} {"step": 11880, "loss": 1.3691, "grad_norm": "4.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.691e+00", "anc_loss": "1.802e+00", "dlm_acc": "4.908e-01", "anc_acc": "4.732e-01", "epoch": 0.02376} {"step": 11885, "loss": 2.138, "grad_norm": "3.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.842e+00", "anc_loss": "1.936e+00", "dlm_acc": "4.767e-01", "anc_acc": "4.609e-01", "epoch": 0.02377} {"step": 11890, "loss": 1.8644, "grad_norm": "6.984e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.743e+00", "anc_loss": "1.833e+00", "dlm_acc": "4.989e-01", "anc_acc": "4.819e-01", "epoch": 0.02378} {"step": 11895, "loss": 1.7629, "grad_norm": "2.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.766e+00", "anc_loss": "1.856e+00", "dlm_acc": "4.752e-01", "anc_acc": "4.591e-01", "epoch": 0.02379} {"step": 11900, "loss": 1.3868, "grad_norm": "5.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.469e+00", "anc_loss": "1.555e+00", "dlm_acc": "5.141e-01", "anc_acc": "4.982e-01", "epoch": 0.0238} {"step": 11905, "loss": 0.8651, "grad_norm": "2.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.305e-01", "anc_loss": "8.930e-01", "dlm_acc": "6.383e-01", "anc_acc": "6.207e-01", "epoch": 0.02381} {"step": 11910, "loss": 1.3581, "grad_norm": "3.432e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.353e+00", "dlm_acc": "5.514e-01", "anc_acc": "5.383e-01", "epoch": 0.02382} {"step": 11915, "loss": 1.4541, "grad_norm": "4.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.525e+00", "anc_loss": "1.614e+00", "dlm_acc": "5.289e-01", "anc_acc": "5.114e-01", "epoch": 0.02383} {"step": 11920, "loss": 1.3391, "grad_norm": "4.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.388e+00", "dlm_acc": "5.838e-01", "anc_acc": "5.668e-01", "epoch": 0.02384} {"step": 11925, "loss": 1.2976, "grad_norm": "4.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.397e+00", "anc_loss": "1.481e+00", "dlm_acc": "5.426e-01", "anc_acc": "5.257e-01", "epoch": 0.02385} {"step": 11930, "loss": 1.1168, "grad_norm": "3.220e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.613e-01", "anc_loss": "1.040e+00", "dlm_acc": "6.415e-01", "anc_acc": "6.228e-01", "epoch": 0.02386} {"step": 11935, "loss": 1.3296, "grad_norm": "3.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.753e-01", "anc_acc": "5.588e-01", "epoch": 0.02387} {"step": 11940, "loss": 1.2279, "grad_norm": "6.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.304e+00", "anc_loss": "1.376e+00", "dlm_acc": "5.386e-01", "anc_acc": "5.231e-01", "epoch": 0.02388} {"step": 11945, "loss": 1.1519, "grad_norm": "2.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.230e-01", "anc_loss": "5.918e-01", "dlm_acc": "7.962e-01", "anc_acc": "7.779e-01", "epoch": 0.02389} {"step": 11950, "loss": 1.3539, "grad_norm": "2.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.514e+00", "anc_loss": "1.602e+00", "dlm_acc": "4.824e-01", "anc_acc": "4.658e-01", "epoch": 0.0239} {"step": 11955, "loss": 1.0635, "grad_norm": "2.370e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.938e-01", "anc_loss": "1.074e+00", "dlm_acc": "6.040e-01", "anc_acc": "5.849e-01", "epoch": 0.02391} {"step": 11960, "loss": 1.4032, "grad_norm": "4.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.353e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.369e-01", "epoch": 0.02392} {"step": 11965, "loss": 1.7728, "grad_norm": "2.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.570e+00", "anc_loss": "1.666e+00", "dlm_acc": "5.355e-01", "anc_acc": "5.154e-01", "epoch": 0.02393} {"step": 11970, "loss": 1.0518, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.102e+00", "dlm_acc": "6.307e-01", "anc_acc": "6.138e-01", "epoch": 0.02394} {"step": 11975, "loss": 1.7901, "grad_norm": "2.077e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.627e+00", "anc_loss": "1.721e+00", "dlm_acc": "4.848e-01", "anc_acc": "4.692e-01", "epoch": 0.02395} {"step": 11980, "loss": 1.3256, "grad_norm": "4.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.255e+00", "anc_loss": "1.336e+00", "dlm_acc": "5.930e-01", "anc_acc": "5.731e-01", "epoch": 0.02396} {"step": 11985, "loss": 1.7463, "grad_norm": "3.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.719e+00", "anc_loss": "1.808e+00", "dlm_acc": "4.837e-01", "anc_acc": "4.674e-01", "epoch": 0.02397} {"step": 11990, "loss": 0.8501, "grad_norm": "2.210e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.111e+00", "dlm_acc": "5.795e-01", "anc_acc": "5.649e-01", "epoch": 0.02398} {"step": 11995, "loss": 1.2189, "grad_norm": "3.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.209e+00", "dlm_acc": "5.705e-01", "anc_acc": "5.537e-01", "epoch": 0.02399} {"step": 12000, "loss": 1.5074, "grad_norm": "8.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.684e+00", "dlm_acc": "5.367e-01", "anc_acc": "5.182e-01", "epoch": 0.024} {"step": 12005, "loss": 1.6701, "grad_norm": "8.926e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.692e+00", "anc_loss": "1.769e+00", "dlm_acc": "4.886e-01", "anc_acc": "4.724e-01", "epoch": 0.02401} {"step": 12010, "loss": 1.409, "grad_norm": "3.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.666e+00", "anc_loss": "1.767e+00", "dlm_acc": "4.857e-01", "anc_acc": "4.699e-01", "epoch": 0.02402} {"step": 12015, "loss": 1.4203, "grad_norm": "4.348e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.872e+00", "anc_loss": "1.975e+00", "dlm_acc": "4.385e-01", "anc_acc": "4.238e-01", "epoch": 0.02403} {"step": 12020, "loss": 1.1364, "grad_norm": "2.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.647e+00", "anc_loss": "1.702e+00", "dlm_acc": "4.232e-01", "anc_acc": "4.116e-01", "epoch": 0.02404} {"step": 12025, "loss": 0.8262, "grad_norm": "2.331e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.422e-01", "anc_loss": "6.813e-01", "dlm_acc": "7.992e-01", "anc_acc": "7.929e-01", "epoch": 0.02405} {"step": 12030, "loss": 1.1254, "grad_norm": "3.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.980e-01", "anc_acc": "5.867e-01", "epoch": 0.02406} {"step": 12035, "loss": 1.2496, "grad_norm": "3.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.324e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.896e-01", "anc_acc": "5.765e-01", "epoch": 0.02407} {"step": 12040, "loss": 1.0797, "grad_norm": "3.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.339e-01", "anc_acc": "5.185e-01", "epoch": 0.02408} {"step": 12045, "loss": 1.0572, "grad_norm": "3.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.313e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.579e-01", "anc_acc": "5.392e-01", "epoch": 0.02409} {"step": 12050, "loss": 0.9672, "grad_norm": "3.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.220e+00", "dlm_acc": "5.611e-01", "anc_acc": "5.450e-01", "epoch": 0.0241} {"step": 12055, "loss": 0.6889, "grad_norm": "1.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.232e+00", "dlm_acc": "5.798e-01", "anc_acc": "5.630e-01", "epoch": 0.02411} {"step": 12060, "loss": 1.1255, "grad_norm": "3.070e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.567e+00", "anc_loss": "1.671e+00", "dlm_acc": "5.249e-01", "anc_acc": "5.060e-01", "epoch": 0.02412} {"step": 12065, "loss": 1.4582, "grad_norm": "4.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.785e+00", "dlm_acc": "4.692e-01", "anc_acc": "4.544e-01", "epoch": 0.02413} {"step": 12070, "loss": 1.0142, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.276e+00", "dlm_acc": "4.879e-01", "anc_acc": "4.741e-01", "epoch": 0.02414} {"step": 12075, "loss": 1.321, "grad_norm": "2.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.827e+00", "anc_loss": "1.893e+00", "dlm_acc": "3.846e-01", "anc_acc": "3.734e-01", "epoch": 0.02415} {"step": 12080, "loss": 1.0488, "grad_norm": "3.774e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.041e+00", "anc_loss": "1.102e+00", "dlm_acc": "5.444e-01", "anc_acc": "5.274e-01", "epoch": 0.02416} {"step": 12085, "loss": 0.944, "grad_norm": "2.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.816e-01", "anc_loss": "9.395e-01", "dlm_acc": "6.170e-01", "anc_acc": "6.033e-01", "epoch": 0.02417} {"step": 12090, "loss": 1.3983, "grad_norm": "2.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.292e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.250e-01", "anc_acc": "5.158e-01", "epoch": 0.02418} {"step": 12095, "loss": 0.8936, "grad_norm": "3.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.133e-01", "anc_loss": "8.648e-01", "dlm_acc": "5.668e-01", "anc_acc": "5.527e-01", "epoch": 0.02419} {"step": 12100, "loss": 0.839, "grad_norm": "7.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.602e-01", "anc_loss": "1.023e+00", "dlm_acc": "5.928e-01", "anc_acc": "5.794e-01", "epoch": 0.0242} {"step": 12105, "loss": 0.8896, "grad_norm": "6.485e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.252e+00", "dlm_acc": "4.500e-01", "anc_acc": "4.384e-01", "epoch": 0.02421} {"step": 12110, "loss": 1.0038, "grad_norm": "3.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.060e+00", "dlm_acc": "5.250e-01", "anc_acc": "5.132e-01", "epoch": 0.02422} {"step": 12115, "loss": 1.0171, "grad_norm": "3.762e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.438e-01", "anc_loss": "8.855e-01", "dlm_acc": "5.514e-01", "anc_acc": "5.367e-01", "epoch": 0.02423} {"step": 12120, "loss": 1.0449, "grad_norm": "4.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.235e+00", "dlm_acc": "5.316e-01", "anc_acc": "5.196e-01", "epoch": 0.02424} {"step": 12125, "loss": 0.9837, "grad_norm": "3.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.789e-01", "anc_loss": "9.289e-01", "dlm_acc": "6.050e-01", "anc_acc": "5.942e-01", "epoch": 0.02425} {"step": 12130, "loss": 1.2982, "grad_norm": "3.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.734e-01", "anc_loss": "7.273e-01", "dlm_acc": "6.856e-01", "anc_acc": "6.738e-01", "epoch": 0.02426} {"step": 12135, "loss": 1.5835, "grad_norm": "3.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.243e+00", "dlm_acc": "5.073e-01", "anc_acc": "4.991e-01", "epoch": 0.02427} {"step": 12140, "loss": 1.0754, "grad_norm": "3.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.262e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.394e-01", "epoch": 0.02428} {"step": 12145, "loss": 1.5435, "grad_norm": "6.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.664e+00", "anc_loss": "1.747e+00", "dlm_acc": "5.191e-01", "anc_acc": "5.045e-01", "epoch": 0.02429} {"step": 12150, "loss": 1.0598, "grad_norm": "2.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.187e-01", "anc_loss": "9.602e-01", "dlm_acc": "5.678e-01", "anc_acc": "5.563e-01", "epoch": 0.0243} {"step": 12155, "loss": 1.0755, "grad_norm": "8.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.473e-01", "anc_loss": "6.609e-01", "dlm_acc": "5.678e-01", "anc_acc": "5.578e-01", "epoch": 0.02431} {"step": 12160, "loss": 1.2278, "grad_norm": "2.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.297e-01", "anc_loss": "6.426e-01", "dlm_acc": "5.751e-01", "anc_acc": "5.684e-01", "epoch": 0.02432} {"step": 12165, "loss": 1.5622, "grad_norm": "3.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.516e-01", "anc_loss": "7.633e-01", "dlm_acc": "5.348e-01", "anc_acc": "5.288e-01", "epoch": 0.02433} {"step": 12170, "loss": 0.877, "grad_norm": "3.602e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.363e-01", "anc_loss": "4.504e-01", "dlm_acc": "6.695e-01", "anc_acc": "6.586e-01", "epoch": 0.02434} {"step": 12175, "loss": 1.1987, "grad_norm": "3.907e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.125e+00", "dlm_acc": "5.364e-01", "anc_acc": "5.263e-01", "epoch": 0.02435} {"step": 12180, "loss": 1.8198, "grad_norm": "3.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.259e-01", "anc_acc": "5.101e-01", "epoch": 0.02436} {"step": 12185, "loss": 1.0706, "grad_norm": "4.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.126e+00", "dlm_acc": "5.981e-01", "anc_acc": "5.822e-01", "epoch": 0.02437} {"step": 12190, "loss": 1.1052, "grad_norm": "1.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.047e-01", "anc_loss": "8.316e-01", "dlm_acc": "5.292e-01", "anc_acc": "5.172e-01", "epoch": 0.02438} {"step": 12195, "loss": 1.1897, "grad_norm": "4.955e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.445e-01", "anc_loss": "5.676e-01", "dlm_acc": "6.036e-01", "anc_acc": "5.906e-01", "epoch": 0.02439} {"step": 12200, "loss": 1.1498, "grad_norm": "4.537e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.347e-01", "anc_loss": "6.820e-01", "dlm_acc": "6.985e-01", "anc_acc": "6.836e-01", "epoch": 0.0244} {"step": 12205, "loss": 1.1787, "grad_norm": "2.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.986e-01", "anc_loss": "1.082e+00", "dlm_acc": "6.519e-01", "anc_acc": "6.341e-01", "epoch": 0.02441} {"step": 12210, "loss": 0.8551, "grad_norm": "1.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.341e-01", "anc_loss": "5.909e-01", "dlm_acc": "8.163e-01", "anc_acc": "7.992e-01", "epoch": 0.02442} {"step": 12215, "loss": 1.1313, "grad_norm": "2.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.418e-01", "anc_acc": "5.289e-01", "epoch": 0.02443} {"step": 12220, "loss": 0.9238, "grad_norm": "2.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.591e-01", "anc_loss": "5.993e-01", "dlm_acc": "8.071e-01", "anc_acc": "7.962e-01", "epoch": 0.02444} {"step": 12225, "loss": 1.0333, "grad_norm": "3.685e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e-01", "anc_loss": "1.902e-01", "dlm_acc": "9.343e-01", "anc_acc": "9.240e-01", "epoch": 0.02445} {"step": 12230, "loss": 0.9594, "grad_norm": "2.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.793e-01", "anc_loss": "5.168e-01", "dlm_acc": "8.114e-01", "anc_acc": "7.963e-01", "epoch": 0.02446} {"step": 12235, "loss": 1.0262, "grad_norm": "3.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.033e-01", "anc_loss": "6.422e-01", "dlm_acc": "7.186e-01", "anc_acc": "6.997e-01", "epoch": 0.02447} {"step": 12240, "loss": 1.2325, "grad_norm": "3.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.310e+00", "dlm_acc": "5.238e-01", "anc_acc": "5.087e-01", "epoch": 0.02448} {"step": 12245, "loss": 0.7763, "grad_norm": "3.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.688e-01", "anc_loss": "9.234e-01", "dlm_acc": "6.422e-01", "anc_acc": "6.289e-01", "epoch": 0.02449} {"step": 12250, "loss": 1.2615, "grad_norm": "3.869e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.652e-01", "anc_loss": "1.029e+00", "dlm_acc": "6.688e-01", "anc_acc": "6.549e-01", "epoch": 0.0245} {"step": 12255, "loss": 1.4314, "grad_norm": "4.909e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.140e-01", "epoch": 0.02451} {"step": 12260, "loss": 1.4987, "grad_norm": "3.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.468e+00", "dlm_acc": "5.334e-01", "anc_acc": "5.219e-01", "epoch": 0.02452} {"step": 12265, "loss": 1.2378, "grad_norm": "3.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.116e+00", "dlm_acc": "5.308e-01", "anc_acc": "5.158e-01", "epoch": 0.02453} {"step": 12270, "loss": 1.3625, "grad_norm": "2.832e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.188e-01", "anc_loss": "7.523e-01", "dlm_acc": "6.040e-01", "anc_acc": "5.936e-01", "epoch": 0.02454} {"step": 12275, "loss": 0.8484, "grad_norm": "2.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.160e-01", "anc_loss": "6.656e-01", "dlm_acc": "6.720e-01", "anc_acc": "6.583e-01", "epoch": 0.02455} {"step": 12280, "loss": 1.3041, "grad_norm": "4.662e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.141e+00", "dlm_acc": "5.877e-01", "anc_acc": "5.710e-01", "epoch": 0.02456} {"step": 12285, "loss": 1.5953, "grad_norm": "2.785e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.522e+00", "anc_loss": "1.603e+00", "dlm_acc": "5.171e-01", "anc_acc": "5.020e-01", "epoch": 0.02457} {"step": 12290, "loss": 1.143, "grad_norm": "2.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.875e-01", "anc_loss": "8.367e-01", "dlm_acc": "6.660e-01", "anc_acc": "6.475e-01", "epoch": 0.02458} {"step": 12295, "loss": 1.3915, "grad_norm": "5.418e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.325e+00", "anc_loss": "1.393e+00", "dlm_acc": "5.627e-01", "anc_acc": "5.493e-01", "epoch": 0.02459} {"step": 12300, "loss": 1.0549, "grad_norm": "3.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.750e-01", "anc_loss": "8.328e-01", "dlm_acc": "6.794e-01", "anc_acc": "6.663e-01", "epoch": 0.0246} {"step": 12305, "loss": 1.0891, "grad_norm": "3.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.879e-01", "anc_loss": "1.045e+00", "dlm_acc": "6.184e-01", "anc_acc": "6.070e-01", "epoch": 0.02461} {"step": 12310, "loss": 1.2524, "grad_norm": "2.229e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.387e+00", "dlm_acc": "4.875e-01", "anc_acc": "4.765e-01", "epoch": 0.02462} {"step": 12315, "loss": 1.3227, "grad_norm": "1.806e+00", "learning_rate": "1.000e-04", "dlm_loss": "4.285e-01", "anc_loss": "4.514e-01", "dlm_acc": "7.285e-01", "anc_acc": "7.194e-01", "epoch": 0.02463} {"step": 12320, "loss": 1.1748, "grad_norm": "2.538e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.680e-01", "anc_loss": "4.887e-01", "dlm_acc": "6.771e-01", "anc_acc": "6.627e-01", "epoch": 0.02464} {"step": 12325, "loss": 1.2837, "grad_norm": "3.732e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.053e+00", "dlm_acc": "3.446e-01", "anc_acc": "3.382e-01", "epoch": 0.02465} {"step": 12330, "loss": 1.1244, "grad_norm": "3.271e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.469e-01", "anc_loss": "5.682e-01", "dlm_acc": "6.301e-01", "anc_acc": "6.237e-01", "epoch": 0.02466} {"step": 12335, "loss": 1.3109, "grad_norm": "5.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.378e-01", "anc_acc": "5.255e-01", "epoch": 0.02467} {"step": 12340, "loss": 0.9017, "grad_norm": "2.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.142e+00", "dlm_acc": "5.935e-01", "anc_acc": "5.756e-01", "epoch": 0.02468} {"step": 12345, "loss": 1.4266, "grad_norm": "4.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.520e+00", "anc_loss": "1.594e+00", "dlm_acc": "5.267e-01", "anc_acc": "5.107e-01", "epoch": 0.02469} {"step": 12350, "loss": 1.3362, "grad_norm": "3.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.235e+00", "anc_loss": "1.300e+00", "dlm_acc": "5.606e-01", "anc_acc": "5.488e-01", "epoch": 0.0247} {"step": 12355, "loss": 1.0321, "grad_norm": "4.290e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.457e-01", "anc_loss": "1.005e+00", "dlm_acc": "6.635e-01", "anc_acc": "6.485e-01", "epoch": 0.02471} {"step": 12360, "loss": 1.2807, "grad_norm": "2.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "9.742e-01", "dlm_acc": "6.025e-01", "anc_acc": "5.910e-01", "epoch": 0.02472} {"step": 12365, "loss": 1.2841, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.268e+00", "dlm_acc": "6.025e-01", "anc_acc": "5.877e-01", "epoch": 0.02473} {"step": 12370, "loss": 1.1695, "grad_norm": "3.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.285e-01", "anc_loss": "7.609e-01", "dlm_acc": "6.175e-01", "anc_acc": "6.062e-01", "epoch": 0.02474} {"step": 12375, "loss": 0.7712, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.859e-01", "anc_loss": "1.062e+00", "dlm_acc": "5.633e-01", "anc_acc": "5.476e-01", "epoch": 0.02475} {"step": 12380, "loss": 1.1948, "grad_norm": "4.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.869e-01", "anc_loss": "8.260e-01", "dlm_acc": "7.135e-01", "anc_acc": "7.025e-01", "epoch": 0.02476} {"step": 12385, "loss": 1.2678, "grad_norm": "3.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.250e+00", "anc_loss": "1.338e+00", "dlm_acc": "5.717e-01", "anc_acc": "5.525e-01", "epoch": 0.02477} {"step": 12390, "loss": 1.4228, "grad_norm": "3.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.556e+00", "anc_loss": "1.655e+00", "dlm_acc": "5.125e-01", "anc_acc": "4.941e-01", "epoch": 0.02478} {"step": 12395, "loss": 1.0248, "grad_norm": "2.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.283e-01", "anc_acc": "5.129e-01", "epoch": 0.02479} {"step": 12400, "loss": 0.9085, "grad_norm": "2.632e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.695e-01", "anc_loss": "1.030e+00", "dlm_acc": "5.668e-01", "anc_acc": "5.515e-01", "epoch": 0.0248} {"step": 12405, "loss": 0.881, "grad_norm": "1.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.054e+00", "anc_loss": "1.116e+00", "dlm_acc": "6.024e-01", "anc_acc": "5.864e-01", "epoch": 0.02481} {"step": 12410, "loss": 0.7745, "grad_norm": "3.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.781e-01", "anc_loss": "7.234e-01", "dlm_acc": "6.484e-01", "anc_acc": "6.335e-01", "epoch": 0.02482} {"step": 12415, "loss": 0.729, "grad_norm": "2.532e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.840e-01", "anc_loss": "8.273e-01", "dlm_acc": "6.217e-01", "anc_acc": "6.094e-01", "epoch": 0.02483} {"step": 12420, "loss": 0.865, "grad_norm": "2.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.112e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.254e-01", "anc_acc": "5.154e-01", "epoch": 0.02484} {"step": 12425, "loss": 1.5674, "grad_norm": "3.617e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.798e+00", "anc_loss": "1.902e+00", "dlm_acc": "4.779e-01", "anc_acc": "4.574e-01", "epoch": 0.02485} {"step": 12430, "loss": 0.9447, "grad_norm": "2.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.812e-01", "anc_loss": "1.023e+00", "dlm_acc": "5.429e-01", "anc_acc": "5.329e-01", "epoch": 0.02486} {"step": 12435, "loss": 1.1542, "grad_norm": "3.125e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.070e-01", "anc_loss": "9.570e-01", "dlm_acc": "6.109e-01", "anc_acc": "5.965e-01", "epoch": 0.02487} {"step": 12440, "loss": 1.0096, "grad_norm": "2.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.696e-01", "anc_loss": "8.162e-01", "dlm_acc": "6.987e-01", "anc_acc": "6.860e-01", "epoch": 0.02488} {"step": 12445, "loss": 1.0088, "grad_norm": "3.771e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.156e-01", "anc_loss": "7.691e-01", "dlm_acc": "6.691e-01", "anc_acc": "6.535e-01", "epoch": 0.02489} {"step": 12450, "loss": 1.6179, "grad_norm": "9.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.435e+00", "anc_loss": "1.500e+00", "dlm_acc": "5.208e-01", "anc_acc": "5.076e-01", "epoch": 0.0249} {"step": 12455, "loss": 1.2809, "grad_norm": "3.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.391e+00", "dlm_acc": "4.427e-01", "anc_acc": "4.281e-01", "epoch": 0.02491} {"step": 12460, "loss": 1.6887, "grad_norm": "4.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.149e+00", "dlm_acc": "6.064e-01", "anc_acc": "5.823e-01", "epoch": 0.02492} {"step": 12465, "loss": 1.2978, "grad_norm": "4.666e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.473e+00", "dlm_acc": "4.906e-01", "anc_acc": "4.728e-01", "epoch": 0.02493} {"step": 12470, "loss": 1.5231, "grad_norm": "2.381e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.622e+00", "anc_loss": "1.688e+00", "dlm_acc": "4.816e-01", "anc_acc": "4.680e-01", "epoch": 0.02494} {"step": 12475, "loss": 1.0089, "grad_norm": "3.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.267e-01", "anc_acc": "5.003e-01", "epoch": 0.02495} {"step": 12480, "loss": 1.5311, "grad_norm": "3.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.294e-01", "anc_acc": "5.078e-01", "epoch": 0.02496} {"step": 12485, "loss": 1.3591, "grad_norm": "4.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.428e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.372e-01", "anc_acc": "5.208e-01", "epoch": 0.02497} {"step": 12490, "loss": 1.3176, "grad_norm": "5.525e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.637e+00", "dlm_acc": "5.291e-01", "anc_acc": "5.122e-01", "epoch": 0.02498} {"step": 12495, "loss": 1.126, "grad_norm": "3.752e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.116e+00", "dlm_acc": "5.649e-01", "anc_acc": "5.356e-01", "epoch": 0.02499} {"step": 12500, "loss": 1.4432, "grad_norm": "4.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.379e+00", "dlm_acc": "4.946e-01", "anc_acc": "4.722e-01", "epoch": 0.025} {"step": 12505, "loss": 1.0489, "grad_norm": "3.622e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.150e+00", "dlm_acc": "5.796e-01", "anc_acc": "5.461e-01", "epoch": 0.02501} {"step": 12510, "loss": 1.4088, "grad_norm": "3.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.470e+00", "dlm_acc": "4.970e-01", "anc_acc": "4.779e-01", "epoch": 0.02502} {"step": 12515, "loss": 1.5201, "grad_norm": "3.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.602e+00", "anc_loss": "1.694e+00", "dlm_acc": "4.403e-01", "anc_acc": "4.255e-01", "epoch": 0.02503} {"step": 12520, "loss": 1.7265, "grad_norm": "3.914e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.670e+00", "dlm_acc": "4.945e-01", "anc_acc": "4.678e-01", "epoch": 0.02504} {"step": 12525, "loss": 0.9234, "grad_norm": "3.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.273e+00", "dlm_acc": "5.495e-01", "anc_acc": "5.297e-01", "epoch": 0.02505} {"step": 12530, "loss": 0.7619, "grad_norm": "2.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.602e-01", "anc_loss": "1.008e+00", "dlm_acc": "5.715e-01", "anc_acc": "5.588e-01", "epoch": 0.02506} {"step": 12535, "loss": 1.3821, "grad_norm": "4.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.501e+00", "anc_loss": "1.587e+00", "dlm_acc": "5.249e-01", "anc_acc": "5.066e-01", "epoch": 0.02507} {"step": 12540, "loss": 1.2933, "grad_norm": "1.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.521e+00", "anc_loss": "1.602e+00", "dlm_acc": "4.950e-01", "anc_acc": "4.773e-01", "epoch": 0.02508} {"step": 12545, "loss": 1.2346, "grad_norm": "3.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e+00", "anc_loss": "1.700e+00", "dlm_acc": "4.461e-01", "anc_acc": "4.291e-01", "epoch": 0.02509} {"step": 12550, "loss": 1.1621, "grad_norm": "9.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.245e+00", "dlm_acc": "5.583e-01", "anc_acc": "5.414e-01", "epoch": 0.0251} {"step": 12555, "loss": 1.4589, "grad_norm": "3.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.691e+00", "anc_loss": "1.778e+00", "dlm_acc": "4.383e-01", "anc_acc": "4.223e-01", "epoch": 0.02511} {"step": 12560, "loss": 1.3503, "grad_norm": "2.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.535e-01", "anc_loss": "8.219e-01", "dlm_acc": "7.059e-01", "anc_acc": "6.894e-01", "epoch": 0.02512} {"step": 12565, "loss": 1.4162, "grad_norm": "3.667e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.880e+00", "anc_loss": "1.962e+00", "dlm_acc": "4.034e-01", "anc_acc": "3.887e-01", "epoch": 0.02513} {"step": 12570, "loss": 1.2342, "grad_norm": "3.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.078e+00", "anc_loss": "1.142e+00", "dlm_acc": "5.601e-01", "anc_acc": "5.456e-01", "epoch": 0.02514} {"step": 12575, "loss": 1.434, "grad_norm": "3.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.317e+00", "dlm_acc": "5.585e-01", "anc_acc": "5.401e-01", "epoch": 0.02515} {"step": 12580, "loss": 1.577, "grad_norm": "2.411e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.388e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.013e-01", "anc_acc": "4.850e-01", "epoch": 0.02516} {"step": 12585, "loss": 1.1894, "grad_norm": "3.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.200e+00", "dlm_acc": "5.625e-01", "anc_acc": "5.459e-01", "epoch": 0.02517} {"step": 12590, "loss": 1.117, "grad_norm": "4.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.324e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.702e-01", "anc_acc": "5.563e-01", "epoch": 0.02518} {"step": 12595, "loss": 0.9187, "grad_norm": "8.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.580e+00", "dlm_acc": "4.459e-01", "anc_acc": "4.301e-01", "epoch": 0.02519} {"step": 12600, "loss": 0.9828, "grad_norm": "5.332e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.511e+00", "anc_loss": "1.589e+00", "dlm_acc": "5.051e-01", "anc_acc": "4.900e-01", "epoch": 0.0252} {"step": 12605, "loss": 0.884, "grad_norm": "2.124e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.478e+00", "anc_loss": "1.519e+00", "dlm_acc": "4.859e-01", "anc_acc": "4.751e-01", "epoch": 0.02521} {"step": 12610, "loss": 0.959, "grad_norm": "2.563e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.197e-01", "anc_acc": "5.037e-01", "epoch": 0.02522} {"step": 12615, "loss": 1.2724, "grad_norm": "3.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.516e+00", "anc_loss": "1.598e+00", "dlm_acc": "5.289e-01", "anc_acc": "5.134e-01", "epoch": 0.02523} {"step": 12620, "loss": 1.2059, "grad_norm": "4.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.408e+00", "dlm_acc": "4.450e-01", "anc_acc": "4.330e-01", "epoch": 0.02524} {"step": 12625, "loss": 1.8243, "grad_norm": "4.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.850e+00", "anc_loss": "1.952e+00", "dlm_acc": "4.762e-01", "anc_acc": "4.603e-01", "epoch": 0.02525} {"step": 12630, "loss": 1.4413, "grad_norm": "7.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.589e+00", "anc_loss": "1.684e+00", "dlm_acc": "4.925e-01", "anc_acc": "4.752e-01", "epoch": 0.02526} {"step": 12635, "loss": 0.9788, "grad_norm": "3.952e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.404e+00", "dlm_acc": "5.554e-01", "anc_acc": "5.384e-01", "epoch": 0.02527} {"step": 12640, "loss": 1.0578, "grad_norm": "3.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.459e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.401e-01", "anc_acc": "5.233e-01", "epoch": 0.02528} {"step": 12645, "loss": 1.1872, "grad_norm": "2.312e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.367e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.088e-01", "anc_acc": "4.970e-01", "epoch": 0.02529} {"step": 12650, "loss": 0.9421, "grad_norm": "4.440e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.317e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.294e-01", "epoch": 0.0253} {"step": 12655, "loss": 1.1557, "grad_norm": "3.773e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.744e+00", "anc_loss": "1.842e+00", "dlm_acc": "4.604e-01", "anc_acc": "4.436e-01", "epoch": 0.02531} {"step": 12660, "loss": 0.9826, "grad_norm": "3.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.260e+00", "dlm_acc": "5.646e-01", "anc_acc": "5.481e-01", "epoch": 0.02532} {"step": 12665, "loss": 0.8126, "grad_norm": "6.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.317e+00", "anc_loss": "1.370e+00", "dlm_acc": "4.883e-01", "anc_acc": "4.804e-01", "epoch": 0.02533} {"step": 12670, "loss": 0.8343, "grad_norm": "6.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.399e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.321e-01", "anc_acc": "5.148e-01", "epoch": 0.02534} {"step": 12675, "loss": 0.9711, "grad_norm": "1.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.219e+00", "dlm_acc": "5.481e-01", "anc_acc": "5.314e-01", "epoch": 0.02535} {"step": 12680, "loss": 1.2655, "grad_norm": "5.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.665e+00", "anc_loss": "1.752e+00", "dlm_acc": "4.959e-01", "anc_acc": "4.802e-01", "epoch": 0.02536} {"step": 12685, "loss": 1.1663, "grad_norm": "2.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.940e-01", "anc_acc": "5.807e-01", "epoch": 0.02537} {"step": 12690, "loss": 1.0949, "grad_norm": "4.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.608e+00", "anc_loss": "1.694e+00", "dlm_acc": "4.947e-01", "anc_acc": "4.806e-01", "epoch": 0.02538} {"step": 12695, "loss": 1.3545, "grad_norm": "3.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.437e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.352e-01", "anc_acc": "5.159e-01", "epoch": 0.02539} {"step": 12700, "loss": 1.0184, "grad_norm": "4.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.624e-01", "anc_acc": "5.422e-01", "epoch": 0.0254} {"step": 12705, "loss": 1.1463, "grad_norm": "3.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.484e-01", "anc_acc": "5.290e-01", "epoch": 0.02541} {"step": 12710, "loss": 1.1156, "grad_norm": "3.961e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.619e+00", "anc_loss": "1.683e+00", "dlm_acc": "4.282e-01", "anc_acc": "4.134e-01", "epoch": 0.02542} {"step": 12715, "loss": 1.2075, "grad_norm": "2.583e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.448e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.133e-01", "anc_acc": "4.961e-01", "epoch": 0.02543} {"step": 12720, "loss": 0.9571, "grad_norm": "3.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.656e-01", "anc_loss": "1.048e+00", "dlm_acc": "6.261e-01", "anc_acc": "6.071e-01", "epoch": 0.02544} {"step": 12725, "loss": 1.0933, "grad_norm": "2.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.374e-01", "anc_loss": "9.043e-01", "dlm_acc": "6.867e-01", "anc_acc": "6.679e-01", "epoch": 0.02545} {"step": 12730, "loss": 1.4746, "grad_norm": "5.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.733e+00", "anc_loss": "1.834e+00", "dlm_acc": "4.814e-01", "anc_acc": "4.630e-01", "epoch": 0.02546} {"step": 12735, "loss": 1.2809, "grad_norm": "3.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.509e+00", "dlm_acc": "5.313e-01", "anc_acc": "5.144e-01", "epoch": 0.02547} {"step": 12740, "loss": 1.3232, "grad_norm": "3.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.668e+00", "anc_loss": "1.752e+00", "dlm_acc": "5.090e-01", "anc_acc": "4.930e-01", "epoch": 0.02548} {"step": 12745, "loss": 1.1947, "grad_norm": "2.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.504e+00", "dlm_acc": "5.197e-01", "anc_acc": "4.997e-01", "epoch": 0.02549} {"step": 12750, "loss": 1.4894, "grad_norm": "3.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.580e+00", "dlm_acc": "5.246e-01", "anc_acc": "5.102e-01", "epoch": 0.0255} {"step": 12755, "loss": 0.6772, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.838e-01", "anc_loss": "2.991e-01", "dlm_acc": "9.061e-01", "anc_acc": "9.014e-01", "epoch": 0.02551} {"step": 12760, "loss": 1.0118, "grad_norm": "3.092e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.042e-01", "anc_loss": "9.728e-01", "dlm_acc": "6.728e-01", "anc_acc": "6.554e-01", "epoch": 0.02552} {"step": 12765, "loss": 1.5096, "grad_norm": "6.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.189e+00", "dlm_acc": "5.836e-01", "anc_acc": "5.676e-01", "epoch": 0.02553} {"step": 12770, "loss": 1.2924, "grad_norm": "3.256e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.387e-01", "anc_loss": "5.570e-01", "dlm_acc": "6.341e-01", "anc_acc": "6.207e-01", "epoch": 0.02554} {"step": 12775, "loss": 0.9608, "grad_norm": "3.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.445e-01", "anc_loss": "4.582e-01", "dlm_acc": "6.591e-01", "anc_acc": "6.496e-01", "epoch": 0.02555} {"step": 12780, "loss": 1.4664, "grad_norm": "2.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.184e-01", "anc_loss": "6.367e-01", "dlm_acc": "6.051e-01", "anc_acc": "5.980e-01", "epoch": 0.02556} {"step": 12785, "loss": 1.2224, "grad_norm": "4.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.982e-01", "anc_loss": "4.116e-01", "dlm_acc": "7.342e-01", "anc_acc": "7.261e-01", "epoch": 0.02557} {"step": 12790, "loss": 1.0039, "grad_norm": "4.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.197e-01", "anc_loss": "7.635e-01", "dlm_acc": "7.412e-01", "anc_acc": "7.302e-01", "epoch": 0.02558} {"step": 12795, "loss": 1.3198, "grad_norm": "5.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.007e+00", "anc_loss": "1.068e+00", "dlm_acc": "6.520e-01", "anc_acc": "6.399e-01", "epoch": 0.02559} {"step": 12800, "loss": 1.7365, "grad_norm": "2.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.172e+00", "anc_loss": "1.247e+00", "dlm_acc": "5.922e-01", "anc_acc": "5.774e-01", "epoch": 0.0256} {"step": 12805, "loss": 1.4754, "grad_norm": "2.912e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.839e-01", "anc_acc": "5.667e-01", "epoch": 0.02561} {"step": 12810, "loss": 0.8454, "grad_norm": "4.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.989e-02", "anc_loss": "2.333e-02", "dlm_acc": "9.886e-01", "anc_acc": "9.874e-01", "epoch": 0.02562} {"step": 12815, "loss": 1.1165, "grad_norm": "2.061e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.108e-02", "anc_loss": "8.977e-02", "dlm_acc": "9.658e-01", "anc_acc": "9.642e-01", "epoch": 0.02563} {"step": 12820, "loss": 1.1606, "grad_norm": "3.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.044e-01", "anc_loss": "7.458e-01", "dlm_acc": "7.209e-01", "anc_acc": "7.115e-01", "epoch": 0.02564} {"step": 12825, "loss": 1.0547, "grad_norm": "3.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.404e-01", "anc_loss": "7.918e-01", "dlm_acc": "6.736e-01", "anc_acc": "6.569e-01", "epoch": 0.02565} {"step": 12830, "loss": 1.0603, "grad_norm": "2.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.887e-01", "anc_loss": "4.133e-01", "dlm_acc": "7.689e-01", "anc_acc": "7.559e-01", "epoch": 0.02566} {"step": 12835, "loss": 0.899, "grad_norm": "3.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.232e-01", "anc_loss": "5.566e-01", "dlm_acc": "7.452e-01", "anc_acc": "7.314e-01", "epoch": 0.02567} {"step": 12840, "loss": 1.1301, "grad_norm": "2.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.817e-01", "anc_loss": "3.107e-01", "dlm_acc": "8.534e-01", "anc_acc": "8.451e-01", "epoch": 0.02568} {"step": 12845, "loss": 1.3066, "grad_norm": "4.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.075e+00", "dlm_acc": "6.391e-01", "anc_acc": "6.250e-01", "epoch": 0.02569} {"step": 12850, "loss": 1.334, "grad_norm": "5.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.160e-01", "anc_loss": "9.725e-01", "dlm_acc": "6.762e-01", "anc_acc": "6.594e-01", "epoch": 0.0257} {"step": 12855, "loss": 1.2391, "grad_norm": "3.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.080e-01", "anc_loss": "8.564e-01", "dlm_acc": "6.892e-01", "anc_acc": "6.772e-01", "epoch": 0.02571} {"step": 12860, "loss": 1.3755, "grad_norm": "4.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.109e-01", "anc_loss": "8.469e-01", "dlm_acc": "6.892e-01", "anc_acc": "6.836e-01", "epoch": 0.02572} {"step": 12865, "loss": 1.3674, "grad_norm": "3.892e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.002e-01", "anc_loss": "5.262e-01", "dlm_acc": "8.080e-01", "anc_acc": "8.027e-01", "epoch": 0.02573} {"step": 12870, "loss": 1.3566, "grad_norm": "4.061e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.363e-01", "anc_loss": "6.766e-01", "dlm_acc": "6.952e-01", "anc_acc": "6.833e-01", "epoch": 0.02574} {"step": 12875, "loss": 1.2093, "grad_norm": "3.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.773e-01", "anc_loss": "7.211e-01", "dlm_acc": "7.123e-01", "anc_acc": "7.000e-01", "epoch": 0.02575} {"step": 12880, "loss": 1.568, "grad_norm": "3.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.449e+00", "dlm_acc": "5.590e-01", "anc_acc": "5.449e-01", "epoch": 0.02576} {"step": 12885, "loss": 1.5346, "grad_norm": "3.320e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.907e-01", "anc_acc": "5.752e-01", "epoch": 0.02577} {"step": 12890, "loss": 1.0687, "grad_norm": "2.003e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.055e-01", "anc_loss": "5.143e-01", "dlm_acc": "6.628e-01", "anc_acc": "6.602e-01", "epoch": 0.02578} {"step": 12895, "loss": 1.0397, "grad_norm": "3.280e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.235e-01", "anc_loss": "4.568e-01", "dlm_acc": "8.065e-01", "anc_acc": "7.981e-01", "epoch": 0.02579} {"step": 12900, "loss": 1.444, "grad_norm": "6.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.231e+00", "anc_loss": "1.311e+00", "dlm_acc": "5.839e-01", "anc_acc": "5.685e-01", "epoch": 0.0258} {"step": 12905, "loss": 0.745, "grad_norm": "4.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.238e-01", "anc_loss": "4.501e-01", "dlm_acc": "8.347e-01", "anc_acc": "8.288e-01", "epoch": 0.02581} {"step": 12910, "loss": 0.9403, "grad_norm": "3.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.070e+00", "dlm_acc": "3.325e-01", "anc_acc": "3.259e-01", "epoch": 0.02582} {"step": 12915, "loss": 1.3579, "grad_norm": "4.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.068e+00", "anc_loss": "1.071e+00", "dlm_acc": "1.098e-01", "anc_acc": "1.106e-01", "epoch": 0.02583} {"step": 12920, "loss": 1.0735, "grad_norm": "1.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.120e+00", "dlm_acc": "1.052e-01", "anc_acc": "1.072e-01", "epoch": 0.02584} {"step": 12925, "loss": 1.6141, "grad_norm": "1.099e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.341e+00", "anc_loss": "1.341e+00", "dlm_acc": "1.049e-01", "anc_acc": "1.052e-01", "epoch": 0.02585} {"step": 12930, "loss": 1.2564, "grad_norm": "3.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.139e+00", "dlm_acc": "9.975e-02", "anc_acc": "9.881e-02", "epoch": 0.02586} {"step": 12935, "loss": 1.3495, "grad_norm": "2.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.209e+00", "dlm_acc": "1.009e-01", "anc_acc": "1.026e-01", "epoch": 0.02587} {"step": 12940, "loss": 1.6167, "grad_norm": "3.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.239e+00", "dlm_acc": "1.012e-01", "anc_acc": "1.002e-01", "epoch": 0.02588} {"step": 12945, "loss": 1.2802, "grad_norm": "5.896e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.184e+00", "dlm_acc": "1.705e-01", "anc_acc": "1.702e-01", "epoch": 0.02589} {"step": 12950, "loss": 1.1872, "grad_norm": "2.930e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.083e-01", "anc_loss": "5.442e-01", "dlm_acc": "8.088e-01", "anc_acc": "8.016e-01", "epoch": 0.0259} {"step": 12955, "loss": 1.2025, "grad_norm": "4.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.340e-01", "anc_loss": "2.508e-01", "dlm_acc": "8.599e-01", "anc_acc": "8.524e-01", "epoch": 0.02591} {"step": 12960, "loss": 0.7696, "grad_norm": "4.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.400e-01", "anc_loss": "4.785e-01", "dlm_acc": "7.919e-01", "anc_acc": "7.779e-01", "epoch": 0.02592} {"step": 12965, "loss": 1.0064, "grad_norm": "3.255e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.348e-01", "anc_loss": "9.970e-01", "dlm_acc": "6.910e-01", "anc_acc": "6.769e-01", "epoch": 0.02593} {"step": 12970, "loss": 1.2282, "grad_norm": "3.193e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.891e-01", "anc_loss": "9.480e-01", "dlm_acc": "6.333e-01", "anc_acc": "6.163e-01", "epoch": 0.02594} {"step": 12975, "loss": 1.3696, "grad_norm": "3.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.402e-01", "anc_loss": "2.541e-01", "dlm_acc": "9.196e-01", "anc_acc": "9.178e-01", "epoch": 0.02595} {"step": 12980, "loss": 1.263, "grad_norm": "3.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.147e-01", "anc_loss": "7.705e-01", "dlm_acc": "7.100e-01", "anc_acc": "6.948e-01", "epoch": 0.02596} {"step": 12985, "loss": 0.9671, "grad_norm": "3.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.898e-01", "anc_loss": "8.270e-01", "dlm_acc": "6.628e-01", "anc_acc": "6.524e-01", "epoch": 0.02597} {"step": 12990, "loss": 1.1809, "grad_norm": "3.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.563e-01", "anc_loss": "1.014e+00", "dlm_acc": "5.943e-01", "anc_acc": "5.818e-01", "epoch": 0.02598} {"step": 12995, "loss": 1.3736, "grad_norm": "3.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.423e-01", "anc_loss": "8.944e-01", "dlm_acc": "7.346e-01", "anc_acc": "7.226e-01", "epoch": 0.02599} {"step": 13000, "loss": 1.0432, "grad_norm": "4.367e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.270e-01", "anc_loss": "8.793e-01", "dlm_acc": "6.813e-01", "anc_acc": "6.655e-01", "epoch": 0.026} {"step": 13005, "loss": 1.1506, "grad_norm": "4.365e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.819e-01", "anc_loss": "3.236e-01", "dlm_acc": "8.883e-01", "anc_acc": "8.732e-01", "epoch": 0.02601} {"step": 13010, "loss": 1.3101, "grad_norm": "5.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.270e-01", "anc_loss": "4.567e-01", "dlm_acc": "7.951e-01", "anc_acc": "7.826e-01", "epoch": 0.02602} {"step": 13015, "loss": 0.8026, "grad_norm": "5.070e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.723e-01", "anc_loss": "1.868e-01", "dlm_acc": "8.977e-01", "anc_acc": "8.879e-01", "epoch": 0.02603} {"step": 13020, "loss": 1.0813, "grad_norm": "2.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.074e-01", "anc_loss": "4.389e-01", "dlm_acc": "8.408e-01", "anc_acc": "8.337e-01", "epoch": 0.02604} {"step": 13025, "loss": 1.3142, "grad_norm": "3.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.269e-01", "anc_loss": "8.002e-01", "dlm_acc": "7.393e-01", "anc_acc": "7.252e-01", "epoch": 0.02605} {"step": 13030, "loss": 1.1665, "grad_norm": "2.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.141e+00", "dlm_acc": "5.794e-01", "anc_acc": "5.655e-01", "epoch": 0.02606} {"step": 13035, "loss": 1.1547, "grad_norm": "6.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.417e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.095e-01", "anc_acc": "4.918e-01", "epoch": 0.02607} {"step": 13040, "loss": 0.8371, "grad_norm": "2.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.086e-01", "anc_loss": "8.826e-01", "dlm_acc": "6.788e-01", "anc_acc": "6.581e-01", "epoch": 0.02608} {"step": 13045, "loss": 1.3936, "grad_norm": "3.694e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.723e+00", "anc_loss": "1.811e+00", "dlm_acc": "4.976e-01", "anc_acc": "4.817e-01", "epoch": 0.02609} {"step": 13050, "loss": 1.5016, "grad_norm": "3.239e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.929e-01", "anc_acc": "5.744e-01", "epoch": 0.0261} {"step": 13055, "loss": 1.3402, "grad_norm": "4.094e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.561e-01", "anc_acc": "5.404e-01", "epoch": 0.02611} {"step": 13060, "loss": 1.0114, "grad_norm": "3.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.324e-01", "anc_loss": "9.059e-01", "dlm_acc": "6.946e-01", "anc_acc": "6.747e-01", "epoch": 0.02612} {"step": 13065, "loss": 1.7215, "grad_norm": "5.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.591e+00", "dlm_acc": "5.201e-01", "anc_acc": "5.015e-01", "epoch": 0.02613} {"step": 13070, "loss": 1.5814, "grad_norm": "4.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.527e-01", "anc_acc": "5.358e-01", "epoch": 0.02614} {"step": 13075, "loss": 1.8458, "grad_norm": "6.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.683e+00", "anc_loss": "1.766e+00", "dlm_acc": "4.931e-01", "anc_acc": "4.777e-01", "epoch": 0.02615} {"step": 13080, "loss": 1.1959, "grad_norm": "3.662e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.378e+00", "anc_loss": "1.456e+00", "dlm_acc": "5.147e-01", "anc_acc": "4.969e-01", "epoch": 0.02616} {"step": 13085, "loss": 0.955, "grad_norm": "3.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.879e-01", "anc_loss": "9.637e-01", "dlm_acc": "6.291e-01", "anc_acc": "6.069e-01", "epoch": 0.02617} {"step": 13090, "loss": 1.498, "grad_norm": "3.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.499e-01", "anc_acc": "5.332e-01", "epoch": 0.02618} {"step": 13095, "loss": 1.2996, "grad_norm": "3.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.615e-01", "anc_acc": "5.415e-01", "epoch": 0.02619} {"step": 13100, "loss": 1.6336, "grad_norm": "4.291e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.422e+00", "anc_loss": "1.513e+00", "dlm_acc": "5.500e-01", "anc_acc": "5.323e-01", "epoch": 0.0262} {"step": 13105, "loss": 1.4806, "grad_norm": "4.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.229e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.499e-01", "anc_acc": "5.395e-01", "epoch": 0.02621} {"step": 13110, "loss": 1.3993, "grad_norm": "2.804e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.609e-01", "anc_loss": "1.009e+00", "dlm_acc": "5.716e-01", "anc_acc": "5.587e-01", "epoch": 0.02622} {"step": 13115, "loss": 1.1576, "grad_norm": "4.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.077e+00", "dlm_acc": "5.962e-01", "anc_acc": "5.777e-01", "epoch": 0.02623} {"step": 13120, "loss": 1.3004, "grad_norm": "2.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.089e+00", "anc_loss": "1.130e+00", "dlm_acc": "5.009e-01", "anc_acc": "4.933e-01", "epoch": 0.02624} {"step": 13125, "loss": 1.2044, "grad_norm": "3.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.512e-01", "anc_loss": "7.758e-01", "dlm_acc": "5.602e-01", "anc_acc": "5.527e-01", "epoch": 0.02625} {"step": 13130, "loss": 1.4992, "grad_norm": "3.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.187e+00", "dlm_acc": "5.389e-01", "anc_acc": "5.258e-01", "epoch": 0.02626} {"step": 13135, "loss": 1.4875, "grad_norm": "3.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.297e-01", "anc_loss": "9.516e-01", "dlm_acc": "4.496e-01", "anc_acc": "4.426e-01", "epoch": 0.02627} {"step": 13140, "loss": 1.3607, "grad_norm": "3.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.220e+00", "dlm_acc": "5.300e-01", "anc_acc": "5.146e-01", "epoch": 0.02628} {"step": 13145, "loss": 1.6341, "grad_norm": "4.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.184e+00", "dlm_acc": "5.425e-01", "anc_acc": "5.275e-01", "epoch": 0.02629} {"step": 13150, "loss": 1.2664, "grad_norm": "3.166e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.098e-01", "anc_loss": "7.520e-01", "dlm_acc": "5.836e-01", "anc_acc": "5.648e-01", "epoch": 0.0263} {"step": 13155, "loss": 1.4112, "grad_norm": "3.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.085e+00", "dlm_acc": "5.978e-01", "anc_acc": "5.851e-01", "epoch": 0.02631} {"step": 13160, "loss": 1.3292, "grad_norm": "3.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.719e-01", "anc_loss": "9.289e-01", "dlm_acc": "5.688e-01", "anc_acc": "5.499e-01", "epoch": 0.02632} {"step": 13165, "loss": 1.3924, "grad_norm": "2.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.604e-01", "anc_loss": "8.068e-01", "dlm_acc": "6.546e-01", "anc_acc": "6.423e-01", "epoch": 0.02633} {"step": 13170, "loss": 1.0422, "grad_norm": "3.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.419e-01", "anc_loss": "2.700e-01", "dlm_acc": "7.817e-01", "anc_acc": "7.609e-01", "epoch": 0.02634} {"step": 13175, "loss": 1.3304, "grad_norm": "3.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.918e-01", "anc_loss": "4.313e-01", "dlm_acc": "7.001e-01", "anc_acc": "6.717e-01", "epoch": 0.02635} {"step": 13180, "loss": 1.7077, "grad_norm": "4.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.586e+00", "dlm_acc": "5.011e-01", "anc_acc": "4.854e-01", "epoch": 0.02636} {"step": 13185, "loss": 1.1913, "grad_norm": "2.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.026e+00", "anc_loss": "1.099e+00", "dlm_acc": "6.399e-01", "anc_acc": "6.241e-01", "epoch": 0.02637} {"step": 13190, "loss": 1.6517, "grad_norm": "4.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.071e+00", "dlm_acc": "5.893e-01", "anc_acc": "5.762e-01", "epoch": 0.02638} {"step": 13195, "loss": 1.7847, "grad_norm": "3.041e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.863e-01", "anc_loss": "5.977e-01", "dlm_acc": "5.904e-01", "anc_acc": "5.863e-01", "epoch": 0.02639} {"step": 13200, "loss": 1.3163, "grad_norm": "2.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.430e-01", "anc_loss": "6.605e-01", "dlm_acc": "5.664e-01", "anc_acc": "5.610e-01", "epoch": 0.0264} {"step": 13205, "loss": 1.2128, "grad_norm": "3.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.891e-01", "anc_loss": "5.165e-01", "dlm_acc": "8.426e-01", "anc_acc": "8.342e-01", "epoch": 0.02641} {"step": 13210, "loss": 0.9696, "grad_norm": "2.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.875e-01", "anc_loss": "9.465e-01", "dlm_acc": "6.043e-01", "anc_acc": "5.928e-01", "epoch": 0.02642} {"step": 13215, "loss": 1.4029, "grad_norm": "5.834e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.156e+00", "dlm_acc": "5.193e-01", "anc_acc": "5.065e-01", "epoch": 0.02643} {"step": 13220, "loss": 1.3179, "grad_norm": "2.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.365e+00", "dlm_acc": "5.424e-01", "anc_acc": "5.230e-01", "epoch": 0.02644} {"step": 13225, "loss": 1.1765, "grad_norm": "6.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.202e+00", "dlm_acc": "5.790e-01", "anc_acc": "5.590e-01", "epoch": 0.02645} {"step": 13230, "loss": 1.4793, "grad_norm": "4.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.536e+00", "dlm_acc": "4.861e-01", "anc_acc": "4.728e-01", "epoch": 0.02646} {"step": 13235, "loss": 1.3666, "grad_norm": "4.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.309e-01", "anc_loss": "9.840e-01", "dlm_acc": "6.317e-01", "anc_acc": "6.197e-01", "epoch": 0.02647} {"step": 13240, "loss": 1.0552, "grad_norm": "5.237e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.865e-01", "anc_loss": "5.244e-01", "dlm_acc": "7.315e-01", "anc_acc": "7.183e-01", "epoch": 0.02648} {"step": 13245, "loss": 0.9938, "grad_norm": "4.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.316e-01", "anc_loss": "8.703e-01", "dlm_acc": "5.776e-01", "anc_acc": "5.682e-01", "epoch": 0.02649} {"step": 13250, "loss": 1.392, "grad_norm": "4.201e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.509e-01", "anc_acc": "5.359e-01", "epoch": 0.0265} {"step": 13255, "loss": 1.2427, "grad_norm": "2.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.918e-01", "anc_loss": "7.211e-01", "dlm_acc": "5.870e-01", "anc_acc": "5.763e-01", "epoch": 0.02651} {"step": 13260, "loss": 1.0734, "grad_norm": "1.359e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.721e-01", "anc_loss": "6.934e-01", "dlm_acc": "6.301e-01", "anc_acc": "6.204e-01", "epoch": 0.02652} {"step": 13265, "loss": 1.3173, "grad_norm": "5.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.316e-01", "anc_loss": "8.871e-01", "dlm_acc": "6.863e-01", "anc_acc": "6.698e-01", "epoch": 0.02653} {"step": 13270, "loss": 1.1326, "grad_norm": "4.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.031e-01", "anc_loss": "9.437e-01", "dlm_acc": "6.244e-01", "anc_acc": "6.158e-01", "epoch": 0.02654} {"step": 13275, "loss": 0.8511, "grad_norm": "4.598e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.687e-01", "anc_loss": "7.109e-01", "dlm_acc": "6.465e-01", "anc_acc": "6.278e-01", "epoch": 0.02655} {"step": 13280, "loss": 1.0698, "grad_norm": "4.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.980e-01", "anc_loss": "8.605e-01", "dlm_acc": "6.783e-01", "anc_acc": "6.636e-01", "epoch": 0.02656} {"step": 13285, "loss": 1.386, "grad_norm": "4.667e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.783e-01", "anc_loss": "8.309e-01", "dlm_acc": "6.514e-01", "anc_acc": "6.379e-01", "epoch": 0.02657} {"step": 13290, "loss": 1.1146, "grad_norm": "4.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.139e+00", "dlm_acc": "6.019e-01", "anc_acc": "5.875e-01", "epoch": 0.02658} {"step": 13295, "loss": 1.3608, "grad_norm": "4.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.482e-01", "anc_loss": "3.603e-01", "dlm_acc": "7.493e-01", "anc_acc": "7.388e-01", "epoch": 0.02659} {"step": 13300, "loss": 1.2049, "grad_norm": "3.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.529e-01", "anc_loss": "3.598e-01", "dlm_acc": "7.898e-01", "anc_acc": "7.876e-01", "epoch": 0.0266} {"step": 13305, "loss": 1.0478, "grad_norm": "2.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.894e-02", "anc_loss": "8.179e-02", "dlm_acc": "9.429e-01", "anc_acc": "9.418e-01", "epoch": 0.02661} {"step": 13310, "loss": 0.9943, "grad_norm": "3.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.750e-02", "anc_loss": "1.869e-02", "dlm_acc": "9.863e-01", "anc_acc": "9.859e-01", "epoch": 0.02662} {"step": 13315, "loss": 1.5228, "grad_norm": "5.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.695e+00", "anc_loss": "1.786e+00", "dlm_acc": "4.751e-01", "anc_acc": "4.582e-01", "epoch": 0.02663} {"step": 13320, "loss": 1.6922, "grad_norm": "3.702e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.705e+00", "anc_loss": "1.795e+00", "dlm_acc": "4.894e-01", "anc_acc": "4.714e-01", "epoch": 0.02664} {"step": 13325, "loss": 1.3027, "grad_norm": "5.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.210e+00", "dlm_acc": "5.866e-01", "anc_acc": "5.687e-01", "epoch": 0.02665} {"step": 13330, "loss": 1.294, "grad_norm": "4.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.115e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.915e-01", "anc_acc": "5.746e-01", "epoch": 0.02666} {"step": 13335, "loss": 1.3236, "grad_norm": "1.880e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.604e-01", "anc_acc": "5.420e-01", "epoch": 0.02667} {"step": 13340, "loss": 1.4033, "grad_norm": "3.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.809e-01", "anc_acc": "5.649e-01", "epoch": 0.02668} {"step": 13345, "loss": 1.968, "grad_norm": "4.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.883e+00", "anc_loss": "1.981e+00", "dlm_acc": "4.439e-01", "anc_acc": "4.271e-01", "epoch": 0.02669} {"step": 13350, "loss": 1.3986, "grad_norm": "2.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.415e+00", "dlm_acc": "5.711e-01", "anc_acc": "5.527e-01", "epoch": 0.0267} {"step": 13355, "loss": 1.7737, "grad_norm": "3.385e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.620e+00", "dlm_acc": "5.262e-01", "anc_acc": "5.083e-01", "epoch": 0.02671} {"step": 13360, "loss": 1.2611, "grad_norm": "2.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.992e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.525e-01", "anc_acc": "6.350e-01", "epoch": 0.02672} {"step": 13365, "loss": 1.3957, "grad_norm": "3.418e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.703e-01", "anc_loss": "4.048e-01", "dlm_acc": "8.673e-01", "anc_acc": "8.595e-01", "epoch": 0.02673} {"step": 13370, "loss": 1.1823, "grad_norm": "2.858e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.078e+00", "anc_loss": "1.163e+00", "dlm_acc": "6.169e-01", "anc_acc": "5.999e-01", "epoch": 0.02674} {"step": 13375, "loss": 1.3871, "grad_norm": "5.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.705e-01", "anc_acc": "5.476e-01", "epoch": 0.02675} {"step": 13380, "loss": 1.5978, "grad_norm": "3.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.204e+00", "dlm_acc": "6.042e-01", "anc_acc": "5.866e-01", "epoch": 0.02676} {"step": 13385, "loss": 1.638, "grad_norm": "3.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.619e+00", "anc_loss": "1.716e+00", "dlm_acc": "4.761e-01", "anc_acc": "4.592e-01", "epoch": 0.02677} {"step": 13390, "loss": 1.397, "grad_norm": "3.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.325e+00", "anc_loss": "1.388e+00", "dlm_acc": "5.438e-01", "anc_acc": "5.288e-01", "epoch": 0.02678} {"step": 13395, "loss": 1.2106, "grad_norm": "3.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.297e+00", "dlm_acc": "5.409e-01", "anc_acc": "5.226e-01", "epoch": 0.02679} {"step": 13400, "loss": 1.4255, "grad_norm": "3.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.938e+00", "anc_loss": "2.029e+00", "dlm_acc": "2.847e-01", "anc_acc": "2.602e-01", "epoch": 0.0268} {"step": 13405, "loss": 1.7427, "grad_norm": "4.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.631e+00", "anc_loss": "2.703e+00", "dlm_acc": "7.583e-02", "anc_acc": "5.668e-02", "epoch": 0.02681} {"step": 13410, "loss": 1.5569, "grad_norm": "6.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.183e+00", "dlm_acc": "5.655e-01", "anc_acc": "5.505e-01", "epoch": 0.02682} {"step": 13415, "loss": 1.612, "grad_norm": "1.177e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.085e+00", "anc_loss": "1.157e+00", "dlm_acc": "6.321e-01", "anc_acc": "6.143e-01", "epoch": 0.02683} {"step": 13420, "loss": 1.5023, "grad_norm": "5.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.635e-01", "anc_acc": "5.522e-01", "epoch": 0.02684} {"step": 13425, "loss": 1.6908, "grad_norm": "4.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.487e+00", "dlm_acc": "5.231e-01", "anc_acc": "5.058e-01", "epoch": 0.02685} {"step": 13430, "loss": 1.1291, "grad_norm": "4.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.292e+00", "anc_loss": "1.375e+00", "dlm_acc": "5.367e-01", "anc_acc": "5.205e-01", "epoch": 0.02686} {"step": 13435, "loss": 1.2598, "grad_norm": "3.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.655e-01", "anc_acc": "5.464e-01", "epoch": 0.02687} {"step": 13440, "loss": 1.4107, "grad_norm": "2.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.511e-01", "anc_acc": "5.303e-01", "epoch": 0.02688} {"step": 13445, "loss": 1.1794, "grad_norm": "3.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.343e+00", "dlm_acc": "4.948e-01", "anc_acc": "4.798e-01", "epoch": 0.02689} {"step": 13450, "loss": 1.4083, "grad_norm": "2.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.152e+00", "dlm_acc": "5.949e-01", "anc_acc": "5.802e-01", "epoch": 0.0269} {"step": 13455, "loss": 1.6835, "grad_norm": "9.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.609e+00", "anc_loss": "1.681e+00", "dlm_acc": "4.832e-01", "anc_acc": "4.615e-01", "epoch": 0.02691} {"step": 13460, "loss": 1.3337, "grad_norm": "8.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.450e+00", "dlm_acc": "4.782e-01", "anc_acc": "4.682e-01", "epoch": 0.02692} {"step": 13465, "loss": 1.497, "grad_norm": "3.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.467e+00", "anc_loss": "1.555e+00", "dlm_acc": "5.002e-01", "anc_acc": "4.795e-01", "epoch": 0.02693} {"step": 13470, "loss": 1.334, "grad_norm": "3.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.018e+00", "anc_loss": "1.095e+00", "dlm_acc": "6.154e-01", "anc_acc": "5.978e-01", "epoch": 0.02694} {"step": 13475, "loss": 1.2581, "grad_norm": "5.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.694e-01", "anc_acc": "5.526e-01", "epoch": 0.02695} {"step": 13480, "loss": 1.0027, "grad_norm": "2.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.250e-01", "anc_loss": "9.711e-01", "dlm_acc": "6.507e-01", "anc_acc": "6.388e-01", "epoch": 0.02696} {"step": 13485, "loss": 1.1772, "grad_norm": "8.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.641e-01", "anc_loss": "9.977e-01", "dlm_acc": "5.769e-01", "anc_acc": "5.623e-01", "epoch": 0.02697} {"step": 13490, "loss": 1.2698, "grad_norm": "2.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.289e+00", "dlm_acc": "5.784e-01", "anc_acc": "5.504e-01", "epoch": 0.02698} {"step": 13495, "loss": 1.4256, "grad_norm": "3.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.000e-01", "anc_loss": "9.328e-01", "dlm_acc": "6.658e-01", "anc_acc": "6.560e-01", "epoch": 0.02699} {"step": 13500, "loss": 1.4936, "grad_norm": "3.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.539e-01", "anc_loss": "5.836e-01", "dlm_acc": "8.122e-01", "anc_acc": "8.060e-01", "epoch": 0.027} {"step": 13505, "loss": 1.916, "grad_norm": "1.761e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.228e+00", "anc_loss": "2.283e+00", "dlm_acc": "3.213e-01", "anc_acc": "3.137e-01", "epoch": 0.02701} {"step": 13510, "loss": 1.5885, "grad_norm": "7.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.636e+00", "dlm_acc": "4.516e-01", "anc_acc": "4.313e-01", "epoch": 0.02702} {"step": 13515, "loss": 1.3556, "grad_norm": "3.770e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.569e+00", "anc_loss": "1.670e+00", "dlm_acc": "4.736e-01", "anc_acc": "4.547e-01", "epoch": 0.02703} {"step": 13520, "loss": 1.1379, "grad_norm": "6.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.302e-01", "anc_acc": "5.127e-01", "epoch": 0.02704} {"step": 13525, "loss": 1.5625, "grad_norm": "4.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.371e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.288e-01", "anc_acc": "5.079e-01", "epoch": 0.02705} {"step": 13530, "loss": 1.6717, "grad_norm": "2.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.966e+00", "anc_loss": "2.034e+00", "dlm_acc": "3.948e-01", "anc_acc": "3.813e-01", "epoch": 0.02706} {"step": 13535, "loss": 1.2078, "grad_norm": "2.643e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.536e-01", "anc_acc": "5.363e-01", "epoch": 0.02707} {"step": 13540, "loss": 1.1741, "grad_norm": "1.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.270e+00", "dlm_acc": "5.953e-01", "anc_acc": "5.761e-01", "epoch": 0.02708} {"step": 13545, "loss": 1.8453, "grad_norm": "4.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.675e+00", "anc_loss": "1.769e+00", "dlm_acc": "4.770e-01", "anc_acc": "4.592e-01", "epoch": 0.02709} {"step": 13550, "loss": 1.6311, "grad_norm": "4.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.516e+00", "anc_loss": "1.606e+00", "dlm_acc": "5.244e-01", "anc_acc": "5.063e-01", "epoch": 0.0271} {"step": 13555, "loss": 1.5984, "grad_norm": "5.179e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.504e-01", "anc_acc": "5.319e-01", "epoch": 0.02711} {"step": 13560, "loss": 1.4212, "grad_norm": "3.160e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.583e+00", "dlm_acc": "5.043e-01", "anc_acc": "4.873e-01", "epoch": 0.02712} {"step": 13565, "loss": 1.7035, "grad_norm": "1.032e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.831e+00", "anc_loss": "1.923e+00", "dlm_acc": "4.852e-01", "anc_acc": "4.689e-01", "epoch": 0.02713} {"step": 13570, "loss": 1.3703, "grad_norm": "4.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.820e+00", "anc_loss": "1.923e+00", "dlm_acc": "4.718e-01", "anc_acc": "4.509e-01", "epoch": 0.02714} {"step": 13575, "loss": 1.6198, "grad_norm": "4.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.536e+00", "dlm_acc": "5.195e-01", "anc_acc": "5.032e-01", "epoch": 0.02715} {"step": 13580, "loss": 1.497, "grad_norm": "3.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.458e+00", "anc_loss": "1.542e+00", "dlm_acc": "5.233e-01", "anc_acc": "5.039e-01", "epoch": 0.02716} {"step": 13585, "loss": 1.1266, "grad_norm": "3.010e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.522e+00", "dlm_acc": "5.509e-01", "anc_acc": "5.320e-01", "epoch": 0.02717} {"step": 13590, "loss": 1.3133, "grad_norm": "4.075e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.509e+00", "dlm_acc": "5.393e-01", "anc_acc": "5.231e-01", "epoch": 0.02718} {"step": 13595, "loss": 1.6721, "grad_norm": "5.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.501e-01", "anc_acc": "5.309e-01", "epoch": 0.02719} {"step": 13600, "loss": 1.2476, "grad_norm": "3.569e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.487e+00", "anc_loss": "1.591e+00", "dlm_acc": "5.409e-01", "anc_acc": "5.203e-01", "epoch": 0.0272} {"step": 13605, "loss": 1.4806, "grad_norm": "3.883e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.675e+00", "dlm_acc": "4.898e-01", "anc_acc": "4.754e-01", "epoch": 0.02721} {"step": 13610, "loss": 1.4269, "grad_norm": "5.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.523e+00", "anc_loss": "1.612e+00", "dlm_acc": "5.223e-01", "anc_acc": "5.049e-01", "epoch": 0.02722} {"step": 13615, "loss": 1.4801, "grad_norm": "2.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.341e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.820e-01", "anc_acc": "5.711e-01", "epoch": 0.02723} {"step": 13620, "loss": 1.1971, "grad_norm": "3.049e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.412e+00", "dlm_acc": "5.331e-01", "anc_acc": "5.201e-01", "epoch": 0.02724} {"step": 13625, "loss": 1.2417, "grad_norm": "4.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.445e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.122e-01", "anc_acc": "4.952e-01", "epoch": 0.02725} {"step": 13630, "loss": 1.3158, "grad_norm": "5.401e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.237e-01", "anc_acc": "5.077e-01", "epoch": 0.02726} {"step": 13635, "loss": 1.3003, "grad_norm": "2.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.379e+00", "dlm_acc": "5.621e-01", "anc_acc": "5.477e-01", "epoch": 0.02727} {"step": 13640, "loss": 1.0166, "grad_norm": "2.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.239e+00", "dlm_acc": "5.592e-01", "anc_acc": "5.419e-01", "epoch": 0.02728} {"step": 13645, "loss": 1.3079, "grad_norm": "4.313e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.698e+00", "anc_loss": "1.794e+00", "dlm_acc": "4.705e-01", "anc_acc": "4.520e-01", "epoch": 0.02729} {"step": 13650, "loss": 1.1744, "grad_norm": "8.798e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.370e+00", "dlm_acc": "3.924e-01", "anc_acc": "3.845e-01", "epoch": 0.0273} {"step": 13655, "loss": 1.0936, "grad_norm": "4.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.180e+00", "dlm_acc": "4.156e-01", "anc_acc": "4.087e-01", "epoch": 0.02731} {"step": 13660, "loss": 1.2291, "grad_norm": "3.774e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.122e+00", "anc_loss": "1.185e+00", "dlm_acc": "5.693e-01", "anc_acc": "5.556e-01", "epoch": 0.02732} {"step": 13665, "loss": 1.8589, "grad_norm": "5.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.436e+00", "dlm_acc": "3.686e-01", "anc_acc": "3.576e-01", "epoch": 0.02733} {"step": 13670, "loss": 1.2308, "grad_norm": "2.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.443e+00", "anc_loss": "1.526e+00", "dlm_acc": "5.479e-01", "anc_acc": "5.300e-01", "epoch": 0.02734} {"step": 13675, "loss": 1.5821, "grad_norm": "3.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.859e+00", "anc_loss": "1.961e+00", "dlm_acc": "4.612e-01", "anc_acc": "4.427e-01", "epoch": 0.02735} {"step": 13680, "loss": 1.2862, "grad_norm": "4.401e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.493e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.492e-01", "epoch": 0.02736} {"step": 13685, "loss": 1.5292, "grad_norm": "4.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.719e+00", "anc_loss": "1.800e+00", "dlm_acc": "4.421e-01", "anc_acc": "4.251e-01", "epoch": 0.02737} {"step": 13690, "loss": 1.0904, "grad_norm": "3.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.785e-01", "anc_loss": "1.036e+00", "dlm_acc": "6.145e-01", "anc_acc": "6.005e-01", "epoch": 0.02738} {"step": 13695, "loss": 1.4972, "grad_norm": "2.596e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.453e-01", "anc_loss": "9.887e-01", "dlm_acc": "5.601e-01", "anc_acc": "5.447e-01", "epoch": 0.02739} {"step": 13700, "loss": 1.2878, "grad_norm": "3.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.820e-01", "anc_loss": "7.941e-01", "dlm_acc": "4.337e-01", "anc_acc": "4.252e-01", "epoch": 0.0274} {"step": 13705, "loss": 1.0654, "grad_norm": "5.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.004e-01", "anc_loss": "6.074e-01", "dlm_acc": "5.342e-01", "anc_acc": "5.336e-01", "epoch": 0.02741} {"step": 13710, "loss": 1.5158, "grad_norm": "5.915e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.781e-01", "anc_loss": "6.969e-01", "dlm_acc": "5.571e-01", "anc_acc": "5.506e-01", "epoch": 0.02742} {"step": 13715, "loss": 1.3992, "grad_norm": "4.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.508e-01", "anc_loss": "8.914e-01", "dlm_acc": "5.705e-01", "anc_acc": "5.614e-01", "epoch": 0.02743} {"step": 13720, "loss": 1.5276, "grad_norm": "4.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.603e+00", "anc_loss": "1.697e+00", "dlm_acc": "5.071e-01", "anc_acc": "4.915e-01", "epoch": 0.02744} {"step": 13725, "loss": 1.0562, "grad_norm": "6.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.762e+00", "anc_loss": "1.809e+00", "dlm_acc": "3.118e-01", "anc_acc": "3.016e-01", "epoch": 0.02745} {"step": 13730, "loss": 1.0917, "grad_norm": "3.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.170e+00", "dlm_acc": "3.490e-01", "anc_acc": "3.364e-01", "epoch": 0.02746} {"step": 13735, "loss": 1.3941, "grad_norm": "4.053e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.313e+00", "anc_loss": "1.444e+00", "dlm_acc": "5.451e-01", "anc_acc": "5.212e-01", "epoch": 0.02747} {"step": 13740, "loss": 1.4621, "grad_norm": "9.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.197e+00", "dlm_acc": "6.023e-01", "anc_acc": "5.897e-01", "epoch": 0.02748} {"step": 13745, "loss": 0.8958, "grad_norm": "3.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.659e-01", "anc_loss": "4.113e-01", "dlm_acc": "8.430e-01", "anc_acc": "8.328e-01", "epoch": 0.02749} {"step": 13750, "loss": 1.5327, "grad_norm": "3.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.628e+00", "anc_loss": "1.716e+00", "dlm_acc": "4.842e-01", "anc_acc": "4.670e-01", "epoch": 0.0275} {"step": 13755, "loss": 1.3492, "grad_norm": "1.492e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.163e+00", "anc_loss": "1.241e+00", "dlm_acc": "5.423e-01", "anc_acc": "5.245e-01", "epoch": 0.02751} {"step": 13760, "loss": 1.1682, "grad_norm": "4.855e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.206e+00", "dlm_acc": "5.349e-01", "anc_acc": "4.963e-01", "epoch": 0.02752} {"step": 13765, "loss": 1.0933, "grad_norm": "2.955e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.175e+00", "dlm_acc": "5.866e-01", "anc_acc": "5.504e-01", "epoch": 0.02753} {"step": 13770, "loss": 1.0066, "grad_norm": "5.758e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.179e+00", "dlm_acc": "5.709e-01", "anc_acc": "5.516e-01", "epoch": 0.02754} {"step": 13775, "loss": 0.8218, "grad_norm": "2.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.207e-01", "anc_loss": "5.777e-01", "dlm_acc": "7.739e-01", "anc_acc": "7.576e-01", "epoch": 0.02755} {"step": 13780, "loss": 0.8151, "grad_norm": "4.379e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.062e-01", "anc_loss": "6.469e-01", "dlm_acc": "7.315e-01", "anc_acc": "7.238e-01", "epoch": 0.02756} {"step": 13785, "loss": 1.0873, "grad_norm": "3.785e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.186e+00", "anc_loss": "1.301e+00", "dlm_acc": "5.851e-01", "anc_acc": "5.578e-01", "epoch": 0.02757} {"step": 13790, "loss": 0.7419, "grad_norm": "1.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.926e-01", "anc_loss": "8.805e-01", "dlm_acc": "6.442e-01", "anc_acc": "6.156e-01", "epoch": 0.02758} {"step": 13795, "loss": 1.1555, "grad_norm": "2.688e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.122e+00", "anc_loss": "1.204e+00", "dlm_acc": "5.936e-01", "anc_acc": "5.740e-01", "epoch": 0.02759} {"step": 13800, "loss": 1.2785, "grad_norm": "2.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.063e+00", "dlm_acc": "5.848e-01", "anc_acc": "5.679e-01", "epoch": 0.0276} {"step": 13805, "loss": 1.7441, "grad_norm": "3.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.238e+00", "dlm_acc": "4.912e-01", "anc_acc": "4.748e-01", "epoch": 0.02761} {"step": 13810, "loss": 1.3486, "grad_norm": "3.075e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.652e-01", "anc_loss": "8.113e-01", "dlm_acc": "6.125e-01", "anc_acc": "5.984e-01", "epoch": 0.02762} {"step": 13815, "loss": 1.282, "grad_norm": "6.620e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.393e+00", "anc_loss": "1.479e+00", "dlm_acc": "4.963e-01", "anc_acc": "4.791e-01", "epoch": 0.02763} {"step": 13820, "loss": 1.3382, "grad_norm": "4.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.475e+00", "dlm_acc": "5.114e-01", "anc_acc": "4.934e-01", "epoch": 0.02764} {"step": 13825, "loss": 1.2345, "grad_norm": "5.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.629e-01", "anc_loss": "9.180e-01", "dlm_acc": "5.956e-01", "anc_acc": "5.777e-01", "epoch": 0.02765} {"step": 13830, "loss": 1.2238, "grad_norm": "4.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.111e+00", "dlm_acc": "6.387e-01", "anc_acc": "6.145e-01", "epoch": 0.02766} {"step": 13835, "loss": 1.2608, "grad_norm": "4.964e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.613e+00", "anc_loss": "1.661e+00", "dlm_acc": "4.242e-01", "anc_acc": "4.132e-01", "epoch": 0.02767} {"step": 13840, "loss": 1.1252, "grad_norm": "4.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.727e-01", "anc_loss": "1.072e+00", "dlm_acc": "6.333e-01", "anc_acc": "6.092e-01", "epoch": 0.02768} {"step": 13845, "loss": 0.9791, "grad_norm": "2.964e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.465e-01", "anc_loss": "7.352e-01", "dlm_acc": "7.283e-01", "anc_acc": "6.992e-01", "epoch": 0.02769} {"step": 13850, "loss": 1.405, "grad_norm": "5.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.379e-01", "anc_loss": "9.922e-01", "dlm_acc": "6.521e-01", "anc_acc": "6.435e-01", "epoch": 0.0277} {"step": 13855, "loss": 1.652, "grad_norm": "4.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.859e-01", "anc_acc": "5.675e-01", "epoch": 0.02771} {"step": 13860, "loss": 1.2773, "grad_norm": "3.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.142e+00", "dlm_acc": "6.182e-01", "anc_acc": "6.015e-01", "epoch": 0.02772} {"step": 13865, "loss": 0.9787, "grad_norm": "5.011e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.811e-01", "anc_loss": "9.561e-01", "dlm_acc": "6.493e-01", "anc_acc": "6.283e-01", "epoch": 0.02773} {"step": 13870, "loss": 1.0223, "grad_norm": "4.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.840e-01", "anc_loss": "7.574e-01", "dlm_acc": "6.607e-01", "anc_acc": "6.354e-01", "epoch": 0.02774} {"step": 13875, "loss": 1.4913, "grad_norm": "7.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.605e+00", "anc_loss": "1.693e+00", "dlm_acc": "4.893e-01", "anc_acc": "4.734e-01", "epoch": 0.02775} {"step": 13880, "loss": 1.2808, "grad_norm": "2.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.338e+00", "anc_loss": "1.429e+00", "dlm_acc": "5.429e-01", "anc_acc": "5.245e-01", "epoch": 0.02776} {"step": 13885, "loss": 0.8823, "grad_norm": "2.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.141e-01", "anc_loss": "7.340e-01", "dlm_acc": "5.798e-01", "anc_acc": "5.749e-01", "epoch": 0.02777} {"step": 13890, "loss": 1.3194, "grad_norm": "3.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.008e-01", "anc_loss": "6.117e-01", "dlm_acc": "5.887e-01", "anc_acc": "5.868e-01", "epoch": 0.02778} {"step": 13895, "loss": 1.0143, "grad_norm": "3.525e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.109e-01", "anc_loss": "5.199e-01", "dlm_acc": "6.110e-01", "anc_acc": "6.042e-01", "epoch": 0.02779} {"step": 13900, "loss": 0.8017, "grad_norm": "3.274e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.199e-01", "anc_loss": "4.266e-01", "dlm_acc": "6.310e-01", "anc_acc": "6.282e-01", "epoch": 0.0278} {"step": 13905, "loss": 1.2645, "grad_norm": "3.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.000e-01", "anc_loss": "9.352e-01", "dlm_acc": "5.158e-01", "anc_acc": "5.047e-01", "epoch": 0.02781} {"step": 13910, "loss": 1.7895, "grad_norm": "5.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.795e+00", "anc_loss": "1.891e+00", "dlm_acc": "4.680e-01", "anc_acc": "4.521e-01", "epoch": 0.02782} {"step": 13915, "loss": 1.7404, "grad_norm": "4.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.605e+00", "anc_loss": "1.673e+00", "dlm_acc": "4.530e-01", "anc_acc": "4.402e-01", "epoch": 0.02783} {"step": 13920, "loss": 1.6102, "grad_norm": "2.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.875e+00", "anc_loss": "2.883e+00", "dlm_acc": "2.223e-02", "anc_acc": "2.206e-02", "epoch": 0.02784} {"step": 13925, "loss": 1.6107, "grad_norm": "4.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.009e+00", "anc_loss": "3.016e+00", "dlm_acc": "2.357e-02", "anc_acc": "2.262e-02", "epoch": 0.02785} {"step": 13930, "loss": 1.2802, "grad_norm": "4.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.280e+00", "anc_loss": "2.322e+00", "dlm_acc": "1.906e-01", "anc_acc": "1.841e-01", "epoch": 0.02786} {"step": 13935, "loss": 1.2565, "grad_norm": "2.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.480e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.313e-01", "anc_acc": "5.129e-01", "epoch": 0.02787} {"step": 13940, "loss": 1.3059, "grad_norm": "2.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.204e-01", "anc_acc": "5.008e-01", "epoch": 0.02788} {"step": 13945, "loss": 1.3488, "grad_norm": "2.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.388e+00", "anc_loss": "1.497e+00", "dlm_acc": "5.515e-01", "anc_acc": "5.317e-01", "epoch": 0.02789} {"step": 13950, "loss": 1.5733, "grad_norm": "4.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.159e+00", "dlm_acc": "5.354e-01", "anc_acc": "5.241e-01", "epoch": 0.0279} {"step": 13955, "loss": 1.5878, "grad_norm": "3.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.606e+00", "anc_loss": "1.711e+00", "dlm_acc": "4.847e-01", "anc_acc": "4.672e-01", "epoch": 0.02791} {"step": 13960, "loss": 1.3094, "grad_norm": "4.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.642e+00", "dlm_acc": "4.782e-01", "anc_acc": "4.608e-01", "epoch": 0.02792} {"step": 13965, "loss": 1.4405, "grad_norm": "4.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.054e+00", "anc_loss": "1.127e+00", "dlm_acc": "5.854e-01", "anc_acc": "5.697e-01", "epoch": 0.02793} {"step": 13970, "loss": 1.3822, "grad_norm": "2.431e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.243e+00", "dlm_acc": "5.412e-01", "anc_acc": "5.249e-01", "epoch": 0.02794} {"step": 13975, "loss": 1.6461, "grad_norm": "4.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.664e+00", "anc_loss": "1.753e+00", "dlm_acc": "4.919e-01", "anc_acc": "4.735e-01", "epoch": 0.02795} {"step": 13980, "loss": 1.8552, "grad_norm": "3.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.597e+00", "anc_loss": "1.684e+00", "dlm_acc": "5.139e-01", "anc_acc": "4.974e-01", "epoch": 0.02796} {"step": 13985, "loss": 1.498, "grad_norm": "3.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.609e+00", "dlm_acc": "4.912e-01", "anc_acc": "4.741e-01", "epoch": 0.02797} {"step": 13990, "loss": 1.2267, "grad_norm": "2.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.031e+00", "anc_loss": "1.106e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.845e-01", "epoch": 0.02798} {"step": 13995, "loss": 1.4631, "grad_norm": "9.487e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.567e+00", "anc_loss": "1.653e+00", "dlm_acc": "4.917e-01", "anc_acc": "4.736e-01", "epoch": 0.02799} {"step": 14000, "loss": 1.0553, "grad_norm": "2.006e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.094e-01", "anc_loss": "9.453e-01", "dlm_acc": "4.519e-01", "anc_acc": "4.396e-01", "epoch": 0.028} {"step": 14005, "loss": 1.2237, "grad_norm": "3.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.172e+00", "anc_loss": "1.229e+00", "dlm_acc": "4.969e-01", "anc_acc": "4.813e-01", "epoch": 0.02801} {"step": 14010, "loss": 1.7487, "grad_norm": "4.540e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.560e+00", "dlm_acc": "5.318e-01", "anc_acc": "5.150e-01", "epoch": 0.02802} {"step": 14015, "loss": 1.1371, "grad_norm": "3.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.249e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.292e-01", "anc_acc": "5.097e-01", "epoch": 0.02803} {"step": 14020, "loss": 1.3806, "grad_norm": "2.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.303e+00", "dlm_acc": "5.936e-01", "anc_acc": "5.767e-01", "epoch": 0.02804} {"step": 14025, "loss": 1.2379, "grad_norm": "2.925e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.346e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.069e-01", "anc_acc": "4.897e-01", "epoch": 0.02805} {"step": 14030, "loss": 1.1847, "grad_norm": "2.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.452e-01", "anc_acc": "5.269e-01", "epoch": 0.02806} {"step": 14035, "loss": 1.3232, "grad_norm": "4.960e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.288e+00", "dlm_acc": "4.690e-01", "anc_acc": "4.556e-01", "epoch": 0.02807} {"step": 14040, "loss": 1.265, "grad_norm": "4.523e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.729e-01", "anc_loss": "7.402e-01", "dlm_acc": "7.431e-01", "anc_acc": "7.243e-01", "epoch": 0.02808} {"step": 14045, "loss": 1.1163, "grad_norm": "5.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.513e-01", "anc_acc": "5.351e-01", "epoch": 0.02809} {"step": 14050, "loss": 1.2129, "grad_norm": "2.748e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.825e+00", "anc_loss": "1.909e+00", "dlm_acc": "4.354e-01", "anc_acc": "4.197e-01", "epoch": 0.0281} {"step": 14055, "loss": 0.7944, "grad_norm": "1.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.286e+00", "dlm_acc": "5.430e-01", "anc_acc": "5.243e-01", "epoch": 0.02811} {"step": 14060, "loss": 1.1847, "grad_norm": "3.666e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.320e-01", "anc_acc": "5.183e-01", "epoch": 0.02812} {"step": 14065, "loss": 1.8735, "grad_norm": "3.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.775e+00", "anc_loss": "1.875e+00", "dlm_acc": "4.902e-01", "anc_acc": "4.722e-01", "epoch": 0.02813} {"step": 14070, "loss": 1.2987, "grad_norm": "2.931e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.680e+00", "dlm_acc": "4.964e-01", "anc_acc": "4.805e-01", "epoch": 0.02814} {"step": 14075, "loss": 0.9813, "grad_norm": "5.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.953e-01", "anc_loss": "9.613e-01", "dlm_acc": "6.169e-01", "anc_acc": "6.016e-01", "epoch": 0.02815} {"step": 14080, "loss": 1.1798, "grad_norm": "3.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.459e+00", "anc_loss": "1.541e+00", "dlm_acc": "4.877e-01", "anc_acc": "4.691e-01", "epoch": 0.02816} {"step": 14085, "loss": 1.6359, "grad_norm": "6.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.608e+00", "anc_loss": "1.692e+00", "dlm_acc": "4.789e-01", "anc_acc": "4.633e-01", "epoch": 0.02817} {"step": 14090, "loss": 1.2397, "grad_norm": "3.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.771e-01", "anc_acc": "5.567e-01", "epoch": 0.02818} {"step": 14095, "loss": 1.3675, "grad_norm": "2.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.271e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.706e-01", "anc_acc": "5.513e-01", "epoch": 0.02819} {"step": 14100, "loss": 1.507, "grad_norm": "3.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.429e+00", "dlm_acc": "5.429e-01", "anc_acc": "5.229e-01", "epoch": 0.0282} {"step": 14105, "loss": 1.321, "grad_norm": "1.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.505e+00", "dlm_acc": "5.108e-01", "anc_acc": "4.886e-01", "epoch": 0.02821} {"step": 14110, "loss": 1.5575, "grad_norm": "5.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.363e+00", "dlm_acc": "6.077e-01", "anc_acc": "5.921e-01", "epoch": 0.02822} {"step": 14115, "loss": 1.4759, "grad_norm": "3.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.771e-01", "anc_acc": "5.609e-01", "epoch": 0.02823} {"step": 14120, "loss": 1.2553, "grad_norm": "3.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.564e-01", "anc_acc": "5.361e-01", "epoch": 0.02824} {"step": 14125, "loss": 1.5034, "grad_norm": "3.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.703e+00", "anc_loss": "1.795e+00", "dlm_acc": "4.668e-01", "anc_acc": "4.497e-01", "epoch": 0.02825} {"step": 14130, "loss": 1.7915, "grad_norm": "3.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.707e+00", "dlm_acc": "5.236e-01", "anc_acc": "5.065e-01", "epoch": 0.02826} {"step": 14135, "loss": 1.3267, "grad_norm": "3.616e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.561e+00", "anc_loss": "1.652e+00", "dlm_acc": "4.718e-01", "anc_acc": "4.540e-01", "epoch": 0.02827} {"step": 14140, "loss": 1.491, "grad_norm": "3.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.487e-01", "anc_acc": "5.304e-01", "epoch": 0.02828} {"step": 14145, "loss": 1.3877, "grad_norm": "3.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.107e+00", "dlm_acc": "6.286e-01", "anc_acc": "6.126e-01", "epoch": 0.02829} {"step": 14150, "loss": 1.3737, "grad_norm": "4.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.266e+00", "dlm_acc": "6.041e-01", "anc_acc": "5.844e-01", "epoch": 0.0283} {"step": 14155, "loss": 1.0739, "grad_norm": "2.759e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.279e+00", "dlm_acc": "5.377e-01", "anc_acc": "5.186e-01", "epoch": 0.02831} {"step": 14160, "loss": 1.6537, "grad_norm": "1.098e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.692e+00", "anc_loss": "1.786e+00", "dlm_acc": "5.130e-01", "anc_acc": "4.971e-01", "epoch": 0.02832} {"step": 14165, "loss": 1.1466, "grad_norm": "2.846e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.153e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.681e-01", "anc_acc": "5.492e-01", "epoch": 0.02833} {"step": 14170, "loss": 1.6183, "grad_norm": "5.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.634e+00", "dlm_acc": "4.550e-01", "anc_acc": "4.411e-01", "epoch": 0.02834} {"step": 14175, "loss": 1.6638, "grad_norm": "8.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.677e+00", "anc_loss": "1.770e+00", "dlm_acc": "4.967e-01", "anc_acc": "4.788e-01", "epoch": 0.02835} {"step": 14180, "loss": 1.3144, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.402e-01", "epoch": 0.02836} {"step": 14185, "loss": 1.3994, "grad_norm": "6.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.362e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.317e-01", "anc_acc": "5.137e-01", "epoch": 0.02837} {"step": 14190, "loss": 1.4317, "grad_norm": "7.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.476e+00", "dlm_acc": "5.313e-01", "anc_acc": "5.141e-01", "epoch": 0.02838} {"step": 14195, "loss": 1.8421, "grad_norm": "7.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.232e+00", "dlm_acc": "4.693e-01", "anc_acc": "4.579e-01", "epoch": 0.02839} {"step": 14200, "loss": 1.4827, "grad_norm": "6.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.580e+00", "anc_loss": "1.655e+00", "dlm_acc": "4.447e-01", "anc_acc": "4.280e-01", "epoch": 0.0284} {"step": 14205, "loss": 1.3993, "grad_norm": "4.304e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.697e+00", "anc_loss": "1.762e+00", "dlm_acc": "3.781e-01", "anc_acc": "3.667e-01", "epoch": 0.02841} {"step": 14210, "loss": 1.6397, "grad_norm": "5.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.243e+00", "anc_loss": "1.310e+00", "dlm_acc": "5.976e-01", "anc_acc": "5.820e-01", "epoch": 0.02842} {"step": 14215, "loss": 1.7914, "grad_norm": "6.101e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.365e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.544e-01", "anc_acc": "5.322e-01", "epoch": 0.02843} {"step": 14220, "loss": 1.7794, "grad_norm": "4.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.445e+00", "anc_loss": "1.559e+00", "dlm_acc": "5.456e-01", "anc_acc": "5.246e-01", "epoch": 0.02844} {"step": 14225, "loss": 1.3003, "grad_norm": "5.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.232e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.485e-01", "anc_acc": "5.290e-01", "epoch": 0.02845} {"step": 14230, "loss": 1.4034, "grad_norm": "4.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.268e-01", "anc_acc": "5.059e-01", "epoch": 0.02846} {"step": 14235, "loss": 1.0938, "grad_norm": "3.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.488e-01", "anc_loss": "5.289e-01", "dlm_acc": "8.111e-01", "anc_acc": "7.861e-01", "epoch": 0.02847} {"step": 14240, "loss": 1.2246, "grad_norm": "3.765e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.194e+00", "anc_loss": "1.272e+00", "dlm_acc": "5.948e-01", "anc_acc": "5.788e-01", "epoch": 0.02848} {"step": 14245, "loss": 1.339, "grad_norm": "3.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.452e+00", "dlm_acc": "5.318e-01", "anc_acc": "5.096e-01", "epoch": 0.02849} {"step": 14250, "loss": 1.4499, "grad_norm": "3.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.658e+00", "anc_loss": "1.739e+00", "dlm_acc": "5.122e-01", "anc_acc": "4.941e-01", "epoch": 0.0285} {"step": 14255, "loss": 1.1178, "grad_norm": "3.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.263e+00", "dlm_acc": "5.683e-01", "anc_acc": "5.459e-01", "epoch": 0.02851} {"step": 14260, "loss": 1.3429, "grad_norm": "2.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.255e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.583e-01", "anc_acc": "5.393e-01", "epoch": 0.02852} {"step": 14265, "loss": 1.5174, "grad_norm": "3.563e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.374e-01", "anc_acc": "5.156e-01", "epoch": 0.02853} {"step": 14270, "loss": 1.4651, "grad_norm": "4.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.386e-01", "anc_acc": "5.177e-01", "epoch": 0.02854} {"step": 14275, "loss": 1.219, "grad_norm": "2.201e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.766e-01", "anc_loss": "1.046e+00", "dlm_acc": "6.542e-01", "anc_acc": "6.350e-01", "epoch": 0.02855} {"step": 14280, "loss": 1.622, "grad_norm": "3.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.551e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.328e-01", "anc_acc": "5.155e-01", "epoch": 0.02856} {"step": 14285, "loss": 1.1532, "grad_norm": "1.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.773e-01", "anc_loss": "1.053e+00", "dlm_acc": "6.009e-01", "anc_acc": "5.807e-01", "epoch": 0.02857} {"step": 14290, "loss": 1.5322, "grad_norm": "3.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.543e-01", "anc_acc": "5.308e-01", "epoch": 0.02858} {"step": 14295, "loss": 1.1616, "grad_norm": "2.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.163e+00", "anc_loss": "1.244e+00", "dlm_acc": "5.596e-01", "anc_acc": "5.417e-01", "epoch": 0.02859} {"step": 14300, "loss": 1.2061, "grad_norm": "6.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.218e+00", "dlm_acc": "6.139e-01", "anc_acc": "5.971e-01", "epoch": 0.0286} {"step": 14305, "loss": 1.2225, "grad_norm": "3.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.591e-01", "anc_acc": "5.382e-01", "epoch": 0.02861} {"step": 14310, "loss": 1.1923, "grad_norm": "3.094e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.077e+00", "dlm_acc": "5.990e-01", "anc_acc": "5.860e-01", "epoch": 0.02862} {"step": 14315, "loss": 1.3529, "grad_norm": "2.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.380e-01", "anc_acc": "5.166e-01", "epoch": 0.02863} {"step": 14320, "loss": 1.2682, "grad_norm": "2.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.137e+00", "dlm_acc": "5.277e-01", "anc_acc": "5.100e-01", "epoch": 0.02864} {"step": 14325, "loss": 1.1042, "grad_norm": "2.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.759e-01", "anc_acc": "5.569e-01", "epoch": 0.02865} {"step": 14330, "loss": 1.0526, "grad_norm": "2.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.398e-01", "anc_loss": "8.609e-01", "dlm_acc": "5.139e-01", "anc_acc": "5.054e-01", "epoch": 0.02866} {"step": 14335, "loss": 1.0675, "grad_norm": "3.170e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.922e-01", "anc_loss": "6.043e-01", "dlm_acc": "5.423e-01", "anc_acc": "5.369e-01", "epoch": 0.02867} {"step": 14340, "loss": 1.1117, "grad_norm": "4.911e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.547e-01", "anc_loss": "5.664e-01", "dlm_acc": "5.383e-01", "anc_acc": "5.319e-01", "epoch": 0.02868} {"step": 14345, "loss": 1.1619, "grad_norm": "4.227e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.180e-01", "anc_loss": "6.289e-01", "dlm_acc": "5.110e-01", "anc_acc": "5.067e-01", "epoch": 0.02869} {"step": 14350, "loss": 1.0715, "grad_norm": "2.210e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.641e-01", "anc_loss": "5.766e-01", "dlm_acc": "5.535e-01", "anc_acc": "5.462e-01", "epoch": 0.0287} {"step": 14355, "loss": 0.9286, "grad_norm": "3.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.152e-01", "anc_loss": "7.617e-01", "dlm_acc": "5.964e-01", "anc_acc": "5.773e-01", "epoch": 0.02871} {"step": 14360, "loss": 1.1089, "grad_norm": "5.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.332e+00", "anc_loss": "1.404e+00", "dlm_acc": "5.155e-01", "anc_acc": "4.970e-01", "epoch": 0.02872} {"step": 14365, "loss": 0.8957, "grad_norm": "3.791e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.617e-01", "anc_loss": "9.070e-01", "dlm_acc": "6.206e-01", "anc_acc": "6.122e-01", "epoch": 0.02873} {"step": 14370, "loss": 1.0841, "grad_norm": "3.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.031e+00", "anc_loss": "1.097e+00", "dlm_acc": "5.688e-01", "anc_acc": "5.507e-01", "epoch": 0.02874} {"step": 14375, "loss": 1.3958, "grad_norm": "2.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.277e+00", "dlm_acc": "4.728e-01", "anc_acc": "4.573e-01", "epoch": 0.02875} {"step": 14380, "loss": 0.8488, "grad_norm": "2.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.171e+00", "dlm_acc": "5.651e-01", "anc_acc": "5.450e-01", "epoch": 0.02876} {"step": 14385, "loss": 0.8273, "grad_norm": "2.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.239e+00", "dlm_acc": "5.556e-01", "anc_acc": "5.378e-01", "epoch": 0.02877} {"step": 14390, "loss": 0.8884, "grad_norm": "3.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.123e+00", "dlm_acc": "4.995e-01", "anc_acc": "4.808e-01", "epoch": 0.02878} {"step": 14395, "loss": 1.4457, "grad_norm": "2.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.674e+00", "anc_loss": "1.750e+00", "dlm_acc": "4.459e-01", "anc_acc": "4.296e-01", "epoch": 0.02879} {"step": 14400, "loss": 1.2392, "grad_norm": "7.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.130e+00", "dlm_acc": "6.452e-01", "anc_acc": "6.223e-01", "epoch": 0.0288} {"step": 14405, "loss": 1.2827, "grad_norm": "3.267e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.278e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.368e-01", "anc_acc": "5.098e-01", "epoch": 0.02881} {"step": 14410, "loss": 1.1672, "grad_norm": "7.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.421e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.633e-01", "anc_acc": "5.512e-01", "epoch": 0.02882} {"step": 14415, "loss": 0.888, "grad_norm": "5.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.263e+00", "dlm_acc": "5.908e-01", "anc_acc": "5.727e-01", "epoch": 0.02883} {"step": 14420, "loss": 1.2996, "grad_norm": "4.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.791e+00", "anc_loss": "1.841e+00", "dlm_acc": "3.220e-01", "anc_acc": "3.080e-01", "epoch": 0.02884} {"step": 14425, "loss": 1.3103, "grad_norm": "2.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.884e-01", "anc_loss": "1.046e+00", "dlm_acc": "6.500e-01", "anc_acc": "6.373e-01", "epoch": 0.02885} {"step": 14430, "loss": 1.4321, "grad_norm": "3.873e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.628e-01", "anc_acc": "5.471e-01", "epoch": 0.02886} {"step": 14435, "loss": 0.8261, "grad_norm": "3.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.852e-01", "anc_loss": "6.390e-01", "dlm_acc": "7.441e-01", "anc_acc": "7.233e-01", "epoch": 0.02887} {"step": 14440, "loss": 1.2561, "grad_norm": "3.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.220e+00", "dlm_acc": "5.987e-01", "anc_acc": "5.793e-01", "epoch": 0.02888} {"step": 14445, "loss": 0.9894, "grad_norm": "3.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.377e-01", "anc_loss": "8.104e-01", "dlm_acc": "7.179e-01", "anc_acc": "6.998e-01", "epoch": 0.02889} {"step": 14450, "loss": 0.912, "grad_norm": "1.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.137e-01", "anc_loss": "6.707e-01", "dlm_acc": "7.299e-01", "anc_acc": "7.125e-01", "epoch": 0.0289} {"step": 14455, "loss": 1.1385, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.311e+00", "dlm_acc": "5.587e-01", "anc_acc": "5.394e-01", "epoch": 0.02891} {"step": 14460, "loss": 1.1907, "grad_norm": "4.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.844e+00", "anc_loss": "1.895e+00", "dlm_acc": "3.835e-01", "anc_acc": "3.740e-01", "epoch": 0.02892} {"step": 14465, "loss": 1.3406, "grad_norm": "4.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.715e+00", "anc_loss": "1.775e+00", "dlm_acc": "3.748e-01", "anc_acc": "3.598e-01", "epoch": 0.02893} {"step": 14470, "loss": 1.1115, "grad_norm": "4.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.460e+00", "dlm_acc": "4.845e-01", "anc_acc": "4.701e-01", "epoch": 0.02894} {"step": 14475, "loss": 0.8885, "grad_norm": "2.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.930e-01", "anc_loss": "8.352e-01", "dlm_acc": "5.399e-01", "anc_acc": "5.289e-01", "epoch": 0.02895} {"step": 14480, "loss": 1.1571, "grad_norm": "1.056e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.227e-01", "anc_loss": "9.781e-01", "dlm_acc": "5.735e-01", "anc_acc": "5.581e-01", "epoch": 0.02896} {"step": 14485, "loss": 1.1056, "grad_norm": "4.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.598e-01", "anc_acc": "5.370e-01", "epoch": 0.02897} {"step": 14490, "loss": 1.2505, "grad_norm": "4.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.391e-01", "anc_loss": "1.009e+00", "dlm_acc": "5.823e-01", "anc_acc": "5.647e-01", "epoch": 0.02898} {"step": 14495, "loss": 1.187, "grad_norm": "1.702e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.241e+00", "dlm_acc": "6.021e-01", "anc_acc": "5.756e-01", "epoch": 0.02899} {"step": 14500, "loss": 1.5663, "grad_norm": "5.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.570e+00", "dlm_acc": "5.369e-01", "anc_acc": "5.204e-01", "epoch": 0.029} {"step": 14505, "loss": 1.3211, "grad_norm": "3.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.504e+00", "anc_loss": "1.574e+00", "dlm_acc": "4.505e-01", "anc_acc": "4.363e-01", "epoch": 0.02901} {"step": 14510, "loss": 1.4284, "grad_norm": "3.438e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.834e+00", "anc_loss": "1.913e+00", "dlm_acc": "4.003e-01", "anc_acc": "3.844e-01", "epoch": 0.02902} {"step": 14515, "loss": 1.241, "grad_norm": "3.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.393e+00", "dlm_acc": "5.486e-01", "anc_acc": "5.323e-01", "epoch": 0.02903} {"step": 14520, "loss": 1.6404, "grad_norm": "3.685e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.977e+00", "anc_loss": "2.016e+00", "dlm_acc": "3.090e-01", "anc_acc": "2.980e-01", "epoch": 0.02904} {"step": 14525, "loss": 2.0348, "grad_norm": "4.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.909e+00", "anc_loss": "2.934e+00", "dlm_acc": "4.311e-02", "anc_acc": "4.054e-02", "epoch": 0.02905} {"step": 14530, "loss": 1.8156, "grad_norm": "3.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.869e+00", "anc_loss": "2.891e+00", "dlm_acc": "5.247e-02", "anc_acc": "4.876e-02", "epoch": 0.02906} {"step": 14535, "loss": 1.8352, "grad_norm": "4.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.909e+00", "anc_loss": "2.931e+00", "dlm_acc": "5.000e-02", "anc_acc": "4.606e-02", "epoch": 0.02907} {"step": 14540, "loss": 1.439, "grad_norm": "4.159e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.955e+00", "anc_loss": "2.011e+00", "dlm_acc": "2.655e-01", "anc_acc": "2.576e-01", "epoch": 0.02908} {"step": 14545, "loss": 1.6779, "grad_norm": "3.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.842e+00", "anc_loss": "1.930e+00", "dlm_acc": "4.316e-01", "anc_acc": "4.148e-01", "epoch": 0.02909} {"step": 14550, "loss": 1.3053, "grad_norm": "1.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.311e+00", "dlm_acc": "6.211e-01", "anc_acc": "6.060e-01", "epoch": 0.0291} {"step": 14555, "loss": 1.3108, "grad_norm": "2.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.206e-01", "anc_loss": "9.716e-01", "dlm_acc": "6.108e-01", "anc_acc": "6.026e-01", "epoch": 0.02911} {"step": 14560, "loss": 1.2439, "grad_norm": "2.458e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.321e+00", "dlm_acc": "5.252e-01", "anc_acc": "5.044e-01", "epoch": 0.02912} {"step": 14565, "loss": 1.624, "grad_norm": "4.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.534e+00", "anc_loss": "1.594e+00", "dlm_acc": "3.532e-01", "anc_acc": "3.407e-01", "epoch": 0.02913} {"step": 14570, "loss": 1.4179, "grad_norm": "5.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.428e+00", "anc_loss": "1.500e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.238e-01", "epoch": 0.02914} {"step": 14575, "loss": 1.6533, "grad_norm": "3.156e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.552e+00", "anc_loss": "1.641e+00", "dlm_acc": "5.099e-01", "anc_acc": "4.936e-01", "epoch": 0.02915} {"step": 14580, "loss": 1.3565, "grad_norm": "1.813e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.370e+00", "anc_loss": "1.454e+00", "dlm_acc": "5.463e-01", "anc_acc": "5.298e-01", "epoch": 0.02916} {"step": 14585, "loss": 1.2545, "grad_norm": "2.590e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.169e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.822e-01", "anc_acc": "5.613e-01", "epoch": 0.02917} {"step": 14590, "loss": 1.2235, "grad_norm": "1.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.371e+00", "dlm_acc": "5.700e-01", "anc_acc": "5.513e-01", "epoch": 0.02918} {"step": 14595, "loss": 1.31, "grad_norm": "2.573e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.218e+00", "dlm_acc": "6.140e-01", "anc_acc": "5.959e-01", "epoch": 0.02919} {"step": 14600, "loss": 1.5687, "grad_norm": "2.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.412e+00", "dlm_acc": "5.799e-01", "anc_acc": "5.636e-01", "epoch": 0.0292} {"step": 14605, "loss": 1.5312, "grad_norm": "2.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.349e+00", "anc_loss": "1.424e+00", "dlm_acc": "6.258e-01", "anc_acc": "6.123e-01", "epoch": 0.02921} {"step": 14610, "loss": 1.5196, "grad_norm": "4.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.086e+00", "dlm_acc": "6.517e-01", "anc_acc": "6.393e-01", "epoch": 0.02922} {"step": 14615, "loss": 1.5599, "grad_norm": "6.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.148e-01", "anc_loss": "9.426e-01", "dlm_acc": "6.201e-01", "anc_acc": "6.136e-01", "epoch": 0.02923} {"step": 14620, "loss": 1.4276, "grad_norm": "3.405e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.176e+00", "anc_loss": "1.244e+00", "dlm_acc": "5.240e-01", "anc_acc": "5.095e-01", "epoch": 0.02924} {"step": 14625, "loss": 1.32, "grad_norm": "4.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.733e-01", "anc_acc": "5.578e-01", "epoch": 0.02925} {"step": 14630, "loss": 0.9565, "grad_norm": "2.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.414e-01", "anc_loss": "3.854e-01", "dlm_acc": "8.058e-01", "anc_acc": "7.902e-01", "epoch": 0.02926} {"step": 14635, "loss": 1.4462, "grad_norm": "2.596e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.754e-01", "anc_loss": "7.242e-01", "dlm_acc": "6.916e-01", "anc_acc": "6.751e-01", "epoch": 0.02927} {"step": 14640, "loss": 1.0637, "grad_norm": "2.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.171e-01", "anc_loss": "3.245e-01", "dlm_acc": "7.807e-01", "anc_acc": "7.764e-01", "epoch": 0.02928} {"step": 14645, "loss": 1.7693, "grad_norm": "2.572e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.869e-01", "anc_loss": "4.958e-01", "dlm_acc": "7.209e-01", "anc_acc": "7.166e-01", "epoch": 0.02929} {"step": 14650, "loss": 1.4655, "grad_norm": "3.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.469e-01", "anc_loss": "7.867e-01", "dlm_acc": "6.553e-01", "anc_acc": "6.446e-01", "epoch": 0.0293} {"step": 14655, "loss": 1.3903, "grad_norm": "3.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.988e-01", "anc_loss": "5.078e-01", "dlm_acc": "6.694e-01", "anc_acc": "6.654e-01", "epoch": 0.02931} {"step": 14660, "loss": 1.7831, "grad_norm": "4.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.344e-01", "anc_loss": "9.891e-01", "dlm_acc": "6.247e-01", "anc_acc": "6.152e-01", "epoch": 0.02932} {"step": 14665, "loss": 1.1985, "grad_norm": "2.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.805e-01", "anc_loss": "1.048e+00", "dlm_acc": "5.586e-01", "anc_acc": "5.417e-01", "epoch": 0.02933} {"step": 14670, "loss": 0.9452, "grad_norm": "3.306e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.969e-01", "anc_loss": "9.641e-01", "dlm_acc": "6.096e-01", "anc_acc": "5.939e-01", "epoch": 0.02934} {"step": 14675, "loss": 0.9726, "grad_norm": "3.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.137e-01", "anc_loss": "7.773e-01", "dlm_acc": "7.229e-01", "anc_acc": "7.032e-01", "epoch": 0.02935} {"step": 14680, "loss": 0.9957, "grad_norm": "2.905e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.250e+00", "dlm_acc": "6.038e-01", "anc_acc": "5.862e-01", "epoch": 0.02936} {"step": 14685, "loss": 1.2239, "grad_norm": "2.762e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.349e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.620e-01", "epoch": 0.02937} {"step": 14690, "loss": 1.2187, "grad_norm": "6.444e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.210e+00", "dlm_acc": "6.019e-01", "anc_acc": "5.829e-01", "epoch": 0.02938} {"step": 14695, "loss": 1.1624, "grad_norm": "3.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.172e-01", "anc_loss": "6.309e-01", "dlm_acc": "5.531e-01", "anc_acc": "5.496e-01", "epoch": 0.02939} {"step": 14700, "loss": 1.5065, "grad_norm": "3.381e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.305e-01", "anc_loss": "6.855e-01", "dlm_acc": "6.799e-01", "anc_acc": "6.562e-01", "epoch": 0.0294} {"step": 14705, "loss": 0.8298, "grad_norm": "2.926e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.418e-01", "anc_loss": "2.855e-01", "dlm_acc": "8.097e-01", "anc_acc": "7.789e-01", "epoch": 0.02941} {"step": 14710, "loss": 1.0412, "grad_norm": "2.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.929e-01", "anc_loss": "7.312e-01", "dlm_acc": "6.849e-01", "anc_acc": "6.694e-01", "epoch": 0.02942} {"step": 14715, "loss": 1.4293, "grad_norm": "3.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.163e+00", "dlm_acc": "6.135e-01", "anc_acc": "5.970e-01", "epoch": 0.02943} {"step": 14720, "loss": 1.0503, "grad_norm": "3.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.191e-01", "anc_loss": "8.691e-01", "dlm_acc": "6.873e-01", "anc_acc": "6.741e-01", "epoch": 0.02944} {"step": 14725, "loss": 1.4302, "grad_norm": "2.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.201e+00", "dlm_acc": "5.285e-01", "anc_acc": "5.135e-01", "epoch": 0.02945} {"step": 14730, "loss": 1.0331, "grad_norm": "2.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.023e-01", "anc_loss": "8.406e-01", "dlm_acc": "5.255e-01", "anc_acc": "5.120e-01", "epoch": 0.02946} {"step": 14735, "loss": 1.4476, "grad_norm": "2.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.367e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.680e-01", "anc_acc": "5.516e-01", "epoch": 0.02947} {"step": 14740, "loss": 0.9594, "grad_norm": "4.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.534e-01", "anc_loss": "6.950e-01", "dlm_acc": "6.918e-01", "anc_acc": "6.779e-01", "epoch": 0.02948} {"step": 14745, "loss": 1.2927, "grad_norm": "4.367e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.150e+00", "dlm_acc": "6.036e-01", "anc_acc": "5.862e-01", "epoch": 0.02949} {"step": 14750, "loss": 1.3568, "grad_norm": "4.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.298e+00", "dlm_acc": "6.051e-01", "anc_acc": "5.824e-01", "epoch": 0.0295} {"step": 14755, "loss": 1.644, "grad_norm": "4.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.308e+00", "dlm_acc": "5.856e-01", "anc_acc": "5.716e-01", "epoch": 0.02951} {"step": 14760, "loss": 1.473, "grad_norm": "2.969e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.089e+00", "dlm_acc": "5.556e-01", "anc_acc": "5.389e-01", "epoch": 0.02952} {"step": 14765, "loss": 1.0627, "grad_norm": "3.300e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.816e-01", "anc_loss": "7.211e-01", "dlm_acc": "5.699e-01", "anc_acc": "5.601e-01", "epoch": 0.02953} {"step": 14770, "loss": 1.1766, "grad_norm": "2.506e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.469e-01", "anc_loss": "8.025e-01", "dlm_acc": "7.129e-01", "anc_acc": "6.968e-01", "epoch": 0.02954} {"step": 14775, "loss": 1.6166, "grad_norm": "4.951e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.045e+00", "dlm_acc": "4.929e-01", "anc_acc": "4.804e-01", "epoch": 0.02955} {"step": 14780, "loss": 1.4125, "grad_norm": "6.491e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.172e-01", "anc_loss": "9.477e-01", "dlm_acc": "4.473e-01", "anc_acc": "4.343e-01", "epoch": 0.02956} {"step": 14785, "loss": 1.1322, "grad_norm": "4.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.398e+00", "anc_loss": "1.483e+00", "dlm_acc": "5.250e-01", "anc_acc": "5.071e-01", "epoch": 0.02957} {"step": 14790, "loss": 1.0571, "grad_norm": "6.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.116e+00", "dlm_acc": "6.198e-01", "anc_acc": "6.034e-01", "epoch": 0.02958} {"step": 14795, "loss": 0.9736, "grad_norm": "2.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.977e-01", "anc_loss": "8.551e-01", "dlm_acc": "6.714e-01", "anc_acc": "6.555e-01", "epoch": 0.02959} {"step": 14800, "loss": 1.4445, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.559e+00", "anc_loss": "1.672e+00", "dlm_acc": "4.821e-01", "anc_acc": "4.634e-01", "epoch": 0.0296} {"step": 14805, "loss": 1.7245, "grad_norm": "5.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.613e+00", "anc_loss": "1.709e+00", "dlm_acc": "5.087e-01", "anc_acc": "4.934e-01", "epoch": 0.02961} {"step": 14810, "loss": 1.7073, "grad_norm": "2.713e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.631e+00", "dlm_acc": "5.311e-01", "anc_acc": "5.105e-01", "epoch": 0.02962} {"step": 14815, "loss": 1.2219, "grad_norm": "3.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.255e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.473e-01", "anc_acc": "5.311e-01", "epoch": 0.02963} {"step": 14820, "loss": 1.3655, "grad_norm": "3.210e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.772e+00", "anc_loss": "1.844e+00", "dlm_acc": "3.894e-01", "anc_acc": "3.753e-01", "epoch": 0.02964} {"step": 14825, "loss": 1.3753, "grad_norm": "2.925e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.698e-01", "anc_acc": "5.502e-01", "epoch": 0.02965} {"step": 14830, "loss": 1.0734, "grad_norm": "2.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.961e-01", "epoch": 0.02966} {"step": 14835, "loss": 1.0676, "grad_norm": "3.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.127e-01", "anc_acc": "4.948e-01", "epoch": 0.02967} {"step": 14840, "loss": 1.165, "grad_norm": "3.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.229e+00", "dlm_acc": "5.820e-01", "anc_acc": "5.645e-01", "epoch": 0.02968} {"step": 14845, "loss": 1.5877, "grad_norm": "4.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.449e-01", "anc_acc": "5.254e-01", "epoch": 0.02969} {"step": 14850, "loss": 0.9823, "grad_norm": "3.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.217e+00", "dlm_acc": "5.511e-01", "anc_acc": "5.331e-01", "epoch": 0.0297} {"step": 14855, "loss": 2.0817, "grad_norm": "4.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.805e+00", "anc_loss": "1.886e+00", "dlm_acc": "4.477e-01", "anc_acc": "4.312e-01", "epoch": 0.02971} {"step": 14860, "loss": 1.7298, "grad_norm": "4.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.454e+00", "anc_loss": "1.536e+00", "dlm_acc": "5.614e-01", "anc_acc": "5.479e-01", "epoch": 0.02972} {"step": 14865, "loss": 1.6096, "grad_norm": "4.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.644e+00", "dlm_acc": "4.834e-01", "anc_acc": "4.656e-01", "epoch": 0.02973} {"step": 14870, "loss": 1.4943, "grad_norm": "3.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.238e+00", "dlm_acc": "6.528e-01", "anc_acc": "6.415e-01", "epoch": 0.02974} {"step": 14875, "loss": 1.5176, "grad_norm": "8.255e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.602e-01", "anc_loss": "7.930e-01", "dlm_acc": "5.795e-01", "anc_acc": "5.666e-01", "epoch": 0.02975} {"step": 14880, "loss": 1.4263, "grad_norm": "4.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.240e+00", "dlm_acc": "5.687e-01", "anc_acc": "5.505e-01", "epoch": 0.02976} {"step": 14885, "loss": 1.2919, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.957e-01", "anc_loss": "1.076e+00", "dlm_acc": "6.315e-01", "anc_acc": "6.136e-01", "epoch": 0.02977} {"step": 14890, "loss": 0.7539, "grad_norm": "2.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.941e-01", "anc_loss": "8.541e-01", "dlm_acc": "6.921e-01", "anc_acc": "6.776e-01", "epoch": 0.02978} {"step": 14895, "loss": 1.6148, "grad_norm": "4.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.489e+00", "anc_loss": "1.594e+00", "dlm_acc": "4.953e-01", "anc_acc": "4.766e-01", "epoch": 0.02979} {"step": 14900, "loss": 1.3575, "grad_norm": "2.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.531e-01", "anc_loss": "5.924e-01", "dlm_acc": "7.689e-01", "anc_acc": "7.536e-01", "epoch": 0.0298} {"step": 14905, "loss": 1.0637, "grad_norm": "2.320e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.105e+00", "dlm_acc": "6.189e-01", "anc_acc": "6.036e-01", "epoch": 0.02981} {"step": 14910, "loss": 0.958, "grad_norm": "2.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.790e-01", "anc_loss": "5.012e-01", "dlm_acc": "7.313e-01", "anc_acc": "7.219e-01", "epoch": 0.02982} {"step": 14915, "loss": 1.3538, "grad_norm": "5.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.065e+00", "dlm_acc": "6.471e-01", "anc_acc": "6.380e-01", "epoch": 0.02983} {"step": 14920, "loss": 1.1428, "grad_norm": "3.971e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.554e-01", "anc_loss": "2.832e-01", "dlm_acc": "8.659e-01", "anc_acc": "8.522e-01", "epoch": 0.02984} {"step": 14925, "loss": 1.1794, "grad_norm": "2.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.018e-01", "anc_loss": "9.601e-01", "dlm_acc": "6.954e-01", "anc_acc": "6.805e-01", "epoch": 0.02985} {"step": 14930, "loss": 1.5309, "grad_norm": "3.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.566e+00", "anc_loss": "1.641e+00", "dlm_acc": "4.270e-01", "anc_acc": "4.132e-01", "epoch": 0.02986} {"step": 14935, "loss": 1.1042, "grad_norm": "3.785e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.840e-01", "anc_loss": "8.344e-01", "dlm_acc": "7.016e-01", "anc_acc": "6.875e-01", "epoch": 0.02987} {"step": 14940, "loss": 1.2163, "grad_norm": "5.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.820e-01", "anc_loss": "1.028e+00", "dlm_acc": "5.460e-01", "anc_acc": "5.329e-01", "epoch": 0.02988} {"step": 14945, "loss": 1.3681, "grad_norm": "3.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.216e+00", "dlm_acc": "6.218e-01", "anc_acc": "6.049e-01", "epoch": 0.02989} {"step": 14950, "loss": 0.8017, "grad_norm": "3.186e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.817e-01", "anc_loss": "6.239e-01", "dlm_acc": "7.292e-01", "anc_acc": "7.179e-01", "epoch": 0.0299} {"step": 14955, "loss": 0.989, "grad_norm": "3.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.924e-01", "anc_loss": "8.535e-01", "dlm_acc": "7.029e-01", "anc_acc": "6.897e-01", "epoch": 0.02991} {"step": 14960, "loss": 1.3936, "grad_norm": "5.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.079e+00", "anc_loss": "1.133e+00", "dlm_acc": "6.041e-01", "anc_acc": "5.937e-01", "epoch": 0.02992} {"step": 14965, "loss": 1.1215, "grad_norm": "6.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.055e-01", "anc_loss": "6.464e-01", "dlm_acc": "7.776e-01", "anc_acc": "7.690e-01", "epoch": 0.02993} {"step": 14970, "loss": 0.9633, "grad_norm": "3.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.592e-01", "anc_loss": "8.154e-01", "dlm_acc": "6.793e-01", "anc_acc": "6.667e-01", "epoch": 0.02994} {"step": 14975, "loss": 1.4241, "grad_norm": "4.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.394e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.412e-01", "anc_acc": "5.269e-01", "epoch": 0.02995} {"step": 14980, "loss": 0.8597, "grad_norm": "4.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.793e-01", "anc_loss": "8.274e-01", "dlm_acc": "7.627e-01", "anc_acc": "7.553e-01", "epoch": 0.02996} {"step": 14985, "loss": 1.2176, "grad_norm": "4.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.988e-01", "anc_loss": "1.061e+00", "dlm_acc": "6.273e-01", "anc_acc": "6.114e-01", "epoch": 0.02997} {"step": 14990, "loss": 1.1561, "grad_norm": "6.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.054e+00", "anc_loss": "1.145e+00", "dlm_acc": "6.568e-01", "anc_acc": "6.351e-01", "epoch": 0.02998} {"step": 14995, "loss": 1.2357, "grad_norm": "2.716e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.063e+00", "anc_loss": "1.172e+00", "dlm_acc": "6.291e-01", "anc_acc": "6.050e-01", "epoch": 0.02999} {"step": 15000, "loss": 1.1512, "grad_norm": "5.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.339e-01", "anc_acc": "5.146e-01", "epoch": 0.03} {"step": 15005, "loss": 1.5226, "grad_norm": "3.481e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.661e+00", "anc_loss": "1.753e+00", "dlm_acc": "4.841e-01", "anc_acc": "4.677e-01", "epoch": 0.03001} {"step": 15010, "loss": 1.0575, "grad_norm": "2.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.242e-01", "anc_loss": "7.578e-01", "dlm_acc": "5.868e-01", "anc_acc": "5.780e-01", "epoch": 0.03002} {"step": 15015, "loss": 1.221, "grad_norm": "2.956e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.067e-01", "anc_loss": "5.414e-01", "dlm_acc": "7.755e-01", "anc_acc": "7.661e-01", "epoch": 0.03003} {"step": 15020, "loss": 0.9168, "grad_norm": "3.276e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.541e-01", "anc_loss": "3.853e-01", "dlm_acc": "8.225e-01", "anc_acc": "8.129e-01", "epoch": 0.03004} {"step": 15025, "loss": 1.3146, "grad_norm": "4.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.996e-01", "anc_loss": "9.557e-01", "dlm_acc": "6.565e-01", "anc_acc": "6.409e-01", "epoch": 0.03005} {"step": 15030, "loss": 1.3943, "grad_norm": "3.381e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.052e-01", "anc_loss": "4.234e-01", "dlm_acc": "7.967e-01", "anc_acc": "7.899e-01", "epoch": 0.03006} {"step": 15035, "loss": 1.3408, "grad_norm": "8.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.056e+00", "anc_loss": "1.119e+00", "dlm_acc": "6.434e-01", "anc_acc": "6.268e-01", "epoch": 0.03007} {"step": 15040, "loss": 0.8057, "grad_norm": "3.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.582e-01", "anc_loss": "1.706e-01", "dlm_acc": "8.843e-01", "anc_acc": "8.786e-01", "epoch": 0.03008} {"step": 15045, "loss": 1.0438, "grad_norm": "5.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.565e-01", "anc_loss": "3.812e-01", "dlm_acc": "8.135e-01", "anc_acc": "8.034e-01", "epoch": 0.03009} {"step": 15050, "loss": 0.9891, "grad_norm": "1.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.414e-01", "anc_loss": "5.797e-01", "dlm_acc": "7.670e-01", "anc_acc": "7.535e-01", "epoch": 0.0301} {"step": 15055, "loss": 1.383, "grad_norm": "3.315e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.143e-01", "anc_loss": "5.596e-01", "dlm_acc": "7.968e-01", "anc_acc": "7.817e-01", "epoch": 0.03011} {"step": 15060, "loss": 1.2006, "grad_norm": "3.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.221e+00", "dlm_acc": "5.796e-01", "anc_acc": "5.624e-01", "epoch": 0.03012} {"step": 15065, "loss": 1.0087, "grad_norm": "1.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.762e-01", "anc_loss": "9.473e-01", "dlm_acc": "6.389e-01", "anc_acc": "6.215e-01", "epoch": 0.03013} {"step": 15070, "loss": 1.2865, "grad_norm": "6.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.766e-01", "anc_loss": "1.039e+00", "dlm_acc": "5.535e-01", "anc_acc": "5.336e-01", "epoch": 0.03014} {"step": 15075, "loss": 1.6362, "grad_norm": "1.259e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.540e-01", "anc_acc": "5.168e-01", "epoch": 0.03015} {"step": 15080, "loss": 1.7758, "grad_norm": "5.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.637e+00", "anc_loss": "1.714e+00", "dlm_acc": "4.117e-01", "anc_acc": "3.968e-01", "epoch": 0.03016} {"step": 15085, "loss": 1.5411, "grad_norm": "1.533e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.216e+00", "dlm_acc": "6.354e-01", "anc_acc": "6.142e-01", "epoch": 0.03017} {"step": 15090, "loss": 1.417, "grad_norm": "1.144e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.721e-01", "epoch": 0.03018} {"step": 15095, "loss": 1.1693, "grad_norm": "1.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.079e+00", "anc_loss": "1.179e+00", "dlm_acc": "5.711e-01", "anc_acc": "5.423e-01", "epoch": 0.03019} {"step": 15100, "loss": 1.3895, "grad_norm": "3.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.072e+00", "anc_loss": "1.200e+00", "dlm_acc": "6.345e-01", "anc_acc": "5.948e-01", "epoch": 0.0302} {"step": 15105, "loss": 1.4365, "grad_norm": "4.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.578e-01", "anc_loss": "1.037e+00", "dlm_acc": "6.465e-01", "anc_acc": "6.285e-01", "epoch": 0.03021} {"step": 15110, "loss": 1.3159, "grad_norm": "2.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.070e-01", "anc_loss": "9.938e-01", "dlm_acc": "6.425e-01", "anc_acc": "6.225e-01", "epoch": 0.03022} {"step": 15115, "loss": 1.3723, "grad_norm": "2.581e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.237e+00", "dlm_acc": "5.941e-01", "anc_acc": "5.702e-01", "epoch": 0.03023} {"step": 15120, "loss": 1.385, "grad_norm": "3.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.891e-01", "anc_loss": "1.060e+00", "dlm_acc": "5.980e-01", "anc_acc": "5.803e-01", "epoch": 0.03024} {"step": 15125, "loss": 1.1059, "grad_norm": "5.279e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.891e-01", "anc_loss": "1.043e+00", "dlm_acc": "5.757e-01", "anc_acc": "5.590e-01", "epoch": 0.03025} {"step": 15130, "loss": 1.231, "grad_norm": "2.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.445e-01", "anc_acc": "5.233e-01", "epoch": 0.03026} {"step": 15135, "loss": 1.8152, "grad_norm": "2.545e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.839e+00", "anc_loss": "1.877e+00", "dlm_acc": "3.669e-01", "anc_acc": "3.567e-01", "epoch": 0.03027} {"step": 15140, "loss": 1.3284, "grad_norm": "3.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.392e+00", "dlm_acc": "4.592e-01", "anc_acc": "4.412e-01", "epoch": 0.03028} {"step": 15145, "loss": 0.9611, "grad_norm": "3.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.656e-01", "anc_loss": "9.367e-01", "dlm_acc": "5.576e-01", "anc_acc": "5.317e-01", "epoch": 0.03029} {"step": 15150, "loss": 1.6919, "grad_norm": "3.332e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.784e+00", "dlm_acc": "4.513e-01", "anc_acc": "4.335e-01", "epoch": 0.0303} {"step": 15155, "loss": 1.5222, "grad_norm": "4.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.558e+00", "dlm_acc": "4.718e-01", "anc_acc": "4.503e-01", "epoch": 0.03031} {"step": 15160, "loss": 1.2172, "grad_norm": "2.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.688e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.663e-01", "anc_acc": "6.527e-01", "epoch": 0.03032} {"step": 15165, "loss": 1.5452, "grad_norm": "3.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.510e-01", "anc_loss": "8.324e-01", "dlm_acc": "7.254e-01", "anc_acc": "7.032e-01", "epoch": 0.03033} {"step": 15170, "loss": 1.2702, "grad_norm": "2.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.183e+00", "dlm_acc": "5.845e-01", "anc_acc": "5.638e-01", "epoch": 0.03034} {"step": 15175, "loss": 1.615, "grad_norm": "1.418e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.597e+00", "dlm_acc": "5.227e-01", "anc_acc": "5.058e-01", "epoch": 0.03035} {"step": 15180, "loss": 1.2031, "grad_norm": "9.511e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.208e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.551e-01", "anc_acc": "5.331e-01", "epoch": 0.03036} {"step": 15185, "loss": 1.262, "grad_norm": "3.316e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.117e-01", "anc_loss": "7.848e-01", "dlm_acc": "7.101e-01", "anc_acc": "6.864e-01", "epoch": 0.03037} {"step": 15190, "loss": 1.4769, "grad_norm": "3.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.893e-01", "anc_acc": "5.688e-01", "epoch": 0.03038} {"step": 15195, "loss": 1.5771, "grad_norm": "2.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.781e+00", "anc_loss": "1.845e+00", "dlm_acc": "3.309e-01", "anc_acc": "3.143e-01", "epoch": 0.03039} {"step": 15200, "loss": 0.9883, "grad_norm": "2.109e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.439e-01", "anc_loss": "4.795e-01", "dlm_acc": "8.194e-01", "anc_acc": "8.074e-01", "epoch": 0.0304} {"step": 15205, "loss": 1.13, "grad_norm": "2.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.592e-01", "anc_loss": "9.199e-01", "dlm_acc": "6.764e-01", "anc_acc": "6.621e-01", "epoch": 0.03041} {"step": 15210, "loss": 1.2792, "grad_norm": "8.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.578e-01", "anc_loss": "1.017e+00", "dlm_acc": "6.172e-01", "anc_acc": "6.022e-01", "epoch": 0.03042} {"step": 15215, "loss": 1.3815, "grad_norm": "1.707e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.490e-01", "anc_acc": "5.239e-01", "epoch": 0.03043} {"step": 15220, "loss": 1.235, "grad_norm": "3.186e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.766e-01", "anc_loss": "7.273e-01", "dlm_acc": "7.201e-01", "anc_acc": "7.037e-01", "epoch": 0.03044} {"step": 15225, "loss": 1.3135, "grad_norm": "3.332e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.132e+00", "dlm_acc": "5.852e-01", "anc_acc": "5.672e-01", "epoch": 0.03045} {"step": 15230, "loss": 1.279, "grad_norm": "4.752e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.494e-01", "anc_acc": "5.207e-01", "epoch": 0.03046} {"step": 15235, "loss": 1.0173, "grad_norm": "4.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.000e+00", "anc_loss": "1.064e+00", "dlm_acc": "5.715e-01", "anc_acc": "5.586e-01", "epoch": 0.03047} {"step": 15240, "loss": 1.0594, "grad_norm": "7.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.414e-01", "anc_loss": "1.000e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.693e-01", "epoch": 0.03048} {"step": 15245, "loss": 1.2928, "grad_norm": "4.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.106e-01", "anc_acc": "4.957e-01", "epoch": 0.03049} {"step": 15250, "loss": 1.0995, "grad_norm": "5.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.513e+00", "dlm_acc": "5.046e-01", "anc_acc": "4.739e-01", "epoch": 0.0305} {"step": 15255, "loss": 1.5702, "grad_norm": "4.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.837e+00", "anc_loss": "1.903e+00", "dlm_acc": "3.979e-01", "anc_acc": "3.854e-01", "epoch": 0.03051} {"step": 15260, "loss": 1.2986, "grad_norm": "4.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.308e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.166e-01", "anc_acc": "5.012e-01", "epoch": 0.03052} {"step": 15265, "loss": 0.7815, "grad_norm": "6.598e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.911e-01", "anc_loss": "6.365e-01", "dlm_acc": "7.570e-01", "anc_acc": "7.459e-01", "epoch": 0.03053} {"step": 15270, "loss": 0.9791, "grad_norm": "2.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.322e-01", "anc_loss": "6.541e-01", "dlm_acc": "6.658e-01", "anc_acc": "6.601e-01", "epoch": 0.03054} {"step": 15275, "loss": 0.6708, "grad_norm": "2.815e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.656e-01", "anc_loss": "4.770e-01", "dlm_acc": "6.611e-01", "anc_acc": "6.584e-01", "epoch": 0.03055} {"step": 15280, "loss": 0.7821, "grad_norm": "4.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.014e-01", "anc_loss": "4.105e-01", "dlm_acc": "6.963e-01", "anc_acc": "6.913e-01", "epoch": 0.03056} {"step": 15285, "loss": 0.8622, "grad_norm": "4.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.457e-01", "anc_loss": "6.621e-01", "dlm_acc": "5.908e-01", "anc_acc": "5.848e-01", "epoch": 0.03057} {"step": 15290, "loss": 0.8779, "grad_norm": "3.321e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.434e-01", "anc_loss": "5.527e-01", "dlm_acc": "6.137e-01", "anc_acc": "6.106e-01", "epoch": 0.03058} {"step": 15295, "loss": 0.7527, "grad_norm": "5.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.648e-01", "anc_loss": "5.773e-01", "dlm_acc": "5.865e-01", "anc_acc": "5.780e-01", "epoch": 0.03059} {"step": 15300, "loss": 0.6759, "grad_norm": "1.580e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.777e-01", "anc_loss": "8.141e-01", "dlm_acc": "5.931e-01", "anc_acc": "5.820e-01", "epoch": 0.0306} {"step": 15305, "loss": 1.0497, "grad_norm": "5.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.202e+00", "dlm_acc": "6.231e-01", "anc_acc": "6.060e-01", "epoch": 0.03061} {"step": 15310, "loss": 0.8368, "grad_norm": "8.980e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.664e-01", "anc_acc": "5.499e-01", "epoch": 0.03062} {"step": 15315, "loss": 0.6584, "grad_norm": "2.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.607e-01", "anc_loss": "8.014e-01", "dlm_acc": "6.380e-01", "anc_acc": "6.256e-01", "epoch": 0.03063} {"step": 15320, "loss": 0.9335, "grad_norm": "6.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.816e-01", "anc_loss": "9.361e-01", "dlm_acc": "6.891e-01", "anc_acc": "6.760e-01", "epoch": 0.03064} {"step": 15325, "loss": 1.0469, "grad_norm": "2.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.262e+00", "anc_loss": "1.356e+00", "dlm_acc": "5.391e-01", "anc_acc": "5.193e-01", "epoch": 0.03065} {"step": 15330, "loss": 0.8279, "grad_norm": "2.339e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.315e-01", "anc_loss": "8.843e-01", "dlm_acc": "7.041e-01", "anc_acc": "6.888e-01", "epoch": 0.03066} {"step": 15335, "loss": 0.9103, "grad_norm": "3.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.492e-01", "anc_loss": "8.035e-01", "dlm_acc": "7.206e-01", "anc_acc": "7.050e-01", "epoch": 0.03067} {"step": 15340, "loss": 0.9415, "grad_norm": "4.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.887e-01", "anc_loss": "1.034e+00", "dlm_acc": "6.327e-01", "anc_acc": "6.237e-01", "epoch": 0.03068} {"step": 15345, "loss": 1.3315, "grad_norm": "3.716e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.828e-01", "anc_acc": "5.699e-01", "epoch": 0.03069} {"step": 15350, "loss": 1.1056, "grad_norm": "2.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.068e+00", "anc_loss": "1.113e+00", "dlm_acc": "6.064e-01", "anc_acc": "5.972e-01", "epoch": 0.0307} {"step": 15355, "loss": 0.9085, "grad_norm": "3.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.066e+00", "dlm_acc": "6.262e-01", "anc_acc": "6.129e-01", "epoch": 0.03071} {"step": 15360, "loss": 1.2593, "grad_norm": "4.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.391e-01", "anc_loss": "8.773e-01", "dlm_acc": "6.486e-01", "anc_acc": "6.401e-01", "epoch": 0.03072} {"step": 15365, "loss": 1.0428, "grad_norm": "2.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.827e-01", "anc_loss": "9.384e-01", "dlm_acc": "6.809e-01", "anc_acc": "6.637e-01", "epoch": 0.03073} {"step": 15370, "loss": 1.0846, "grad_norm": "4.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.189e+00", "dlm_acc": "6.065e-01", "anc_acc": "5.934e-01", "epoch": 0.03074} {"step": 15375, "loss": 1.2861, "grad_norm": "3.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.397e+00", "anc_loss": "1.492e+00", "dlm_acc": "5.606e-01", "anc_acc": "5.444e-01", "epoch": 0.03075} {"step": 15380, "loss": 0.8543, "grad_norm": "3.089e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.883e-01", "anc_loss": "7.211e-01", "dlm_acc": "6.921e-01", "anc_acc": "6.841e-01", "epoch": 0.03076} {"step": 15385, "loss": 0.6953, "grad_norm": "2.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.592e-01", "anc_loss": "1.650e-01", "dlm_acc": "8.842e-01", "anc_acc": "8.811e-01", "epoch": 0.03077} {"step": 15390, "loss": 0.7973, "grad_norm": "3.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.240e-01", "anc_loss": "2.340e-01", "dlm_acc": "8.564e-01", "anc_acc": "8.542e-01", "epoch": 0.03078} {"step": 15395, "loss": 1.0073, "grad_norm": "3.313e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.378e-01", "anc_loss": "7.759e-01", "dlm_acc": "7.455e-01", "anc_acc": "7.341e-01", "epoch": 0.03079} {"step": 15400, "loss": 0.8158, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.652e-01", "anc_loss": "7.977e-01", "dlm_acc": "6.469e-01", "anc_acc": "6.388e-01", "epoch": 0.0308} {"step": 15405, "loss": 0.8559, "grad_norm": "6.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.595e-01", "anc_loss": "5.963e-01", "dlm_acc": "7.687e-01", "anc_acc": "7.549e-01", "epoch": 0.03081} {"step": 15410, "loss": 0.6423, "grad_norm": "1.345e+00", "learning_rate": "1.000e-04", "dlm_loss": "5.094e-01", "anc_loss": "5.633e-01", "dlm_acc": "8.075e-01", "anc_acc": "7.926e-01", "epoch": 0.03082} {"step": 15415, "loss": 1.0249, "grad_norm": "3.256e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.147e+00", "dlm_acc": "5.888e-01", "anc_acc": "5.748e-01", "epoch": 0.03083} {"step": 15420, "loss": 0.9279, "grad_norm": "2.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.077e+00", "dlm_acc": "6.189e-01", "anc_acc": "6.027e-01", "epoch": 0.03084} {"step": 15425, "loss": 0.9693, "grad_norm": "2.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.087e+00", "dlm_acc": "5.628e-01", "anc_acc": "5.464e-01", "epoch": 0.03085} {"step": 15430, "loss": 0.9601, "grad_norm": "3.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.326e+00", "anc_loss": "1.366e+00", "dlm_acc": "3.608e-01", "anc_acc": "3.469e-01", "epoch": 0.03086} {"step": 15435, "loss": 0.9173, "grad_norm": "4.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.582e-01", "anc_loss": "1.026e+00", "dlm_acc": "6.639e-01", "anc_acc": "6.472e-01", "epoch": 0.03087} {"step": 15440, "loss": 0.6948, "grad_norm": "3.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.992e-01", "anc_loss": "8.359e-01", "dlm_acc": "6.783e-01", "anc_acc": "6.696e-01", "epoch": 0.03088} {"step": 15445, "loss": 0.7666, "grad_norm": "5.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.770e-01", "anc_loss": "5.023e-01", "dlm_acc": "6.988e-01", "anc_acc": "6.896e-01", "epoch": 0.03089} {"step": 15450, "loss": 0.9267, "grad_norm": "5.041e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.165e+00", "dlm_acc": "6.367e-01", "anc_acc": "6.216e-01", "epoch": 0.0309} {"step": 15455, "loss": 0.9734, "grad_norm": "3.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.775e-01", "anc_loss": "9.297e-01", "dlm_acc": "6.738e-01", "anc_acc": "6.620e-01", "epoch": 0.03091} {"step": 15460, "loss": 1.0562, "grad_norm": "2.878e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.161e+00", "dlm_acc": "5.793e-01", "anc_acc": "5.627e-01", "epoch": 0.03092} {"step": 15465, "loss": 1.3837, "grad_norm": "4.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.644e+00", "dlm_acc": "5.118e-01", "anc_acc": "4.917e-01", "epoch": 0.03093} {"step": 15470, "loss": 1.4838, "grad_norm": "3.400e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.625e-01", "anc_acc": "5.408e-01", "epoch": 0.03094} {"step": 15475, "loss": 1.4434, "grad_norm": "5.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.636e+00", "dlm_acc": "4.868e-01", "anc_acc": "4.669e-01", "epoch": 0.03095} {"step": 15480, "loss": 1.3762, "grad_norm": "3.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.294e-01", "anc_acc": "5.118e-01", "epoch": 0.03096} {"step": 15485, "loss": 0.9805, "grad_norm": "3.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.103e+00", "anc_loss": "1.178e+00", "dlm_acc": "5.246e-01", "anc_acc": "5.039e-01", "epoch": 0.03097} {"step": 15490, "loss": 1.0552, "grad_norm": "1.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.977e-01", "anc_loss": "1.066e+00", "dlm_acc": "5.821e-01", "anc_acc": "5.632e-01", "epoch": 0.03098} {"step": 15495, "loss": 1.193, "grad_norm": "3.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.747e+00", "anc_loss": "1.839e+00", "dlm_acc": "4.647e-01", "anc_acc": "4.469e-01", "epoch": 0.03099} {"step": 15500, "loss": 1.2503, "grad_norm": "3.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.560e+00", "anc_loss": "1.668e+00", "dlm_acc": "5.364e-01", "anc_acc": "5.147e-01", "epoch": 0.031} {"step": 15505, "loss": 1.1282, "grad_norm": "4.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.500e-01", "anc_acc": "5.332e-01", "epoch": 0.03101} {"step": 15510, "loss": 0.8565, "grad_norm": "1.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.229e+00", "dlm_acc": "6.312e-01", "anc_acc": "6.134e-01", "epoch": 0.03102} {"step": 15515, "loss": 1.1007, "grad_norm": "3.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.448e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.312e-01", "anc_acc": "5.148e-01", "epoch": 0.03103} {"step": 15520, "loss": 0.8246, "grad_norm": "1.204e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.263e-01", "epoch": 0.03104} {"step": 15525, "loss": 1.2108, "grad_norm": "2.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.599e+00", "dlm_acc": "5.149e-01", "anc_acc": "4.980e-01", "epoch": 0.03105} {"step": 15530, "loss": 1.6091, "grad_norm": "3.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.538e+00", "dlm_acc": "4.010e-01", "anc_acc": "3.932e-01", "epoch": 0.03106} {"step": 15535, "loss": 1.2075, "grad_norm": "3.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.399e+00", "dlm_acc": "5.014e-01", "anc_acc": "4.814e-01", "epoch": 0.03107} {"step": 15540, "loss": 1.445, "grad_norm": "1.198e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.650e+00", "dlm_acc": "5.233e-01", "anc_acc": "5.033e-01", "epoch": 0.03108} {"step": 15545, "loss": 1.1813, "grad_norm": "3.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.348e+00", "dlm_acc": "4.698e-01", "anc_acc": "4.532e-01", "epoch": 0.03109} {"step": 15550, "loss": 1.2796, "grad_norm": "3.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.211e+00", "anc_loss": "1.289e+00", "dlm_acc": "5.615e-01", "anc_acc": "5.455e-01", "epoch": 0.0311} {"step": 15555, "loss": 1.2078, "grad_norm": "2.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.456e+00", "anc_loss": "1.534e+00", "dlm_acc": "5.435e-01", "anc_acc": "5.283e-01", "epoch": 0.03111} {"step": 15560, "loss": 1.0435, "grad_norm": "2.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.258e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.377e-01", "anc_acc": "5.173e-01", "epoch": 0.03112} {"step": 15565, "loss": 1.2709, "grad_norm": "3.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.435e-01", "anc_acc": "5.254e-01", "epoch": 0.03113} {"step": 15570, "loss": 1.1907, "grad_norm": "2.452e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.403e+00", "dlm_acc": "5.034e-01", "anc_acc": "4.847e-01", "epoch": 0.03114} {"step": 15575, "loss": 1.5045, "grad_norm": "2.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.197e+00", "dlm_acc": "5.413e-01", "anc_acc": "5.232e-01", "epoch": 0.03115} {"step": 15580, "loss": 1.5338, "grad_norm": "6.366e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.451e+00", "anc_loss": "1.535e+00", "dlm_acc": "5.356e-01", "anc_acc": "5.170e-01", "epoch": 0.03116} {"step": 15585, "loss": 1.2665, "grad_norm": "4.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.737e-01", "anc_acc": "5.515e-01", "epoch": 0.03117} {"step": 15590, "loss": 1.0016, "grad_norm": "2.473e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.695e-01", "anc_acc": "5.488e-01", "epoch": 0.03118} {"step": 15595, "loss": 1.6017, "grad_norm": "3.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.627e+00", "anc_loss": "1.705e+00", "dlm_acc": "4.647e-01", "anc_acc": "4.496e-01", "epoch": 0.03119} {"step": 15600, "loss": 1.1383, "grad_norm": "3.211e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.232e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.543e-01", "anc_acc": "5.337e-01", "epoch": 0.0312} {"step": 15605, "loss": 1.3994, "grad_norm": "7.792e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.222e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.978e-01", "anc_acc": "5.785e-01", "epoch": 0.03121} {"step": 15610, "loss": 1.5084, "grad_norm": "4.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e+00", "anc_loss": "1.581e+00", "dlm_acc": "5.223e-01", "anc_acc": "5.027e-01", "epoch": 0.03122} {"step": 15615, "loss": 1.6709, "grad_norm": "3.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.766e+00", "anc_loss": "1.855e+00", "dlm_acc": "4.904e-01", "anc_acc": "4.736e-01", "epoch": 0.03123} {"step": 15620, "loss": 1.5986, "grad_norm": "2.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.655e+00", "anc_loss": "1.756e+00", "dlm_acc": "4.992e-01", "anc_acc": "4.787e-01", "epoch": 0.03124} {"step": 15625, "loss": 0.8132, "grad_norm": "7.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.546e-01", "anc_loss": "3.995e-01", "dlm_acc": "8.373e-01", "anc_acc": "8.239e-01", "epoch": 0.03125} {"step": 15630, "loss": 0.9931, "grad_norm": "3.227e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.932e-01", "anc_loss": "3.398e-01", "dlm_acc": "8.640e-01", "anc_acc": "8.486e-01", "epoch": 0.03126} {"step": 15635, "loss": 0.8441, "grad_norm": "4.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e-01", "anc_loss": "1.922e-01", "dlm_acc": "9.128e-01", "anc_acc": "8.885e-01", "epoch": 0.03127} {"step": 15640, "loss": 1.1004, "grad_norm": "6.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.589e-01", "anc_loss": "5.128e-01", "dlm_acc": "8.413e-01", "anc_acc": "8.194e-01", "epoch": 0.03128} {"step": 15645, "loss": 1.6501, "grad_norm": "3.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.548e+00", "anc_loss": "1.625e+00", "dlm_acc": "5.169e-01", "anc_acc": "5.007e-01", "epoch": 0.03129} {"step": 15650, "loss": 1.2275, "grad_norm": "2.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.531e-01", "anc_acc": "5.314e-01", "epoch": 0.0313} {"step": 15655, "loss": 1.3551, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.213e+00", "dlm_acc": "6.339e-01", "anc_acc": "6.130e-01", "epoch": 0.03131} {"step": 15660, "loss": 1.4489, "grad_norm": "3.943e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.303e-01", "anc_acc": "5.113e-01", "epoch": 0.03132} {"step": 15665, "loss": 1.2117, "grad_norm": "3.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.652e-01", "anc_acc": "5.449e-01", "epoch": 0.03133} {"step": 15670, "loss": 0.9296, "grad_norm": "3.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.299e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.393e-01", "anc_acc": "5.221e-01", "epoch": 0.03134} {"step": 15675, "loss": 1.4064, "grad_norm": "3.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.761e+00", "anc_loss": "1.863e+00", "dlm_acc": "4.861e-01", "anc_acc": "4.679e-01", "epoch": 0.03135} {"step": 15680, "loss": 1.022, "grad_norm": "2.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.195e+00", "dlm_acc": "6.062e-01", "anc_acc": "5.860e-01", "epoch": 0.03136} {"step": 15685, "loss": 1.3179, "grad_norm": "3.193e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.580e-01", "anc_acc": "5.386e-01", "epoch": 0.03137} {"step": 15690, "loss": 1.4674, "grad_norm": "3.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.388e+00", "dlm_acc": "5.930e-01", "anc_acc": "5.764e-01", "epoch": 0.03138} {"step": 15695, "loss": 1.295, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.669e+00", "anc_loss": "1.769e+00", "dlm_acc": "5.060e-01", "anc_acc": "4.851e-01", "epoch": 0.03139} {"step": 15700, "loss": 1.5898, "grad_norm": "5.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.716e+00", "anc_loss": "1.817e+00", "dlm_acc": "4.614e-01", "anc_acc": "4.449e-01", "epoch": 0.0314} {"step": 15705, "loss": 1.178, "grad_norm": "5.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.177e+00", "dlm_acc": "5.976e-01", "anc_acc": "5.776e-01", "epoch": 0.03141} {"step": 15710, "loss": 1.1416, "grad_norm": "6.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.315e+00", "dlm_acc": "5.875e-01", "anc_acc": "5.691e-01", "epoch": 0.03142} {"step": 15715, "loss": 1.1777, "grad_norm": "4.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.541e+00", "anc_loss": "1.627e+00", "dlm_acc": "4.626e-01", "anc_acc": "4.468e-01", "epoch": 0.03143} {"step": 15720, "loss": 0.9143, "grad_norm": "2.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.359e-01", "anc_loss": "1.004e+00", "dlm_acc": "6.607e-01", "anc_acc": "6.447e-01", "epoch": 0.03144} {"step": 15725, "loss": 1.1596, "grad_norm": "3.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.346e+00", "dlm_acc": "5.538e-01", "anc_acc": "5.339e-01", "epoch": 0.03145} {"step": 15730, "loss": 1.412, "grad_norm": "3.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.622e+00", "dlm_acc": "4.685e-01", "anc_acc": "4.511e-01", "epoch": 0.03146} {"step": 15735, "loss": 1.3418, "grad_norm": "6.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.344e-01", "anc_acc": "5.149e-01", "epoch": 0.03147} {"step": 15740, "loss": 1.2713, "grad_norm": "4.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.178e-01", "anc_acc": "4.978e-01", "epoch": 0.03148} {"step": 15745, "loss": 1.5646, "grad_norm": "2.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.095e+00", "dlm_acc": "6.580e-01", "anc_acc": "6.479e-01", "epoch": 0.03149} {"step": 15750, "loss": 1.3344, "grad_norm": "4.227e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.954e-01", "anc_loss": "9.547e-01", "dlm_acc": "6.964e-01", "anc_acc": "6.837e-01", "epoch": 0.0315} {"step": 15755, "loss": 1.2474, "grad_norm": "2.858e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.076e+00", "dlm_acc": "6.211e-01", "anc_acc": "6.036e-01", "epoch": 0.03151} {"step": 15760, "loss": 1.3425, "grad_norm": "4.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.675e+00", "dlm_acc": "4.891e-01", "anc_acc": "4.708e-01", "epoch": 0.03152} {"step": 15765, "loss": 1.4504, "grad_norm": "3.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.711e+00", "anc_loss": "1.811e+00", "dlm_acc": "4.835e-01", "anc_acc": "4.649e-01", "epoch": 0.03153} {"step": 15770, "loss": 1.3249, "grad_norm": "3.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.494e+00", "dlm_acc": "5.188e-01", "anc_acc": "4.995e-01", "epoch": 0.03154} {"step": 15775, "loss": 1.3135, "grad_norm": "2.228e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.400e+00", "dlm_acc": "4.561e-01", "anc_acc": "4.336e-01", "epoch": 0.03155} {"step": 15780, "loss": 1.2131, "grad_norm": "2.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.190e+00", "dlm_acc": "6.165e-01", "anc_acc": "5.883e-01", "epoch": 0.03156} {"step": 15785, "loss": 1.2711, "grad_norm": "4.239e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.244e-01", "anc_acc": "5.049e-01", "epoch": 0.03157} {"step": 15790, "loss": 1.1497, "grad_norm": "4.170e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.175e-01", "anc_acc": "4.994e-01", "epoch": 0.03158} {"step": 15795, "loss": 1.1635, "grad_norm": "2.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.520e+00", "dlm_acc": "5.208e-01", "anc_acc": "4.999e-01", "epoch": 0.03159} {"step": 15800, "loss": 1.4623, "grad_norm": "5.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.401e+00", "dlm_acc": "5.340e-01", "anc_acc": "5.189e-01", "epoch": 0.0316} {"step": 15805, "loss": 1.7503, "grad_norm": "3.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.812e+00", "anc_loss": "1.916e+00", "dlm_acc": "4.452e-01", "anc_acc": "4.247e-01", "epoch": 0.03161} {"step": 15810, "loss": 1.2484, "grad_norm": "3.957e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.542e+00", "anc_loss": "1.606e+00", "dlm_acc": "4.388e-01", "anc_acc": "4.265e-01", "epoch": 0.03162} {"step": 15815, "loss": 1.4437, "grad_norm": "7.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.312e-01", "anc_acc": "5.202e-01", "epoch": 0.03163} {"step": 15820, "loss": 1.3846, "grad_norm": "3.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.204e-01", "anc_acc": "4.973e-01", "epoch": 0.03164} {"step": 15825, "loss": 1.5549, "grad_norm": "5.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.580e+00", "anc_loss": "1.666e+00", "dlm_acc": "4.497e-01", "anc_acc": "4.276e-01", "epoch": 0.03165} {"step": 15830, "loss": 2.0291, "grad_norm": "8.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.177e+00", "anc_loss": "2.230e+00", "dlm_acc": "3.131e-01", "anc_acc": "3.022e-01", "epoch": 0.03166} {"step": 15835, "loss": 1.2881, "grad_norm": "5.510e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.627e-01", "anc_loss": "1.046e+00", "dlm_acc": "6.409e-01", "anc_acc": "6.226e-01", "epoch": 0.03167} {"step": 15840, "loss": 1.5508, "grad_norm": "3.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.331e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.682e-01", "anc_acc": "5.500e-01", "epoch": 0.03168} {"step": 15845, "loss": 1.3798, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.204e+00", "dlm_acc": "5.814e-01", "anc_acc": "5.568e-01", "epoch": 0.03169} {"step": 15850, "loss": 1.3994, "grad_norm": "3.101e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.294e+00", "anc_loss": "1.378e+00", "dlm_acc": "5.439e-01", "anc_acc": "5.227e-01", "epoch": 0.0317} {"step": 15855, "loss": 1.1635, "grad_norm": "7.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.251e+00", "dlm_acc": "5.249e-01", "anc_acc": "5.110e-01", "epoch": 0.03171} {"step": 15860, "loss": 1.5378, "grad_norm": "4.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.762e-01", "anc_acc": "5.600e-01", "epoch": 0.03172} {"step": 15865, "loss": 1.9161, "grad_norm": "3.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.324e+00", "dlm_acc": "5.534e-01", "anc_acc": "5.331e-01", "epoch": 0.03173} {"step": 15870, "loss": 1.6672, "grad_norm": "2.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.163e+00", "anc_loss": "1.270e+00", "dlm_acc": "5.521e-01", "anc_acc": "5.252e-01", "epoch": 0.03174} {"step": 15875, "loss": 1.5948, "grad_norm": "2.545e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.189e+00", "dlm_acc": "5.390e-01", "anc_acc": "5.127e-01", "epoch": 0.03175} {"step": 15880, "loss": 1.1763, "grad_norm": "4.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.008e-01", "anc_loss": "8.641e-01", "dlm_acc": "6.640e-01", "anc_acc": "6.483e-01", "epoch": 0.03176} {"step": 15885, "loss": 0.7939, "grad_norm": "3.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.453e-01", "anc_loss": "9.143e-01", "dlm_acc": "6.634e-01", "anc_acc": "6.450e-01", "epoch": 0.03177} {"step": 15890, "loss": 1.0417, "grad_norm": "3.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.407e+00", "dlm_acc": "5.076e-01", "anc_acc": "4.856e-01", "epoch": 0.03178} {"step": 15895, "loss": 1.2199, "grad_norm": "5.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.273e-01", "epoch": 0.03179} {"step": 15900, "loss": 1.5219, "grad_norm": "3.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.541e+00", "dlm_acc": "4.689e-01", "anc_acc": "4.505e-01", "epoch": 0.0318} {"step": 15905, "loss": 1.2973, "grad_norm": "2.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.153e+00", "dlm_acc": "5.789e-01", "anc_acc": "5.605e-01", "epoch": 0.03181} {"step": 15910, "loss": 1.4253, "grad_norm": "7.785e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.325e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.416e-01", "anc_acc": "5.234e-01", "epoch": 0.03182} {"step": 15915, "loss": 0.8529, "grad_norm": "2.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.609e-01", "anc_loss": "1.048e+00", "dlm_acc": "6.212e-01", "anc_acc": "6.000e-01", "epoch": 0.03183} {"step": 15920, "loss": 1.2042, "grad_norm": "4.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.891e-01", "anc_loss": "8.039e-01", "dlm_acc": "4.579e-01", "anc_acc": "4.494e-01", "epoch": 0.03184} {"step": 15925, "loss": 1.1616, "grad_norm": "2.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.113e+00", "dlm_acc": "4.755e-01", "anc_acc": "4.678e-01", "epoch": 0.03185} {"step": 15930, "loss": 1.3939, "grad_norm": "4.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.818e+00", "anc_loss": "1.927e+00", "dlm_acc": "4.360e-01", "anc_acc": "4.262e-01", "epoch": 0.03186} {"step": 15935, "loss": 0.816, "grad_norm": "2.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.294e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.263e-01", "anc_acc": "5.063e-01", "epoch": 0.03187} {"step": 15940, "loss": 0.8282, "grad_norm": "1.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.324e+00", "anc_loss": "1.383e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.977e-01", "epoch": 0.03188} {"step": 15945, "loss": 0.6563, "grad_norm": "1.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.111e+00", "anc_loss": "1.169e+00", "dlm_acc": "6.207e-01", "anc_acc": "6.072e-01", "epoch": 0.03189} {"step": 15950, "loss": 0.6366, "grad_norm": "2.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.539e-01", "anc_loss": "1.017e+00", "dlm_acc": "6.779e-01", "anc_acc": "6.610e-01", "epoch": 0.0319} {"step": 15955, "loss": 0.9054, "grad_norm": "2.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.584e-01", "anc_acc": "5.361e-01", "epoch": 0.03191} {"step": 15960, "loss": 0.9619, "grad_norm": "1.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.756e+00", "anc_loss": "1.831e+00", "dlm_acc": "4.045e-01", "anc_acc": "3.866e-01", "epoch": 0.03192} {"step": 15965, "loss": 1.0258, "grad_norm": "4.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.145e+00", "anc_loss": "2.173e+00", "dlm_acc": "2.443e-01", "anc_acc": "2.369e-01", "epoch": 0.03193} {"step": 15970, "loss": 0.9767, "grad_norm": "5.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.582e-01", "anc_loss": "1.018e+00", "dlm_acc": "5.493e-01", "anc_acc": "5.326e-01", "epoch": 0.03194} {"step": 15975, "loss": 1.2104, "grad_norm": "3.294e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.410e+00", "anc_loss": "1.501e+00", "dlm_acc": "5.172e-01", "anc_acc": "5.001e-01", "epoch": 0.03195} {"step": 15980, "loss": 1.5175, "grad_norm": "4.598e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.823e+00", "anc_loss": "1.942e+00", "dlm_acc": "4.587e-01", "anc_acc": "4.359e-01", "epoch": 0.03196} {"step": 15985, "loss": 1.1324, "grad_norm": "3.580e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.217e+00", "dlm_acc": "5.494e-01", "anc_acc": "5.297e-01", "epoch": 0.03197} {"step": 15990, "loss": 0.831, "grad_norm": "5.207e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.477e-01", "anc_loss": "9.000e-01", "dlm_acc": "5.470e-01", "anc_acc": "5.313e-01", "epoch": 0.03198} {"step": 15995, "loss": 0.7713, "grad_norm": "3.053e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.383e-01", "anc_loss": "9.914e-01", "dlm_acc": "5.690e-01", "anc_acc": "5.560e-01", "epoch": 0.03199} {"step": 16000, "loss": 1.0079, "grad_norm": "4.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.387e-01", "anc_loss": "9.289e-01", "dlm_acc": "6.621e-01", "anc_acc": "6.302e-01", "epoch": 0.032} {"step": 16005, "loss": 0.9211, "grad_norm": "2.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.292e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.416e-01", "anc_acc": "5.196e-01", "epoch": 0.03201} {"step": 16010, "loss": 1.0375, "grad_norm": "3.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.633e+00", "anc_loss": "1.706e+00", "dlm_acc": "4.425e-01", "anc_acc": "4.322e-01", "epoch": 0.03202} {"step": 16015, "loss": 1.0091, "grad_norm": "6.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.410e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.081e-01", "anc_acc": "4.913e-01", "epoch": 0.03203} {"step": 16020, "loss": 1.271, "grad_norm": "3.939e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.292e+00", "anc_loss": "2.348e+00", "dlm_acc": "1.168e-01", "anc_acc": "1.116e-01", "epoch": 0.03204} {"step": 16025, "loss": 1.0357, "grad_norm": "5.136e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.278e+00", "anc_loss": "1.335e+00", "dlm_acc": "5.281e-01", "anc_acc": "5.145e-01", "epoch": 0.03205} {"step": 16030, "loss": 1.3202, "grad_norm": "5.041e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.280e-01", "anc_acc": "5.092e-01", "epoch": 0.03206} {"step": 16035, "loss": 1.0816, "grad_norm": "3.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.150e-01", "anc_acc": "4.926e-01", "epoch": 0.03207} {"step": 16040, "loss": 1.0552, "grad_norm": "3.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.315e+00", "dlm_acc": "5.774e-01", "anc_acc": "5.572e-01", "epoch": 0.03208} {"step": 16045, "loss": 1.1031, "grad_norm": "4.649e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.641e+00", "anc_loss": "1.732e+00", "dlm_acc": "4.536e-01", "anc_acc": "4.320e-01", "epoch": 0.03209} {"step": 16050, "loss": 0.7167, "grad_norm": "5.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.646e-01", "anc_loss": "7.365e-01", "dlm_acc": "7.384e-01", "anc_acc": "7.150e-01", "epoch": 0.0321} {"step": 16055, "loss": 1.3791, "grad_norm": "2.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.083e+00", "anc_loss": "1.169e+00", "dlm_acc": "5.700e-01", "anc_acc": "5.423e-01", "epoch": 0.03211} {"step": 16060, "loss": 1.0459, "grad_norm": "2.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.141e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.542e-01", "epoch": 0.03212} {"step": 16065, "loss": 1.1896, "grad_norm": "5.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.315e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.199e-01", "anc_acc": "5.014e-01", "epoch": 0.03213} {"step": 16070, "loss": 1.3608, "grad_norm": "6.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.336e+00", "anc_loss": "1.431e+00", "dlm_acc": "5.392e-01", "anc_acc": "5.167e-01", "epoch": 0.03214} {"step": 16075, "loss": 1.0894, "grad_norm": "3.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.295e-01", "anc_acc": "5.078e-01", "epoch": 0.03215} {"step": 16080, "loss": 1.1795, "grad_norm": "3.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.253e-01", "anc_acc": "5.075e-01", "epoch": 0.03216} {"step": 16085, "loss": 1.2626, "grad_norm": "3.306e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.148e-01", "anc_loss": "9.523e-01", "dlm_acc": "5.896e-01", "anc_acc": "5.756e-01", "epoch": 0.03217} {"step": 16090, "loss": 1.0188, "grad_norm": "3.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.313e-01", "anc_loss": "8.594e-01", "dlm_acc": "5.412e-01", "anc_acc": "5.360e-01", "epoch": 0.03218} {"step": 16095, "loss": 1.3099, "grad_norm": "3.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.082e+00", "dlm_acc": "5.501e-01", "anc_acc": "5.308e-01", "epoch": 0.03219} {"step": 16100, "loss": 1.1872, "grad_norm": "2.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.341e-01", "anc_acc": "5.140e-01", "epoch": 0.0322} {"step": 16105, "loss": 1.1247, "grad_norm": "9.872e-02", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.257e+00", "dlm_acc": "5.149e-01", "anc_acc": "4.913e-01", "epoch": 0.03221} {"step": 16110, "loss": 0.981, "grad_norm": "3.358e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.258e-01", "anc_loss": "7.336e-01", "dlm_acc": "4.142e-01", "anc_acc": "4.079e-01", "epoch": 0.03222} {"step": 16115, "loss": 1.2892, "grad_norm": "3.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.719e-01", "anc_loss": "7.875e-01", "dlm_acc": "4.023e-01", "anc_acc": "3.922e-01", "epoch": 0.03223} {"step": 16120, "loss": 1.0317, "grad_norm": "4.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.531e-01", "anc_loss": "7.613e-01", "dlm_acc": "3.796e-01", "anc_acc": "3.752e-01", "epoch": 0.03224} {"step": 16125, "loss": 1.219, "grad_norm": "2.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.031e-01", "anc_loss": "9.508e-01", "dlm_acc": "5.699e-01", "anc_acc": "5.570e-01", "epoch": 0.03225} {"step": 16130, "loss": 1.5838, "grad_norm": "2.622e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.820e+00", "anc_loss": "1.883e+00", "dlm_acc": "3.958e-01", "anc_acc": "3.814e-01", "epoch": 0.03226} {"step": 16135, "loss": 1.1946, "grad_norm": "3.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.483e-01", "anc_acc": "5.284e-01", "epoch": 0.03227} {"step": 16140, "loss": 1.4684, "grad_norm": "3.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.326e+00", "dlm_acc": "5.977e-01", "anc_acc": "5.737e-01", "epoch": 0.03228} {"step": 16145, "loss": 1.2885, "grad_norm": "1.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.825e-01", "anc_acc": "5.605e-01", "epoch": 0.03229} {"step": 16150, "loss": 1.284, "grad_norm": "3.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.329e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.563e-01", "anc_acc": "5.375e-01", "epoch": 0.0323} {"step": 16155, "loss": 1.3396, "grad_norm": "3.596e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.487e-01", "anc_acc": "5.271e-01", "epoch": 0.03231} {"step": 16160, "loss": 1.3929, "grad_norm": "5.271e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.500e+00", "dlm_acc": "4.864e-01", "anc_acc": "4.691e-01", "epoch": 0.03232} {"step": 16165, "loss": 1.4842, "grad_norm": "4.179e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.642e-01", "anc_acc": "5.459e-01", "epoch": 0.03233} {"step": 16170, "loss": 1.5935, "grad_norm": "4.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.883e+00", "anc_loss": "1.983e+00", "dlm_acc": "4.696e-01", "anc_acc": "4.513e-01", "epoch": 0.03234} {"step": 16175, "loss": 1.3673, "grad_norm": "4.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.247e-01", "anc_acc": "5.037e-01", "epoch": 0.03235} {"step": 16180, "loss": 0.9249, "grad_norm": "2.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.409e-01", "anc_loss": "8.172e-01", "dlm_acc": "7.126e-01", "anc_acc": "6.912e-01", "epoch": 0.03236} {"step": 16185, "loss": 1.0869, "grad_norm": "2.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.824e-01", "anc_acc": "5.577e-01", "epoch": 0.03237} {"step": 16190, "loss": 1.1108, "grad_norm": "3.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.379e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.458e-01", "epoch": 0.03238} {"step": 16195, "loss": 0.9589, "grad_norm": "4.813e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.756e-01", "anc_acc": "5.537e-01", "epoch": 0.03239} {"step": 16200, "loss": 1.141, "grad_norm": "3.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.663e+00", "dlm_acc": "4.916e-01", "anc_acc": "4.745e-01", "epoch": 0.0324} {"step": 16205, "loss": 1.1793, "grad_norm": "2.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.367e-01", "anc_acc": "5.164e-01", "epoch": 0.03241} {"step": 16210, "loss": 1.274, "grad_norm": "2.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.549e+00", "anc_loss": "1.653e+00", "dlm_acc": "4.908e-01", "anc_acc": "4.677e-01", "epoch": 0.03242} {"step": 16215, "loss": 1.3758, "grad_norm": "4.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.716e+00", "anc_loss": "1.819e+00", "dlm_acc": "4.819e-01", "anc_acc": "4.624e-01", "epoch": 0.03243} {"step": 16220, "loss": 1.1186, "grad_norm": "2.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.424e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.110e-01", "epoch": 0.03244} {"step": 16225, "loss": 1.535, "grad_norm": "4.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.627e+00", "anc_loss": "1.733e+00", "dlm_acc": "4.911e-01", "anc_acc": "4.712e-01", "epoch": 0.03245} {"step": 16230, "loss": 1.3112, "grad_norm": "5.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.156e+00", "dlm_acc": "5.971e-01", "anc_acc": "5.796e-01", "epoch": 0.03246} {"step": 16235, "loss": 1.6685, "grad_norm": "3.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.844e+00", "anc_loss": "1.927e+00", "dlm_acc": "4.326e-01", "anc_acc": "4.164e-01", "epoch": 0.03247} {"step": 16240, "loss": 0.9905, "grad_norm": "1.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.297e-01", "epoch": 0.03248} {"step": 16245, "loss": 1.1765, "grad_norm": "2.377e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.260e+00", "dlm_acc": "5.703e-01", "anc_acc": "5.525e-01", "epoch": 0.03249} {"step": 16250, "loss": 1.3849, "grad_norm": "1.884e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.557e+00", "anc_loss": "1.630e+00", "dlm_acc": "4.469e-01", "anc_acc": "4.316e-01", "epoch": 0.0325} {"step": 16255, "loss": 1.098, "grad_norm": "3.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.258e+00", "dlm_acc": "4.449e-01", "anc_acc": "4.334e-01", "epoch": 0.03251} {"step": 16260, "loss": 1.1936, "grad_norm": "2.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.315e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.380e-01", "anc_acc": "5.151e-01", "epoch": 0.03252} {"step": 16265, "loss": 1.0991, "grad_norm": "2.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.215e+00", "dlm_acc": "5.866e-01", "anc_acc": "5.713e-01", "epoch": 0.03253} {"step": 16270, "loss": 1.1329, "grad_norm": "2.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.543e-01", "anc_acc": "5.339e-01", "epoch": 0.03254} {"step": 16275, "loss": 1.1651, "grad_norm": "3.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.362e+00", "anc_loss": "1.439e+00", "dlm_acc": "4.962e-01", "anc_acc": "4.812e-01", "epoch": 0.03255} {"step": 16280, "loss": 1.4959, "grad_norm": "3.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.483e+00", "dlm_acc": "5.285e-01", "anc_acc": "5.096e-01", "epoch": 0.03256} {"step": 16285, "loss": 1.2625, "grad_norm": "5.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.752e+00", "anc_loss": "1.855e+00", "dlm_acc": "4.638e-01", "anc_acc": "4.446e-01", "epoch": 0.03257} {"step": 16290, "loss": 1.2469, "grad_norm": "2.912e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.310e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.193e-01", "anc_acc": "4.977e-01", "epoch": 0.03258} {"step": 16295, "loss": 1.2847, "grad_norm": "3.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.539e+00", "anc_loss": "1.609e+00", "dlm_acc": "4.707e-01", "anc_acc": "4.544e-01", "epoch": 0.03259} {"step": 16300, "loss": 0.8481, "grad_norm": "3.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.470e+00", "dlm_acc": "5.054e-01", "anc_acc": "4.880e-01", "epoch": 0.0326} {"step": 16305, "loss": 1.0715, "grad_norm": "4.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.443e-01", "anc_loss": "1.009e+00", "dlm_acc": "6.527e-01", "anc_acc": "6.308e-01", "epoch": 0.03261} {"step": 16310, "loss": 1.4792, "grad_norm": "3.780e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.700e+00", "anc_loss": "1.786e+00", "dlm_acc": "4.823e-01", "anc_acc": "4.649e-01", "epoch": 0.03262} {"step": 16315, "loss": 1.379, "grad_norm": "4.834e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.684e+00", "anc_loss": "1.778e+00", "dlm_acc": "4.882e-01", "anc_acc": "4.709e-01", "epoch": 0.03263} {"step": 16320, "loss": 1.1352, "grad_norm": "3.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.795e+00", "anc_loss": "1.909e+00", "dlm_acc": "4.543e-01", "anc_acc": "4.326e-01", "epoch": 0.03264} {"step": 16325, "loss": 0.9128, "grad_norm": "2.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.816e-01", "anc_acc": "5.598e-01", "epoch": 0.03265} {"step": 16330, "loss": 1.1271, "grad_norm": "3.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.708e+00", "dlm_acc": "4.767e-01", "anc_acc": "4.589e-01", "epoch": 0.03266} {"step": 16335, "loss": 0.9219, "grad_norm": "6.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.867e-01", "anc_loss": "8.008e-01", "dlm_acc": "4.902e-01", "anc_acc": "4.865e-01", "epoch": 0.03267} {"step": 16340, "loss": 1.4749, "grad_norm": "3.616e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.191e+00", "dlm_acc": "3.338e-01", "anc_acc": "3.324e-01", "epoch": 0.03268} {"step": 16345, "loss": 1.2632, "grad_norm": "2.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.570e+00", "anc_loss": "1.653e+00", "dlm_acc": "4.912e-01", "anc_acc": "4.709e-01", "epoch": 0.03269} {"step": 16350, "loss": 1.4616, "grad_norm": "3.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.581e+00", "anc_loss": "1.666e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.953e-01", "epoch": 0.0327} {"step": 16355, "loss": 1.526, "grad_norm": "3.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.891e+00", "anc_loss": "1.998e+00", "dlm_acc": "4.855e-01", "anc_acc": "4.680e-01", "epoch": 0.03271} {"step": 16360, "loss": 1.0666, "grad_norm": "2.245e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.191e+00", "dlm_acc": "5.622e-01", "anc_acc": "5.426e-01", "epoch": 0.03272} {"step": 16365, "loss": 1.3059, "grad_norm": "3.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.568e+00", "dlm_acc": "5.110e-01", "anc_acc": "4.975e-01", "epoch": 0.03273} {"step": 16370, "loss": 0.9934, "grad_norm": "2.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.692e-01", "anc_acc": "5.519e-01", "epoch": 0.03274} {"step": 16375, "loss": 1.1714, "grad_norm": "1.794e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.508e+00", "dlm_acc": "4.938e-01", "anc_acc": "4.728e-01", "epoch": 0.03275} {"step": 16380, "loss": 1.4506, "grad_norm": "5.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.989e+00", "anc_loss": "2.069e+00", "dlm_acc": "4.424e-01", "anc_acc": "4.303e-01", "epoch": 0.03276} {"step": 16385, "loss": 1.0385, "grad_norm": "4.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.051e-01", "anc_loss": "8.625e-01", "dlm_acc": "6.497e-01", "anc_acc": "6.304e-01", "epoch": 0.03277} {"step": 16390, "loss": 1.0219, "grad_norm": "3.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.012e-01", "anc_loss": "8.367e-01", "dlm_acc": "5.656e-01", "anc_acc": "5.557e-01", "epoch": 0.03278} {"step": 16395, "loss": 1.3125, "grad_norm": "2.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.656e-01", "anc_loss": "1.030e+00", "dlm_acc": "5.770e-01", "anc_acc": "5.577e-01", "epoch": 0.03279} {"step": 16400, "loss": 1.5039, "grad_norm": "6.639e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.487e+00", "anc_loss": "1.542e+00", "dlm_acc": "5.116e-01", "anc_acc": "4.993e-01", "epoch": 0.0328} {"step": 16405, "loss": 1.1815, "grad_norm": "7.782e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.389e-01", "anc_loss": "8.833e-01", "dlm_acc": "7.360e-01", "anc_acc": "7.272e-01", "epoch": 0.03281} {"step": 16410, "loss": 1.1323, "grad_norm": "5.438e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.447e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.341e-01", "anc_acc": "5.175e-01", "epoch": 0.03282} {"step": 16415, "loss": 0.9953, "grad_norm": "2.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.092e+00", "dlm_acc": "5.982e-01", "anc_acc": "5.786e-01", "epoch": 0.03283} {"step": 16420, "loss": 0.8322, "grad_norm": "3.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.695e-01", "anc_loss": "1.055e+00", "dlm_acc": "6.522e-01", "anc_acc": "6.303e-01", "epoch": 0.03284} {"step": 16425, "loss": 1.0997, "grad_norm": "5.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.840e-01", "anc_loss": "9.473e-01", "dlm_acc": "6.412e-01", "anc_acc": "6.234e-01", "epoch": 0.03285} {"step": 16430, "loss": 1.1494, "grad_norm": "3.158e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.255e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.545e-01", "anc_acc": "5.386e-01", "epoch": 0.03286} {"step": 16435, "loss": 1.1962, "grad_norm": "4.640e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.000e-01", "anc_acc": "4.816e-01", "epoch": 0.03287} {"step": 16440, "loss": 1.1677, "grad_norm": "3.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.473e-01", "anc_loss": "5.516e-01", "dlm_acc": "6.296e-01", "anc_acc": "6.265e-01", "epoch": 0.03288} {"step": 16445, "loss": 0.8736, "grad_norm": "2.757e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.053e-01", "anc_loss": "4.109e-01", "dlm_acc": "6.907e-01", "anc_acc": "6.887e-01", "epoch": 0.03289} {"step": 16450, "loss": 1.3596, "grad_norm": "4.545e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.310e-01", "anc_acc": "5.191e-01", "epoch": 0.0329} {"step": 16455, "loss": 1.2435, "grad_norm": "4.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.173e+00", "dlm_acc": "6.050e-01", "anc_acc": "5.863e-01", "epoch": 0.03291} {"step": 16460, "loss": 0.9051, "grad_norm": "2.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.090e-01", "anc_loss": "5.600e-01", "dlm_acc": "7.831e-01", "anc_acc": "7.708e-01", "epoch": 0.03292} {"step": 16465, "loss": 1.5146, "grad_norm": "5.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.553e+00", "dlm_acc": "5.374e-01", "anc_acc": "5.193e-01", "epoch": 0.03293} {"step": 16470, "loss": 1.137, "grad_norm": "5.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.602e-01", "anc_loss": "8.098e-01", "dlm_acc": "6.102e-01", "anc_acc": "5.923e-01", "epoch": 0.03294} {"step": 16475, "loss": 1.2913, "grad_norm": "3.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.124e+00", "dlm_acc": "5.465e-01", "anc_acc": "5.311e-01", "epoch": 0.03295} {"step": 16480, "loss": 0.7438, "grad_norm": "1.719e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.258e-01", "anc_loss": "6.570e-01", "dlm_acc": "6.112e-01", "anc_acc": "5.990e-01", "epoch": 0.03296} {"step": 16485, "loss": 1.3595, "grad_norm": "4.725e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.069e+00", "dlm_acc": "5.297e-01", "anc_acc": "5.140e-01", "epoch": 0.03297} {"step": 16490, "loss": 1.0911, "grad_norm": "2.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.953e-01", "anc_loss": "7.023e-01", "dlm_acc": "5.488e-01", "anc_acc": "5.466e-01", "epoch": 0.03298} {"step": 16495, "loss": 1.4839, "grad_norm": "3.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.049e+00", "anc_loss": "1.101e+00", "dlm_acc": "5.931e-01", "anc_acc": "5.812e-01", "epoch": 0.03299} {"step": 16500, "loss": 0.928, "grad_norm": "2.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.719e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.392e-01", "anc_acc": "6.215e-01", "epoch": 0.033} {"step": 16505, "loss": 1.168, "grad_norm": "2.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.602e-01", "anc_loss": "7.051e-01", "dlm_acc": "6.391e-01", "anc_acc": "6.221e-01", "epoch": 0.03301} {"step": 16510, "loss": 1.448, "grad_norm": "1.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.716e-01", "anc_acc": "5.552e-01", "epoch": 0.03302} {"step": 16515, "loss": 0.9034, "grad_norm": "2.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.063e+00", "dlm_acc": "6.905e-01", "anc_acc": "6.796e-01", "epoch": 0.03303} {"step": 16520, "loss": 1.3691, "grad_norm": "3.559e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.935e-01", "anc_loss": "8.488e-01", "dlm_acc": "6.853e-01", "anc_acc": "6.699e-01", "epoch": 0.03304} {"step": 16525, "loss": 1.5114, "grad_norm": "4.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.226e+00", "dlm_acc": "5.405e-01", "anc_acc": "5.193e-01", "epoch": 0.03305} {"step": 16530, "loss": 1.2622, "grad_norm": "2.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.422e-01", "anc_loss": "6.562e-01", "dlm_acc": "5.898e-01", "anc_acc": "5.840e-01", "epoch": 0.03306} {"step": 16535, "loss": 1.2325, "grad_norm": "2.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.898e-01", "anc_loss": "6.961e-01", "dlm_acc": "5.630e-01", "anc_acc": "5.603e-01", "epoch": 0.03307} {"step": 16540, "loss": 1.5849, "grad_norm": "3.538e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.969e-01", "anc_loss": "8.094e-01", "dlm_acc": "5.329e-01", "anc_acc": "5.303e-01", "epoch": 0.03308} {"step": 16545, "loss": 1.1146, "grad_norm": "1.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.832e-01", "anc_loss": "7.203e-01", "dlm_acc": "5.487e-01", "anc_acc": "5.353e-01", "epoch": 0.03309} {"step": 16550, "loss": 1.3781, "grad_norm": "3.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.855e-01", "anc_loss": "7.395e-01", "dlm_acc": "6.839e-01", "anc_acc": "6.692e-01", "epoch": 0.0331} {"step": 16555, "loss": 1.2783, "grad_norm": "2.813e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.778e-01", "anc_loss": "1.043e+00", "dlm_acc": "6.529e-01", "anc_acc": "6.320e-01", "epoch": 0.03311} {"step": 16560, "loss": 1.2283, "grad_norm": "3.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.301e-01", "anc_loss": "7.828e-01", "dlm_acc": "7.368e-01", "anc_acc": "7.217e-01", "epoch": 0.03312} {"step": 16565, "loss": 1.6856, "grad_norm": "4.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.601e+00", "dlm_acc": "5.329e-01", "anc_acc": "5.162e-01", "epoch": 0.03313} {"step": 16570, "loss": 0.9893, "grad_norm": "3.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.570e-01", "anc_loss": "9.977e-01", "dlm_acc": "5.503e-01", "anc_acc": "5.429e-01", "epoch": 0.03314} {"step": 16575, "loss": 1.415, "grad_norm": "1.185e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.211e-01", "anc_loss": "8.242e-01", "dlm_acc": "5.311e-01", "anc_acc": "5.298e-01", "epoch": 0.03315} {"step": 16580, "loss": 1.1246, "grad_norm": "2.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.469e-01", "anc_loss": "6.625e-01", "dlm_acc": "5.822e-01", "anc_acc": "5.758e-01", "epoch": 0.03316} {"step": 16585, "loss": 1.3615, "grad_norm": "3.639e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.061e-01", "anc_loss": "9.844e-01", "dlm_acc": "6.573e-01", "anc_acc": "6.336e-01", "epoch": 0.03317} {"step": 16590, "loss": 1.1124, "grad_norm": "3.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.625e-01", "anc_loss": "1.048e+00", "dlm_acc": "6.178e-01", "anc_acc": "5.891e-01", "epoch": 0.03318} {"step": 16595, "loss": 1.5267, "grad_norm": "3.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.575e-01", "anc_acc": "5.267e-01", "epoch": 0.03319} {"step": 16600, "loss": 1.2152, "grad_norm": "1.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.076e+00", "anc_loss": "1.179e+00", "dlm_acc": "5.926e-01", "anc_acc": "5.638e-01", "epoch": 0.0332} {"step": 16605, "loss": 1.0358, "grad_norm": "5.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.216e+00", "dlm_acc": "6.044e-01", "anc_acc": "5.839e-01", "epoch": 0.03321} {"step": 16610, "loss": 1.3412, "grad_norm": "3.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.009e-01", "anc_acc": "4.824e-01", "epoch": 0.03322} {"step": 16615, "loss": 1.6282, "grad_norm": "2.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.333e+00", "dlm_acc": "6.155e-01", "anc_acc": "5.955e-01", "epoch": 0.03323} {"step": 16620, "loss": 1.2034, "grad_norm": "5.256e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.320e-01", "anc_loss": "2.732e-01", "dlm_acc": "8.900e-01", "anc_acc": "8.773e-01", "epoch": 0.03324} {"step": 16625, "loss": 1.4687, "grad_norm": "2.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.896e-01", "anc_loss": "9.871e-01", "dlm_acc": "6.830e-01", "anc_acc": "6.572e-01", "epoch": 0.03325} {"step": 16630, "loss": 1.9647, "grad_norm": "7.325e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.809e+00", "anc_loss": "1.902e+00", "dlm_acc": "4.646e-01", "anc_acc": "4.449e-01", "epoch": 0.03326} {"step": 16635, "loss": 1.2895, "grad_norm": "3.259e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.106e+00", "dlm_acc": "6.306e-01", "anc_acc": "6.060e-01", "epoch": 0.03327} {"step": 16640, "loss": 1.1181, "grad_norm": "2.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.434e-01", "anc_loss": "9.359e-01", "dlm_acc": "6.457e-01", "anc_acc": "6.175e-01", "epoch": 0.03328} {"step": 16645, "loss": 1.2837, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.010e+00", "anc_loss": "1.078e+00", "dlm_acc": "6.143e-01", "anc_acc": "5.979e-01", "epoch": 0.03329} {"step": 16650, "loss": 1.3635, "grad_norm": "3.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.341e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.526e-01", "anc_acc": "5.341e-01", "epoch": 0.0333} {"step": 16655, "loss": 1.7701, "grad_norm": "3.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.712e+00", "anc_loss": "1.848e+00", "dlm_acc": "4.744e-01", "anc_acc": "4.474e-01", "epoch": 0.03331} {"step": 16660, "loss": 1.2929, "grad_norm": "6.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.836e-01", "anc_acc": "5.683e-01", "epoch": 0.03332} {"step": 16665, "loss": 1.2292, "grad_norm": "2.418e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.346e+00", "dlm_acc": "5.371e-01", "anc_acc": "5.188e-01", "epoch": 0.03333} {"step": 16670, "loss": 1.3274, "grad_norm": "3.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.324e-01", "epoch": 0.03334} {"step": 16675, "loss": 1.4847, "grad_norm": "3.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.343e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.622e-01", "anc_acc": "5.378e-01", "epoch": 0.03335} {"step": 16680, "loss": 1.7358, "grad_norm": "5.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.468e+00", "anc_loss": "1.526e+00", "dlm_acc": "4.508e-01", "anc_acc": "4.377e-01", "epoch": 0.03336} {"step": 16685, "loss": 1.3077, "grad_norm": "3.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.219e-01", "anc_loss": "8.766e-01", "dlm_acc": "6.609e-01", "anc_acc": "6.440e-01", "epoch": 0.03337} {"step": 16690, "loss": 1.4103, "grad_norm": "4.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.125e-01", "anc_loss": "9.797e-01", "dlm_acc": "6.209e-01", "anc_acc": "5.998e-01", "epoch": 0.03338} {"step": 16695, "loss": 1.1338, "grad_norm": "1.626e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.199e+00", "dlm_acc": "5.627e-01", "anc_acc": "5.366e-01", "epoch": 0.03339} {"step": 16700, "loss": 1.4286, "grad_norm": "2.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.625e+00", "anc_loss": "1.686e+00", "dlm_acc": "4.196e-01", "anc_acc": "4.083e-01", "epoch": 0.0334} {"step": 16705, "loss": 1.9283, "grad_norm": "4.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.549e+00", "anc_loss": "1.644e+00", "dlm_acc": "5.532e-01", "anc_acc": "5.332e-01", "epoch": 0.03341} {"step": 16710, "loss": 1.3474, "grad_norm": "2.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.257e+00", "dlm_acc": "5.629e-01", "anc_acc": "5.443e-01", "epoch": 0.03342} {"step": 16715, "loss": 1.5201, "grad_norm": "2.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.084e+00", "dlm_acc": "6.034e-01", "anc_acc": "5.951e-01", "epoch": 0.03343} {"step": 16720, "loss": 1.574, "grad_norm": "2.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.151e+00", "anc_loss": "1.228e+00", "dlm_acc": "5.433e-01", "anc_acc": "5.239e-01", "epoch": 0.03344} {"step": 16725, "loss": 1.1794, "grad_norm": "4.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.699e-01", "anc_loss": "1.014e+00", "dlm_acc": "5.807e-01", "anc_acc": "5.711e-01", "epoch": 0.03345} {"step": 16730, "loss": 1.9697, "grad_norm": "2.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.228e+00", "anc_loss": "2.237e+00", "dlm_acc": "1.546e-01", "anc_acc": "1.504e-01", "epoch": 0.03346} {"step": 16735, "loss": 1.2639, "grad_norm": "2.494e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.445e+00", "dlm_acc": "3.683e-01", "anc_acc": "3.609e-01", "epoch": 0.03347} {"step": 16740, "loss": 1.3321, "grad_norm": "6.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.803e+00", "anc_loss": "1.820e+00", "dlm_acc": "2.978e-01", "anc_acc": "2.906e-01", "epoch": 0.03348} {"step": 16745, "loss": 1.6135, "grad_norm": "3.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.544e+00", "anc_loss": "1.626e+00", "dlm_acc": "4.753e-01", "anc_acc": "4.544e-01", "epoch": 0.03349} {"step": 16750, "loss": 1.2246, "grad_norm": "2.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.294e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.208e-01", "anc_acc": "4.996e-01", "epoch": 0.0335} {"step": 16755, "loss": 1.236, "grad_norm": "1.190e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.979e-01", "anc_loss": "7.438e-01", "dlm_acc": "6.618e-01", "anc_acc": "6.399e-01", "epoch": 0.03351} {"step": 16760, "loss": 1.5414, "grad_norm": "4.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.152e-01", "anc_loss": "5.605e-01", "dlm_acc": "7.288e-01", "anc_acc": "7.077e-01", "epoch": 0.03352} {"step": 16765, "loss": 1.4741, "grad_norm": "4.379e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.897e-01", "anc_acc": "5.698e-01", "epoch": 0.03353} {"step": 16770, "loss": 1.7551, "grad_norm": "4.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.584e+00", "anc_loss": "1.670e+00", "dlm_acc": "4.961e-01", "anc_acc": "4.799e-01", "epoch": 0.03354} {"step": 16775, "loss": 2.0671, "grad_norm": "4.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.837e+00", "anc_loss": "1.939e+00", "dlm_acc": "4.600e-01", "anc_acc": "4.404e-01", "epoch": 0.03355} {"step": 16780, "loss": 0.8638, "grad_norm": "2.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.562e-01", "anc_loss": "9.219e-01", "dlm_acc": "6.000e-01", "anc_acc": "5.817e-01", "epoch": 0.03356} {"step": 16785, "loss": 1.3263, "grad_norm": "5.430e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.583e+00", "dlm_acc": "4.738e-01", "anc_acc": "4.574e-01", "epoch": 0.03357} {"step": 16790, "loss": 1.6962, "grad_norm": "3.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.493e+00", "anc_loss": "1.587e+00", "dlm_acc": "5.534e-01", "anc_acc": "5.342e-01", "epoch": 0.03358} {"step": 16795, "loss": 1.4354, "grad_norm": "3.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.086e-01", "anc_loss": "6.732e-01", "dlm_acc": "7.860e-01", "anc_acc": "7.697e-01", "epoch": 0.03359} {"step": 16800, "loss": 1.6425, "grad_norm": "1.012e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.393e+00", "anc_loss": "1.467e+00", "dlm_acc": "5.537e-01", "anc_acc": "5.359e-01", "epoch": 0.0336} {"step": 16805, "loss": 1.5703, "grad_norm": "5.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.666e+00", "dlm_acc": "5.196e-01", "anc_acc": "5.012e-01", "epoch": 0.03361} {"step": 16810, "loss": 1.1359, "grad_norm": "1.061e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.215e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.053e-01", "anc_acc": "4.890e-01", "epoch": 0.03362} {"step": 16815, "loss": 1.2147, "grad_norm": "3.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.103e+00", "dlm_acc": "4.466e-01", "anc_acc": "4.364e-01", "epoch": 0.03363} {"step": 16820, "loss": 1.548, "grad_norm": "2.834e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.486e+00", "anc_loss": "1.563e+00", "dlm_acc": "4.944e-01", "anc_acc": "4.793e-01", "epoch": 0.03364} {"step": 16825, "loss": 1.3803, "grad_norm": "4.424e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.123e-01", "anc_loss": "7.691e-01", "dlm_acc": "7.393e-01", "anc_acc": "7.241e-01", "epoch": 0.03365} {"step": 16830, "loss": 1.0215, "grad_norm": "2.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.542e-02", "anc_loss": "1.591e-02", "dlm_acc": "9.930e-01", "anc_acc": "9.929e-01", "epoch": 0.03366} {"step": 16835, "loss": 2.2072, "grad_norm": "6.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.025e+00", "anc_loss": "3.069e+00", "dlm_acc": "8.864e-02", "anc_acc": "8.530e-02", "epoch": 0.03367} {"step": 16840, "loss": 1.5209, "grad_norm": "7.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.569e+00", "anc_loss": "1.677e+00", "dlm_acc": "4.811e-01", "anc_acc": "4.572e-01", "epoch": 0.03368} {"step": 16845, "loss": 1.1393, "grad_norm": "9.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.336e+00", "dlm_acc": "5.753e-01", "anc_acc": "5.569e-01", "epoch": 0.03369} {"step": 16850, "loss": 1.8185, "grad_norm": "2.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.966e+00", "anc_loss": "2.059e+00", "dlm_acc": "4.703e-01", "anc_acc": "4.545e-01", "epoch": 0.0337} {"step": 16855, "loss": 1.2373, "grad_norm": "3.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.331e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.558e-01", "anc_acc": "5.331e-01", "epoch": 0.03371} {"step": 16860, "loss": 1.1821, "grad_norm": "8.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.383e+00", "anc_loss": "1.434e+00", "dlm_acc": "4.798e-01", "anc_acc": "4.701e-01", "epoch": 0.03372} {"step": 16865, "loss": 1.1976, "grad_norm": "2.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.101e-01", "anc_loss": "8.538e-01", "dlm_acc": "6.831e-01", "anc_acc": "6.719e-01", "epoch": 0.03373} {"step": 16870, "loss": 1.1946, "grad_norm": "2.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.214e+00", "dlm_acc": "5.858e-01", "anc_acc": "5.660e-01", "epoch": 0.03374} {"step": 16875, "loss": 1.5061, "grad_norm": "2.844e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.955e+00", "anc_loss": "2.032e+00", "dlm_acc": "4.107e-01", "anc_acc": "3.977e-01", "epoch": 0.03375} {"step": 16880, "loss": 1.1606, "grad_norm": "2.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.423e+00", "dlm_acc": "4.900e-01", "anc_acc": "4.685e-01", "epoch": 0.03376} {"step": 16885, "loss": 1.5706, "grad_norm": "5.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.828e-01", "anc_loss": "1.054e+00", "dlm_acc": "5.476e-01", "anc_acc": "5.247e-01", "epoch": 0.03377} {"step": 16890, "loss": 1.5982, "grad_norm": "4.381e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.526e+00", "dlm_acc": "5.632e-01", "anc_acc": "5.419e-01", "epoch": 0.03378} {"step": 16895, "loss": 1.048, "grad_norm": "4.803e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.213e-01", "anc_acc": "5.025e-01", "epoch": 0.03379} {"step": 16900, "loss": 1.1829, "grad_norm": "4.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.348e+00", "dlm_acc": "4.798e-01", "anc_acc": "4.476e-01", "epoch": 0.0338} {"step": 16905, "loss": 1.3235, "grad_norm": "5.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.712e-01", "anc_acc": "5.353e-01", "epoch": 0.03381} {"step": 16910, "loss": 1.0564, "grad_norm": "3.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.703e-01", "anc_acc": "5.484e-01", "epoch": 0.03382} {"step": 16915, "loss": 1.2075, "grad_norm": "3.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.422e+00", "anc_loss": "1.509e+00", "dlm_acc": "5.027e-01", "anc_acc": "4.837e-01", "epoch": 0.03383} {"step": 16920, "loss": 1.6424, "grad_norm": "8.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.723e+00", "anc_loss": "1.828e+00", "dlm_acc": "4.973e-01", "anc_acc": "4.793e-01", "epoch": 0.03384} {"step": 16925, "loss": 0.9086, "grad_norm": "2.747e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.278e+00", "dlm_acc": "5.876e-01", "anc_acc": "5.664e-01", "epoch": 0.03385} {"step": 16930, "loss": 0.9725, "grad_norm": "5.236e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.561e+00", "dlm_acc": "5.080e-01", "anc_acc": "4.897e-01", "epoch": 0.03386} {"step": 16935, "loss": 0.9435, "grad_norm": "3.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.602e-01", "anc_loss": "8.121e-01", "dlm_acc": "6.614e-01", "anc_acc": "6.513e-01", "epoch": 0.03387} {"step": 16940, "loss": 0.9007, "grad_norm": "1.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.844e-01", "anc_loss": "9.555e-01", "dlm_acc": "6.185e-01", "anc_acc": "5.964e-01", "epoch": 0.03388} {"step": 16945, "loss": 1.2528, "grad_norm": "3.337e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.213e-01", "anc_acc": "4.978e-01", "epoch": 0.03389} {"step": 16950, "loss": 1.4595, "grad_norm": "5.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.944e+00", "anc_loss": "2.002e+00", "dlm_acc": "3.547e-01", "anc_acc": "3.430e-01", "epoch": 0.0339} {"step": 16955, "loss": 1.0003, "grad_norm": "5.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.207e+00", "dlm_acc": "4.996e-01", "anc_acc": "4.827e-01", "epoch": 0.03391} {"step": 16960, "loss": 0.953, "grad_norm": "6.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.832e-01", "anc_loss": "9.344e-01", "dlm_acc": "6.121e-01", "anc_acc": "6.014e-01", "epoch": 0.03392} {"step": 16965, "loss": 1.296, "grad_norm": "2.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.777e+00", "anc_loss": "1.844e+00", "dlm_acc": "3.955e-01", "anc_acc": "3.810e-01", "epoch": 0.03393} {"step": 16970, "loss": 0.9136, "grad_norm": "2.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.680e-01", "anc_loss": "9.484e-01", "dlm_acc": "6.466e-01", "anc_acc": "6.256e-01", "epoch": 0.03394} {"step": 16975, "loss": 1.2801, "grad_norm": "2.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.129e+00", "dlm_acc": "6.419e-01", "anc_acc": "6.225e-01", "epoch": 0.03395} {"step": 16980, "loss": 1.1578, "grad_norm": "5.196e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.645e-01", "anc_loss": "1.061e+00", "dlm_acc": "6.086e-01", "anc_acc": "5.724e-01", "epoch": 0.03396} {"step": 16985, "loss": 1.111, "grad_norm": "3.930e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.031e+00", "anc_loss": "1.099e+00", "dlm_acc": "5.751e-01", "anc_acc": "5.548e-01", "epoch": 0.03397} {"step": 16990, "loss": 1.1253, "grad_norm": "4.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.197e-01", "anc_loss": "3.469e-01", "dlm_acc": "8.075e-01", "anc_acc": "7.932e-01", "epoch": 0.03398} {"step": 16995, "loss": 0.9914, "grad_norm": "4.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.624e-01", "anc_loss": "3.918e-01", "dlm_acc": "7.871e-01", "anc_acc": "7.693e-01", "epoch": 0.03399} {"step": 17000, "loss": 1.2456, "grad_norm": "4.065e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.461e-01", "anc_loss": "8.887e-01", "dlm_acc": "6.583e-01", "anc_acc": "6.553e-01", "epoch": 0.034} {"step": 17005, "loss": 1.2326, "grad_norm": "3.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.315e+00", "dlm_acc": "5.649e-01", "anc_acc": "5.497e-01", "epoch": 0.03401} {"step": 17010, "loss": 1.2236, "grad_norm": "2.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.400e-01", "anc_loss": "8.881e-01", "dlm_acc": "7.099e-01", "anc_acc": "6.957e-01", "epoch": 0.03402} {"step": 17015, "loss": 1.2084, "grad_norm": "4.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.433e+00", "dlm_acc": "5.070e-01", "anc_acc": "4.836e-01", "epoch": 0.03403} {"step": 17020, "loss": 1.3161, "grad_norm": "4.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.729e-01", "anc_acc": "5.569e-01", "epoch": 0.03404} {"step": 17025, "loss": 1.1075, "grad_norm": "6.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.491e+00", "dlm_acc": "4.570e-01", "anc_acc": "4.432e-01", "epoch": 0.03405} {"step": 17030, "loss": 1.1368, "grad_norm": "3.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.577e+00", "anc_loss": "1.655e+00", "dlm_acc": "4.556e-01", "anc_acc": "4.392e-01", "epoch": 0.03406} {"step": 17035, "loss": 0.83, "grad_norm": "3.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.279e+00", "anc_loss": "1.354e+00", "dlm_acc": "5.457e-01", "anc_acc": "5.276e-01", "epoch": 0.03407} {"step": 17040, "loss": 1.255, "grad_norm": "3.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.268e+00", "anc_loss": "1.351e+00", "dlm_acc": "5.696e-01", "anc_acc": "5.483e-01", "epoch": 0.03408} {"step": 17045, "loss": 1.2325, "grad_norm": "3.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.480e-01", "anc_acc": "5.287e-01", "epoch": 0.03409} {"step": 17050, "loss": 1.3771, "grad_norm": "6.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.866e+00", "anc_loss": "1.924e+00", "dlm_acc": "4.172e-01", "anc_acc": "4.059e-01", "epoch": 0.0341} {"step": 17055, "loss": 1.4326, "grad_norm": "4.109e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.919e+00", "anc_loss": "1.992e+00", "dlm_acc": "3.999e-01", "anc_acc": "3.885e-01", "epoch": 0.03411} {"step": 17060, "loss": 1.1675, "grad_norm": "7.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.518e-01", "anc_acc": "5.309e-01", "epoch": 0.03412} {"step": 17065, "loss": 1.274, "grad_norm": "3.516e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.329e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.427e-01", "anc_acc": "5.185e-01", "epoch": 0.03413} {"step": 17070, "loss": 1.3831, "grad_norm": "4.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.467e+00", "dlm_acc": "5.161e-01", "anc_acc": "4.982e-01", "epoch": 0.03414} {"step": 17075, "loss": 1.3614, "grad_norm": "4.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.363e+00", "dlm_acc": "4.139e-01", "anc_acc": "4.199e-01", "epoch": 0.03415} {"step": 17080, "loss": 1.2455, "grad_norm": "5.316e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.041e+00", "dlm_acc": "4.063e-01", "anc_acc": "4.043e-01", "epoch": 0.03416} {"step": 17085, "loss": 1.0695, "grad_norm": "1.226e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.491e+00", "dlm_acc": "4.916e-01", "anc_acc": "4.771e-01", "epoch": 0.03417} {"step": 17090, "loss": 0.9607, "grad_norm": "2.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.060e+00", "dlm_acc": "4.311e-01", "anc_acc": "4.201e-01", "epoch": 0.03418} {"step": 17095, "loss": 1.4657, "grad_norm": "3.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.605e+00", "anc_loss": "1.699e+00", "dlm_acc": "5.286e-01", "anc_acc": "5.083e-01", "epoch": 0.03419} {"step": 17100, "loss": 1.4048, "grad_norm": "6.602e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.408e+00", "anc_loss": "1.470e+00", "dlm_acc": "5.364e-01", "anc_acc": "5.226e-01", "epoch": 0.0342} {"step": 17105, "loss": 1.8802, "grad_norm": "6.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.209e+00", "dlm_acc": "5.772e-01", "anc_acc": "5.619e-01", "epoch": 0.03421} {"step": 17110, "loss": 1.4573, "grad_norm": "2.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.038e-01", "anc_acc": "4.859e-01", "epoch": 0.03422} {"step": 17115, "loss": 1.2287, "grad_norm": "3.462e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.581e+00", "anc_loss": "1.650e+00", "dlm_acc": "4.684e-01", "anc_acc": "4.517e-01", "epoch": 0.03423} {"step": 17120, "loss": 1.4955, "grad_norm": "3.590e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.570e+00", "anc_loss": "1.672e+00", "dlm_acc": "5.078e-01", "anc_acc": "4.875e-01", "epoch": 0.03424} {"step": 17125, "loss": 1.4189, "grad_norm": "2.629e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.583e+00", "dlm_acc": "5.091e-01", "anc_acc": "4.868e-01", "epoch": 0.03425} {"step": 17130, "loss": 1.3453, "grad_norm": "4.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.764e-01", "anc_acc": "5.601e-01", "epoch": 0.03426} {"step": 17135, "loss": 1.1299, "grad_norm": "3.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.223e+00", "dlm_acc": "6.113e-01", "anc_acc": "5.883e-01", "epoch": 0.03427} {"step": 17140, "loss": 1.0112, "grad_norm": "3.197e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.977e-01", "anc_loss": "8.621e-01", "dlm_acc": "5.804e-01", "anc_acc": "5.586e-01", "epoch": 0.03428} {"step": 17145, "loss": 1.4606, "grad_norm": "3.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.230e+00", "dlm_acc": "6.087e-01", "anc_acc": "5.950e-01", "epoch": 0.03429} {"step": 17150, "loss": 1.6583, "grad_norm": "6.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.292e+00", "dlm_acc": "4.654e-01", "anc_acc": "4.486e-01", "epoch": 0.0343} {"step": 17155, "loss": 1.1722, "grad_norm": "1.725e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.112e+00", "dlm_acc": "6.342e-01", "anc_acc": "6.135e-01", "epoch": 0.03431} {"step": 17160, "loss": 0.9979, "grad_norm": "3.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.172e+00", "dlm_acc": "5.848e-01", "anc_acc": "5.668e-01", "epoch": 0.03432} {"step": 17165, "loss": 1.227, "grad_norm": "2.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.250e+00", "anc_loss": "1.347e+00", "dlm_acc": "5.767e-01", "anc_acc": "5.556e-01", "epoch": 0.03433} {"step": 17170, "loss": 1.2188, "grad_norm": "3.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.087e+00", "dlm_acc": "6.492e-01", "anc_acc": "6.355e-01", "epoch": 0.03434} {"step": 17175, "loss": 1.1285, "grad_norm": "5.211e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.096e-01", "anc_loss": "9.965e-01", "dlm_acc": "6.744e-01", "anc_acc": "6.527e-01", "epoch": 0.03435} {"step": 17180, "loss": 1.0921, "grad_norm": "3.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.228e+00", "dlm_acc": "5.923e-01", "anc_acc": "5.704e-01", "epoch": 0.03436} {"step": 17185, "loss": 0.9537, "grad_norm": "2.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.062e-01", "anc_loss": "9.516e-01", "dlm_acc": "5.737e-01", "anc_acc": "5.645e-01", "epoch": 0.03437} {"step": 17190, "loss": 1.1245, "grad_norm": "2.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.086e-01", "anc_loss": "7.125e-01", "dlm_acc": "5.609e-01", "anc_acc": "5.609e-01", "epoch": 0.03438} {"step": 17195, "loss": 0.7933, "grad_norm": "2.672e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.543e-01", "anc_loss": "5.570e-01", "dlm_acc": "6.022e-01", "anc_acc": "6.012e-01", "epoch": 0.03439} {"step": 17200, "loss": 1.3938, "grad_norm": "2.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.780e-01", "anc_acc": "5.607e-01", "epoch": 0.0344} {"step": 17205, "loss": 1.2275, "grad_norm": "3.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.278e+00", "dlm_acc": "6.095e-01", "anc_acc": "5.954e-01", "epoch": 0.03441} {"step": 17210, "loss": 1.0922, "grad_norm": "3.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.241e-01", "anc_loss": "9.951e-01", "dlm_acc": "6.515e-01", "anc_acc": "6.355e-01", "epoch": 0.03442} {"step": 17215, "loss": 1.2604, "grad_norm": "3.470e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.413e-01", "anc_loss": "4.758e-01", "dlm_acc": "8.238e-01", "anc_acc": "8.094e-01", "epoch": 0.03443} {"step": 17220, "loss": 1.3135, "grad_norm": "6.122e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.059e-02", "anc_loss": "5.420e-02", "dlm_acc": "9.778e-01", "anc_acc": "9.618e-01", "epoch": 0.03444} {"step": 17225, "loss": 1.7289, "grad_norm": "4.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.605e-01", "anc_loss": "4.127e-01", "dlm_acc": "8.759e-01", "anc_acc": "8.478e-01", "epoch": 0.03445} {"step": 17230, "loss": 1.6074, "grad_norm": "4.099e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.119e+00", "dlm_acc": "6.291e-01", "anc_acc": "6.162e-01", "epoch": 0.03446} {"step": 17235, "loss": 1.5435, "grad_norm": "4.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.507e+00", "anc_loss": "1.566e+00", "dlm_acc": "4.169e-01", "anc_acc": "4.039e-01", "epoch": 0.03447} {"step": 17240, "loss": 0.8849, "grad_norm": "2.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.969e-01", "anc_loss": "9.555e-01", "dlm_acc": "5.364e-01", "anc_acc": "5.236e-01", "epoch": 0.03448} {"step": 17245, "loss": 1.5746, "grad_norm": "3.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.211e+00", "dlm_acc": "6.260e-01", "anc_acc": "6.028e-01", "epoch": 0.03449} {"step": 17250, "loss": 1.1328, "grad_norm": "2.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.274e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.267e-01", "epoch": 0.0345} {"step": 17255, "loss": 1.0744, "grad_norm": "2.187e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.773e-01", "anc_loss": "8.602e-01", "dlm_acc": "6.860e-01", "anc_acc": "6.629e-01", "epoch": 0.03451} {"step": 17260, "loss": 0.8204, "grad_norm": "2.744e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.537e-01", "anc_loss": "1.026e+00", "dlm_acc": "6.514e-01", "anc_acc": "6.337e-01", "epoch": 0.03452} {"step": 17265, "loss": 1.5048, "grad_norm": "3.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.197e-01", "anc_acc": "6.034e-01", "epoch": 0.03453} {"step": 17270, "loss": 1.3743, "grad_norm": "3.171e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.489e+00", "anc_loss": "1.582e+00", "dlm_acc": "4.972e-01", "anc_acc": "4.773e-01", "epoch": 0.03454} {"step": 17275, "loss": 1.6462, "grad_norm": "2.798e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.507e+00", "anc_loss": "1.605e+00", "dlm_acc": "5.334e-01", "anc_acc": "5.141e-01", "epoch": 0.03455} {"step": 17280, "loss": 1.2593, "grad_norm": "3.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.606e-01", "anc_acc": "5.427e-01", "epoch": 0.03456} {"step": 17285, "loss": 0.9187, "grad_norm": "3.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.190e+00", "dlm_acc": "5.787e-01", "anc_acc": "5.600e-01", "epoch": 0.03457} {"step": 17290, "loss": 1.3847, "grad_norm": "6.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.279e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.670e-01", "anc_acc": "5.441e-01", "epoch": 0.03458} {"step": 17295, "loss": 1.2055, "grad_norm": "3.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.343e+00", "dlm_acc": "5.550e-01", "anc_acc": "5.370e-01", "epoch": 0.03459} {"step": 17300, "loss": 1.4141, "grad_norm": "2.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.358e+00", "anc_loss": "1.454e+00", "dlm_acc": "5.704e-01", "anc_acc": "5.494e-01", "epoch": 0.0346} {"step": 17305, "loss": 1.1079, "grad_norm": "2.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.445e-01", "anc_loss": "1.050e+00", "dlm_acc": "6.427e-01", "anc_acc": "6.181e-01", "epoch": 0.03461} {"step": 17310, "loss": 2.1446, "grad_norm": "4.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.161e+00", "anc_loss": "2.275e+00", "dlm_acc": "4.371e-01", "anc_acc": "4.178e-01", "epoch": 0.03462} {"step": 17315, "loss": 1.2769, "grad_norm": "2.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.889e-01", "anc_acc": "5.695e-01", "epoch": 0.03463} {"step": 17320, "loss": 1.2302, "grad_norm": "2.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.746e-01", "anc_loss": "1.059e+00", "dlm_acc": "6.372e-01", "anc_acc": "6.131e-01", "epoch": 0.03464} {"step": 17325, "loss": 1.1682, "grad_norm": "3.034e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.312e-01", "anc_acc": "5.124e-01", "epoch": 0.03465} {"step": 17330, "loss": 1.6482, "grad_norm": "2.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.566e+00", "anc_loss": "1.663e+00", "dlm_acc": "5.052e-01", "anc_acc": "4.843e-01", "epoch": 0.03466} {"step": 17335, "loss": 1.334, "grad_norm": "1.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.177e+00", "dlm_acc": "6.088e-01", "anc_acc": "5.850e-01", "epoch": 0.03467} {"step": 17340, "loss": 1.3815, "grad_norm": "4.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.656e+00", "anc_loss": "1.688e+00", "dlm_acc": "4.318e-01", "anc_acc": "4.250e-01", "epoch": 0.03468} {"step": 17345, "loss": 1.3958, "grad_norm": "3.403e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.756e-01", "anc_acc": "5.497e-01", "epoch": 0.03469} {"step": 17350, "loss": 1.4848, "grad_norm": "3.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.262e-01", "epoch": 0.0347} {"step": 17355, "loss": 1.2728, "grad_norm": "2.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.323e+00", "dlm_acc": "5.642e-01", "anc_acc": "5.471e-01", "epoch": 0.03471} {"step": 17360, "loss": 1.0657, "grad_norm": "3.160e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.113e+00", "dlm_acc": "5.809e-01", "anc_acc": "5.538e-01", "epoch": 0.03472} {"step": 17365, "loss": 1.5579, "grad_norm": "2.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.497e+00", "dlm_acc": "4.671e-01", "anc_acc": "4.461e-01", "epoch": 0.03473} {"step": 17370, "loss": 1.4007, "grad_norm": "3.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.551e+00", "dlm_acc": "5.174e-01", "anc_acc": "4.917e-01", "epoch": 0.03474} {"step": 17375, "loss": 1.449, "grad_norm": "3.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.598e+00", "dlm_acc": "4.657e-01", "anc_acc": "4.440e-01", "epoch": 0.03475} {"step": 17380, "loss": 1.4538, "grad_norm": "3.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.751e+00", "anc_loss": "1.822e+00", "dlm_acc": "4.286e-01", "anc_acc": "4.147e-01", "epoch": 0.03476} {"step": 17385, "loss": 1.595, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.682e-01", "anc_acc": "5.502e-01", "epoch": 0.03477} {"step": 17390, "loss": 0.9335, "grad_norm": "3.141e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.141e+00", "dlm_acc": "5.872e-01", "anc_acc": "5.591e-01", "epoch": 0.03478} {"step": 17395, "loss": 1.5501, "grad_norm": "4.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.678e+00", "anc_loss": "1.773e+00", "dlm_acc": "4.916e-01", "anc_acc": "4.718e-01", "epoch": 0.03479} {"step": 17400, "loss": 1.1055, "grad_norm": "3.616e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.355e-01", "anc_loss": "8.258e-01", "dlm_acc": "6.435e-01", "anc_acc": "6.258e-01", "epoch": 0.0348} {"step": 17405, "loss": 1.3235, "grad_norm": "4.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.529e-01", "anc_loss": "8.363e-01", "dlm_acc": "6.601e-01", "anc_acc": "6.428e-01", "epoch": 0.03481} {"step": 17410, "loss": 1.4341, "grad_norm": "5.538e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.492e+00", "dlm_acc": "5.124e-01", "anc_acc": "4.884e-01", "epoch": 0.03482} {"step": 17415, "loss": 1.1096, "grad_norm": "2.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.812e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.151e-01", "anc_acc": "5.899e-01", "epoch": 0.03483} {"step": 17420, "loss": 1.3152, "grad_norm": "3.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.388e+00", "anc_loss": "1.467e+00", "dlm_acc": "5.071e-01", "anc_acc": "4.897e-01", "epoch": 0.03484} {"step": 17425, "loss": 1.493, "grad_norm": "6.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.154e+00", "dlm_acc": "6.035e-01", "anc_acc": "5.721e-01", "epoch": 0.03485} {"step": 17430, "loss": 1.3226, "grad_norm": "2.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.597e+00", "anc_loss": "1.668e+00", "dlm_acc": "4.587e-01", "anc_acc": "4.413e-01", "epoch": 0.03486} {"step": 17435, "loss": 1.4164, "grad_norm": "7.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.006e+00", "anc_loss": "2.071e+00", "dlm_acc": "3.401e-01", "anc_acc": "3.221e-01", "epoch": 0.03487} {"step": 17440, "loss": 1.4786, "grad_norm": "3.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.706e+00", "anc_loss": "2.716e+00", "dlm_acc": "3.530e-02", "anc_acc": "3.439e-02", "epoch": 0.03488} {"step": 17445, "loss": 1.4377, "grad_norm": "2.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.149e+00", "anc_loss": "2.203e+00", "dlm_acc": "2.362e-01", "anc_acc": "2.253e-01", "epoch": 0.03489} {"step": 17450, "loss": 1.3809, "grad_norm": "4.230e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.400e+00", "dlm_acc": "4.810e-01", "anc_acc": "4.654e-01", "epoch": 0.0349} {"step": 17455, "loss": 1.4632, "grad_norm": "4.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.280e-01", "anc_acc": "5.068e-01", "epoch": 0.03491} {"step": 17460, "loss": 1.3255, "grad_norm": "4.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.469e-01", "anc_loss": "1.056e+00", "dlm_acc": "6.716e-01", "anc_acc": "6.419e-01", "epoch": 0.03492} {"step": 17465, "loss": 1.2124, "grad_norm": "2.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.197e+00", "anc_loss": "1.254e+00", "dlm_acc": "4.497e-01", "anc_acc": "4.331e-01", "epoch": 0.03493} {"step": 17470, "loss": 1.0083, "grad_norm": "2.424e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.877e-01", "anc_loss": "6.309e-01", "dlm_acc": "7.039e-01", "anc_acc": "6.886e-01", "epoch": 0.03494} {"step": 17475, "loss": 1.3235, "grad_norm": "6.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.668e-01", "anc_loss": "9.527e-01", "dlm_acc": "6.847e-01", "anc_acc": "6.623e-01", "epoch": 0.03495} {"step": 17480, "loss": 1.1109, "grad_norm": "3.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.750e-01", "anc_loss": "7.570e-01", "dlm_acc": "7.103e-01", "anc_acc": "6.923e-01", "epoch": 0.03496} {"step": 17485, "loss": 1.478, "grad_norm": "3.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.552e+00", "dlm_acc": "4.709e-01", "anc_acc": "4.463e-01", "epoch": 0.03497} {"step": 17490, "loss": 1.4859, "grad_norm": "3.778e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.431e+00", "anc_loss": "1.519e+00", "dlm_acc": "4.387e-01", "anc_acc": "4.139e-01", "epoch": 0.03498} {"step": 17495, "loss": 1.0488, "grad_norm": "2.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.422e-01", "anc_loss": "1.031e+00", "dlm_acc": "6.334e-01", "anc_acc": "6.137e-01", "epoch": 0.03499} {"step": 17500, "loss": 1.2819, "grad_norm": "6.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.798e-01", "anc_acc": "5.581e-01", "epoch": 0.035} {"step": 17505, "loss": 1.2972, "grad_norm": "3.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.082e+00", "dlm_acc": "6.056e-01", "anc_acc": "5.880e-01", "epoch": 0.03501} {"step": 17510, "loss": 1.4825, "grad_norm": "6.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.648e+00", "dlm_acc": "4.483e-01", "anc_acc": "4.301e-01", "epoch": 0.03502} {"step": 17515, "loss": 1.3604, "grad_norm": "2.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.417e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.249e-01", "epoch": 0.03503} {"step": 17520, "loss": 1.4853, "grad_norm": "3.653e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.474e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.202e-01", "anc_acc": "5.023e-01", "epoch": 0.03504} {"step": 17525, "loss": 1.2887, "grad_norm": "1.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.633e-01", "anc_acc": "5.468e-01", "epoch": 0.03505} {"step": 17530, "loss": 1.3899, "grad_norm": "2.899e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.313e-01", "anc_loss": "8.759e-01", "dlm_acc": "7.133e-01", "anc_acc": "7.031e-01", "epoch": 0.03506} {"step": 17535, "loss": 1.1795, "grad_norm": "2.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.969e-01", "anc_loss": "8.454e-01", "dlm_acc": "7.257e-01", "anc_acc": "7.147e-01", "epoch": 0.03507} {"step": 17540, "loss": 1.0443, "grad_norm": "4.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.445e-01", "anc_loss": "1.021e+00", "dlm_acc": "6.322e-01", "anc_acc": "6.148e-01", "epoch": 0.03508} {"step": 17545, "loss": 1.2281, "grad_norm": "4.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.232e+00", "dlm_acc": "6.276e-01", "anc_acc": "6.028e-01", "epoch": 0.03509} {"step": 17550, "loss": 1.326, "grad_norm": "2.462e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.479e+00", "anc_loss": "1.566e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.935e-01", "epoch": 0.0351} {"step": 17555, "loss": 1.1404, "grad_norm": "2.951e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.268e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.374e-01", "anc_acc": "5.201e-01", "epoch": 0.03511} {"step": 17560, "loss": 1.4807, "grad_norm": "9.834e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.952e-01", "anc_acc": "5.813e-01", "epoch": 0.03512} {"step": 17565, "loss": 0.9903, "grad_norm": "2.353e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.875e-01", "anc_loss": "4.133e-01", "dlm_acc": "8.138e-01", "anc_acc": "8.082e-01", "epoch": 0.03513} {"step": 17570, "loss": 1.2963, "grad_norm": "3.141e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.290e+00", "dlm_acc": "4.458e-01", "anc_acc": "4.357e-01", "epoch": 0.03514} {"step": 17575, "loss": 1.7574, "grad_norm": "2.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.424e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.801e-01", "anc_acc": "5.659e-01", "epoch": 0.03515} {"step": 17580, "loss": 1.4282, "grad_norm": "3.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.459e+00", "dlm_acc": "4.935e-01", "anc_acc": "4.739e-01", "epoch": 0.03516} {"step": 17585, "loss": 1.7222, "grad_norm": "3.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.738e+00", "anc_loss": "1.858e+00", "dlm_acc": "4.772e-01", "anc_acc": "4.584e-01", "epoch": 0.03517} {"step": 17590, "loss": 1.1975, "grad_norm": "2.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.191e-01", "anc_acc": "4.971e-01", "epoch": 0.03518} {"step": 17595, "loss": 1.3725, "grad_norm": "3.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.133e+00", "dlm_acc": "6.431e-01", "anc_acc": "6.167e-01", "epoch": 0.03519} {"step": 17600, "loss": 1.3906, "grad_norm": "6.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.214e+00", "anc_loss": "1.307e+00", "dlm_acc": "5.960e-01", "anc_acc": "5.761e-01", "epoch": 0.0352} {"step": 17605, "loss": 1.346, "grad_norm": "3.366e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.655e-01", "anc_acc": "5.454e-01", "epoch": 0.03521} {"step": 17610, "loss": 1.5042, "grad_norm": "3.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.738e+00", "anc_loss": "1.833e+00", "dlm_acc": "4.872e-01", "anc_acc": "4.685e-01", "epoch": 0.03522} {"step": 17615, "loss": 1.1352, "grad_norm": "2.217e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.448e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.021e-01", "anc_acc": "4.856e-01", "epoch": 0.03523} {"step": 17620, "loss": 1.2456, "grad_norm": "2.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.907e-01", "anc_loss": "1.051e+00", "dlm_acc": "7.041e-01", "anc_acc": "6.916e-01", "epoch": 0.03524} {"step": 17625, "loss": 0.9697, "grad_norm": "2.657e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.729e-01", "anc_loss": "5.261e-01", "dlm_acc": "7.952e-01", "anc_acc": "7.779e-01", "epoch": 0.03525} {"step": 17630, "loss": 1.405, "grad_norm": "4.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.551e+00", "anc_loss": "1.625e+00", "dlm_acc": "4.443e-01", "anc_acc": "4.303e-01", "epoch": 0.03526} {"step": 17635, "loss": 1.1257, "grad_norm": "3.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.457e+00", "anc_loss": "1.522e+00", "dlm_acc": "4.935e-01", "anc_acc": "4.764e-01", "epoch": 0.03527} {"step": 17640, "loss": 1.1849, "grad_norm": "5.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.423e-01", "anc_acc": "5.218e-01", "epoch": 0.03528} {"step": 17645, "loss": 1.1293, "grad_norm": "2.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.283e-01", "anc_loss": "6.412e-01", "dlm_acc": "7.805e-01", "anc_acc": "7.552e-01", "epoch": 0.03529} {"step": 17650, "loss": 1.1306, "grad_norm": "2.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.325e+00", "anc_loss": "1.403e+00", "dlm_acc": "5.713e-01", "anc_acc": "5.516e-01", "epoch": 0.0353} {"step": 17655, "loss": 0.8096, "grad_norm": "2.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.226e+00", "dlm_acc": "5.829e-01", "anc_acc": "5.628e-01", "epoch": 0.03531} {"step": 17660, "loss": 0.8752, "grad_norm": "2.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.597e+00", "anc_loss": "1.700e+00", "dlm_acc": "5.030e-01", "anc_acc": "4.837e-01", "epoch": 0.03532} {"step": 17665, "loss": 1.0917, "grad_norm": "2.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.146e+00", "anc_loss": "1.233e+00", "dlm_acc": "6.276e-01", "anc_acc": "6.094e-01", "epoch": 0.03533} {"step": 17670, "loss": 1.0627, "grad_norm": "3.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.535e+00", "anc_loss": "1.629e+00", "dlm_acc": "4.864e-01", "anc_acc": "4.675e-01", "epoch": 0.03534} {"step": 17675, "loss": 1.2311, "grad_norm": "3.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.633e+00", "anc_loss": "1.733e+00", "dlm_acc": "5.030e-01", "anc_acc": "4.861e-01", "epoch": 0.03535} {"step": 17680, "loss": 1.3709, "grad_norm": "2.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.613e+00", "anc_loss": "1.714e+00", "dlm_acc": "5.093e-01", "anc_acc": "4.880e-01", "epoch": 0.03536} {"step": 17685, "loss": 0.8411, "grad_norm": "3.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.271e-01", "anc_acc": "6.055e-01", "epoch": 0.03537} {"step": 17690, "loss": 1.444, "grad_norm": "5.234e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.642e-01", "anc_acc": "5.429e-01", "epoch": 0.03538} {"step": 17695, "loss": 1.2579, "grad_norm": "4.006e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.299e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.651e-01", "anc_acc": "5.458e-01", "epoch": 0.03539} {"step": 17700, "loss": 1.3045, "grad_norm": "4.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.269e+00", "dlm_acc": "6.093e-01", "anc_acc": "5.891e-01", "epoch": 0.0354} {"step": 17705, "loss": 1.4182, "grad_norm": "3.291e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.728e+00", "dlm_acc": "4.959e-01", "anc_acc": "4.738e-01", "epoch": 0.03541} {"step": 17710, "loss": 1.3214, "grad_norm": "2.873e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.381e+00", "dlm_acc": "6.016e-01", "anc_acc": "5.845e-01", "epoch": 0.03542} {"step": 17715, "loss": 1.3713, "grad_norm": "4.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.553e+00", "dlm_acc": "5.312e-01", "anc_acc": "5.101e-01", "epoch": 0.03543} {"step": 17720, "loss": 1.0696, "grad_norm": "2.259e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.412e+00", "anc_loss": "1.509e+00", "dlm_acc": "5.561e-01", "anc_acc": "5.381e-01", "epoch": 0.03544} {"step": 17725, "loss": 1.0245, "grad_norm": "2.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.399e+00", "anc_loss": "1.501e+00", "dlm_acc": "5.579e-01", "anc_acc": "5.366e-01", "epoch": 0.03545} {"step": 17730, "loss": 1.0681, "grad_norm": "5.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.269e+00", "anc_loss": "1.354e+00", "dlm_acc": "5.760e-01", "anc_acc": "5.555e-01", "epoch": 0.03546} {"step": 17735, "loss": 1.0935, "grad_norm": "1.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.672e-01", "anc_acc": "5.467e-01", "epoch": 0.03547} {"step": 17740, "loss": 0.8598, "grad_norm": "2.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.418e-01", "anc_acc": "5.246e-01", "epoch": 0.03548} {"step": 17745, "loss": 0.9606, "grad_norm": "3.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.514e+00", "dlm_acc": "5.473e-01", "anc_acc": "5.231e-01", "epoch": 0.03549} {"step": 17750, "loss": 1.2512, "grad_norm": "3.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.243e+00", "anc_loss": "1.347e+00", "dlm_acc": "5.828e-01", "anc_acc": "5.591e-01", "epoch": 0.0355} {"step": 17755, "loss": 1.7287, "grad_norm": "3.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.542e+00", "dlm_acc": "5.086e-01", "anc_acc": "4.907e-01", "epoch": 0.03551} {"step": 17760, "loss": 1.0221, "grad_norm": "2.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.517e+00", "anc_loss": "1.578e+00", "dlm_acc": "4.599e-01", "anc_acc": "4.480e-01", "epoch": 0.03552} {"step": 17765, "loss": 0.9822, "grad_norm": "2.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.602e-01", "anc_acc": "5.367e-01", "epoch": 0.03553} {"step": 17770, "loss": 0.8194, "grad_norm": "2.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.126e+00", "dlm_acc": "5.563e-01", "anc_acc": "5.377e-01", "epoch": 0.03554} {"step": 17775, "loss": 0.9521, "grad_norm": "2.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.152e+00", "dlm_acc": "5.687e-01", "anc_acc": "5.489e-01", "epoch": 0.03555} {"step": 17780, "loss": 1.2902, "grad_norm": "8.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.644e+00", "anc_loss": "1.728e+00", "dlm_acc": "4.922e-01", "anc_acc": "4.759e-01", "epoch": 0.03556} {"step": 17785, "loss": 1.0022, "grad_norm": "8.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.254e-01", "anc_acc": "5.032e-01", "epoch": 0.03557} {"step": 17790, "loss": 0.9489, "grad_norm": "1.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.548e+00", "anc_loss": "1.614e+00", "dlm_acc": "4.187e-01", "anc_acc": "4.014e-01", "epoch": 0.03558} {"step": 17795, "loss": 0.9661, "grad_norm": "2.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.486e+00", "anc_loss": "1.570e+00", "dlm_acc": "4.917e-01", "anc_acc": "4.731e-01", "epoch": 0.03559} {"step": 17800, "loss": 0.9437, "grad_norm": "3.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.511e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.255e-01", "epoch": 0.0356} {"step": 17805, "loss": 1.0846, "grad_norm": "5.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.435e-01", "anc_acc": "5.267e-01", "epoch": 0.03561} {"step": 17810, "loss": 0.8731, "grad_norm": "1.856e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.578e-01", "anc_acc": "5.399e-01", "epoch": 0.03562} {"step": 17815, "loss": 1.2226, "grad_norm": "2.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.828e+00", "anc_loss": "1.927e+00", "dlm_acc": "4.309e-01", "anc_acc": "4.153e-01", "epoch": 0.03563} {"step": 17820, "loss": 1.6068, "grad_norm": "6.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.659e+00", "anc_loss": "1.755e+00", "dlm_acc": "4.908e-01", "anc_acc": "4.740e-01", "epoch": 0.03564} {"step": 17825, "loss": 0.8762, "grad_norm": "1.759e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.666e-01", "anc_acc": "5.474e-01", "epoch": 0.03565} {"step": 17830, "loss": 1.1423, "grad_norm": "3.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.562e+00", "anc_loss": "1.652e+00", "dlm_acc": "4.814e-01", "anc_acc": "4.609e-01", "epoch": 0.03566} {"step": 17835, "loss": 1.0971, "grad_norm": "5.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.350e+00", "anc_loss": "1.443e+00", "dlm_acc": "5.203e-01", "anc_acc": "5.095e-01", "epoch": 0.03567} {"step": 17840, "loss": 1.0542, "grad_norm": "5.283e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.578e-01", "anc_loss": "8.152e-01", "dlm_acc": "6.377e-01", "anc_acc": "6.234e-01", "epoch": 0.03568} {"step": 17845, "loss": 0.9488, "grad_norm": "2.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.727e-01", "anc_loss": "1.050e+00", "dlm_acc": "6.147e-01", "anc_acc": "5.976e-01", "epoch": 0.03569} {"step": 17850, "loss": 0.8734, "grad_norm": "2.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.237e+00", "dlm_acc": "4.769e-01", "anc_acc": "4.658e-01", "epoch": 0.0357} {"step": 17855, "loss": 0.9333, "grad_norm": "2.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.006e+00", "anc_loss": "1.088e+00", "dlm_acc": "6.120e-01", "anc_acc": "5.933e-01", "epoch": 0.03571} {"step": 17860, "loss": 1.2309, "grad_norm": "2.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.535e+00", "anc_loss": "1.625e+00", "dlm_acc": "4.856e-01", "anc_acc": "4.654e-01", "epoch": 0.03572} {"step": 17865, "loss": 0.9381, "grad_norm": "2.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.669e-01", "anc_acc": "5.469e-01", "epoch": 0.03573} {"step": 17870, "loss": 0.9505, "grad_norm": "2.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.522e+00", "anc_loss": "1.616e+00", "dlm_acc": "5.099e-01", "anc_acc": "4.911e-01", "epoch": 0.03574} {"step": 17875, "loss": 0.971, "grad_norm": "5.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.627e+00", "anc_loss": "1.734e+00", "dlm_acc": "5.052e-01", "anc_acc": "4.826e-01", "epoch": 0.03575} {"step": 17880, "loss": 0.9692, "grad_norm": "2.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.558e-01", "anc_acc": "5.370e-01", "epoch": 0.03576} {"step": 17885, "loss": 0.9751, "grad_norm": "6.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.125e-01", "epoch": 0.03577} {"step": 17890, "loss": 0.7296, "grad_norm": "3.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.303e+00", "dlm_acc": "5.196e-01", "anc_acc": "5.042e-01", "epoch": 0.03578} {"step": 17895, "loss": 0.9906, "grad_norm": "3.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.508e-01", "epoch": 0.03579} {"step": 17900, "loss": 1.1503, "grad_norm": "4.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.457e+00", "dlm_acc": "5.223e-01", "anc_acc": "5.066e-01", "epoch": 0.0358} {"step": 17905, "loss": 0.9301, "grad_norm": "2.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.347e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.201e-01", "epoch": 0.03581} {"step": 17910, "loss": 1.2989, "grad_norm": "2.487e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.528e+00", "anc_loss": "1.605e+00", "dlm_acc": "4.746e-01", "anc_acc": "4.580e-01", "epoch": 0.03582} {"step": 17915, "loss": 1.1351, "grad_norm": "4.361e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.019e+00", "anc_loss": "1.097e+00", "dlm_acc": "5.756e-01", "anc_acc": "5.578e-01", "epoch": 0.03583} {"step": 17920, "loss": 1.5932, "grad_norm": "1.483e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.408e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.428e-01", "anc_acc": "5.177e-01", "epoch": 0.03584} {"step": 17925, "loss": 0.9045, "grad_norm": "3.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.145e+00", "dlm_acc": "5.714e-01", "anc_acc": "5.520e-01", "epoch": 0.03585} {"step": 17930, "loss": 1.2788, "grad_norm": "3.770e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.283e+00", "anc_loss": "1.376e+00", "dlm_acc": "5.289e-01", "anc_acc": "5.066e-01", "epoch": 0.03586} {"step": 17935, "loss": 0.9891, "grad_norm": "3.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.570e-01", "anc_loss": "9.219e-01", "dlm_acc": "5.868e-01", "anc_acc": "5.648e-01", "epoch": 0.03587} {"step": 17940, "loss": 1.5595, "grad_norm": "5.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.274e+00", "dlm_acc": "5.501e-01", "anc_acc": "5.339e-01", "epoch": 0.03588} {"step": 17945, "loss": 1.0789, "grad_norm": "1.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.301e-01", "anc_loss": "8.852e-01", "dlm_acc": "6.397e-01", "anc_acc": "6.232e-01", "epoch": 0.03589} {"step": 17950, "loss": 1.3673, "grad_norm": "3.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.474e+00", "dlm_acc": "5.760e-01", "anc_acc": "5.609e-01", "epoch": 0.0359} {"step": 17955, "loss": 1.093, "grad_norm": "4.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.780e-01", "anc_loss": "6.155e-01", "dlm_acc": "7.646e-01", "anc_acc": "7.541e-01", "epoch": 0.03591} {"step": 17960, "loss": 1.1945, "grad_norm": "2.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.750e-01", "anc_loss": "9.441e-01", "dlm_acc": "6.285e-01", "anc_acc": "6.085e-01", "epoch": 0.03592} {"step": 17965, "loss": 1.096, "grad_norm": "4.110e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.933e-01", "anc_loss": "7.396e-01", "dlm_acc": "6.278e-01", "anc_acc": "6.144e-01", "epoch": 0.03593} {"step": 17970, "loss": 1.2333, "grad_norm": "2.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.281e-01", "anc_loss": "9.805e-01", "dlm_acc": "5.331e-01", "anc_acc": "5.175e-01", "epoch": 0.03594} {"step": 17975, "loss": 1.5359, "grad_norm": "4.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e+00", "anc_loss": "1.500e+00", "dlm_acc": "5.683e-01", "anc_acc": "5.460e-01", "epoch": 0.03595} {"step": 17980, "loss": 0.9752, "grad_norm": "3.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.551e-01", "anc_loss": "1.003e+00", "dlm_acc": "6.637e-01", "anc_acc": "6.552e-01", "epoch": 0.03596} {"step": 17985, "loss": 1.3905, "grad_norm": "4.731e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.318e+00", "dlm_acc": "5.492e-01", "anc_acc": "5.316e-01", "epoch": 0.03597} {"step": 17990, "loss": 1.1959, "grad_norm": "3.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.135e+00", "dlm_acc": "5.022e-01", "anc_acc": "4.862e-01", "epoch": 0.03598} {"step": 17995, "loss": 1.2355, "grad_norm": "3.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.237e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.350e-01", "epoch": 0.03599} {"step": 18000, "loss": 1.5008, "grad_norm": "5.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.335e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.728e-01", "anc_acc": "5.556e-01", "epoch": 0.036} {"step": 18005, "loss": 1.26, "grad_norm": "4.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.523e-01", "anc_loss": "6.789e-01", "dlm_acc": "5.466e-01", "anc_acc": "5.320e-01", "epoch": 0.03601} {"step": 18010, "loss": 1.1911, "grad_norm": "3.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.145e+00", "dlm_acc": "5.000e-01", "anc_acc": "4.876e-01", "epoch": 0.03602} {"step": 18015, "loss": 1.5802, "grad_norm": "4.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.070e-01", "anc_loss": "8.172e-01", "dlm_acc": "5.203e-01", "anc_acc": "5.165e-01", "epoch": 0.03603} {"step": 18020, "loss": 1.3768, "grad_norm": "4.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.281e-01", "anc_loss": "7.328e-01", "dlm_acc": "5.509e-01", "anc_acc": "5.483e-01", "epoch": 0.03604} {"step": 18025, "loss": 1.5877, "grad_norm": "5.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.578e-01", "anc_loss": "7.633e-01", "dlm_acc": "5.435e-01", "anc_acc": "5.425e-01", "epoch": 0.03605} {"step": 18030, "loss": 1.632, "grad_norm": "5.313e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.727e-01", "anc_loss": "6.758e-01", "dlm_acc": "5.578e-01", "anc_acc": "5.553e-01", "epoch": 0.03606} {"step": 18035, "loss": 1.4216, "grad_norm": "4.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.074e-01", "anc_loss": "6.109e-01", "dlm_acc": "5.927e-01", "anc_acc": "5.923e-01", "epoch": 0.03607} {"step": 18040, "loss": 1.0757, "grad_norm": "4.590e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.375e-01", "anc_loss": "7.094e-01", "dlm_acc": "6.535e-01", "anc_acc": "6.334e-01", "epoch": 0.03608} {"step": 18045, "loss": 1.2024, "grad_norm": "2.202e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.609e-01", "anc_loss": "7.523e-01", "dlm_acc": "6.967e-01", "anc_acc": "6.698e-01", "epoch": 0.03609} {"step": 18050, "loss": 0.9997, "grad_norm": "5.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.121e+00", "dlm_acc": "6.510e-01", "anc_acc": "6.334e-01", "epoch": 0.0361} {"step": 18055, "loss": 0.8641, "grad_norm": "1.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.090e-01", "anc_loss": "9.660e-01", "dlm_acc": "5.839e-01", "anc_acc": "5.684e-01", "epoch": 0.03611} {"step": 18060, "loss": 0.7131, "grad_norm": "3.067e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.250e-01", "anc_loss": "8.695e-01", "dlm_acc": "5.805e-01", "anc_acc": "5.661e-01", "epoch": 0.03612} {"step": 18065, "loss": 1.1194, "grad_norm": "7.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.477e-01", "anc_loss": "8.887e-01", "dlm_acc": "5.736e-01", "anc_acc": "5.587e-01", "epoch": 0.03613} {"step": 18070, "loss": 2.0051, "grad_norm": "5.458e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.895e+00", "anc_loss": "1.995e+00", "dlm_acc": "4.476e-01", "anc_acc": "4.302e-01", "epoch": 0.03614} {"step": 18075, "loss": 1.2758, "grad_norm": "3.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.544e-01", "anc_acc": "5.325e-01", "epoch": 0.03615} {"step": 18080, "loss": 1.3877, "grad_norm": "3.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.435e+00", "dlm_acc": "4.730e-01", "anc_acc": "4.567e-01", "epoch": 0.03616} {"step": 18085, "loss": 1.7096, "grad_norm": "4.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.497e-01", "anc_acc": "5.343e-01", "epoch": 0.03617} {"step": 18090, "loss": 1.659, "grad_norm": "2.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.602e+00", "dlm_acc": "5.396e-01", "anc_acc": "5.205e-01", "epoch": 0.03618} {"step": 18095, "loss": 1.6215, "grad_norm": "3.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.484e+00", "dlm_acc": "4.834e-01", "anc_acc": "4.655e-01", "epoch": 0.03619} {"step": 18100, "loss": 1.4881, "grad_norm": "4.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.329e+00", "dlm_acc": "5.431e-01", "anc_acc": "5.201e-01", "epoch": 0.0362} {"step": 18105, "loss": 0.9745, "grad_norm": "3.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.244e+00", "dlm_acc": "5.621e-01", "anc_acc": "5.345e-01", "epoch": 0.03621} {"step": 18110, "loss": 0.9728, "grad_norm": "3.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.516e-01", "anc_loss": "9.496e-01", "dlm_acc": "6.153e-01", "anc_acc": "5.741e-01", "epoch": 0.03622} {"step": 18115, "loss": 1.1454, "grad_norm": "5.623e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.642e+00", "dlm_acc": "5.168e-01", "anc_acc": "4.892e-01", "epoch": 0.03623} {"step": 18120, "loss": 1.0731, "grad_norm": "3.217e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.366e+00", "dlm_acc": "4.849e-01", "anc_acc": "4.679e-01", "epoch": 0.03624} {"step": 18125, "loss": 1.4348, "grad_norm": "5.892e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.610e+00", "anc_loss": "1.704e+00", "dlm_acc": "4.931e-01", "anc_acc": "4.747e-01", "epoch": 0.03625} {"step": 18130, "loss": 0.8028, "grad_norm": "5.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.586e-01", "anc_loss": "7.121e-01", "dlm_acc": "6.735e-01", "anc_acc": "6.597e-01", "epoch": 0.03626} {"step": 18135, "loss": 1.154, "grad_norm": "3.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.350e-01", "anc_acc": "5.196e-01", "epoch": 0.03627} {"step": 18140, "loss": 0.908, "grad_norm": "4.815e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.346e+00", "dlm_acc": "5.331e-01", "anc_acc": "5.121e-01", "epoch": 0.03628} {"step": 18145, "loss": 0.8376, "grad_norm": "3.211e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.770e-01", "anc_loss": "6.266e-01", "dlm_acc": "6.488e-01", "anc_acc": "6.327e-01", "epoch": 0.03629} {"step": 18150, "loss": 0.855, "grad_norm": "3.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.255e+00", "dlm_acc": "5.494e-01", "anc_acc": "5.312e-01", "epoch": 0.0363} {"step": 18155, "loss": 0.9456, "grad_norm": "3.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.465e-01", "anc_loss": "7.438e-01", "dlm_acc": "6.953e-01", "anc_acc": "6.748e-01", "epoch": 0.03631} {"step": 18160, "loss": 0.9959, "grad_norm": "2.896e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.949e-01", "anc_loss": "6.441e-01", "dlm_acc": "8.036e-01", "anc_acc": "7.627e-01", "epoch": 0.03632} {"step": 18165, "loss": 1.5007, "grad_norm": "3.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.405e+00", "anc_loss": "2.472e+00", "dlm_acc": "2.959e-01", "anc_acc": "2.843e-01", "epoch": 0.03633} {"step": 18170, "loss": 1.1211, "grad_norm": "4.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.041e+00", "anc_loss": "1.119e+00", "dlm_acc": "6.353e-01", "anc_acc": "6.146e-01", "epoch": 0.03634} {"step": 18175, "loss": 1.349, "grad_norm": "4.880e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.059e-01", "anc_loss": "9.758e-01", "dlm_acc": "5.466e-01", "anc_acc": "5.232e-01", "epoch": 0.03635} {"step": 18180, "loss": 1.1702, "grad_norm": "3.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.393e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.373e-01", "epoch": 0.03636} {"step": 18185, "loss": 1.1034, "grad_norm": "2.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.109e-01", "anc_loss": "9.938e-01", "dlm_acc": "5.427e-01", "anc_acc": "5.100e-01", "epoch": 0.03637} {"step": 18190, "loss": 1.0415, "grad_norm": "2.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.645e-01", "anc_loss": "1.060e+00", "dlm_acc": "6.543e-01", "anc_acc": "6.250e-01", "epoch": 0.03638} {"step": 18195, "loss": 1.0698, "grad_norm": "2.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.855e-01", "anc_acc": "5.724e-01", "epoch": 0.03639} {"step": 18200, "loss": 1.4337, "grad_norm": "6.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.473e+00", "dlm_acc": "4.788e-01", "anc_acc": "4.629e-01", "epoch": 0.0364} {"step": 18205, "loss": 1.4368, "grad_norm": "8.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.011e+00", "anc_loss": "2.033e+00", "dlm_acc": "3.315e-01", "anc_acc": "3.237e-01", "epoch": 0.03641} {"step": 18210, "loss": 1.2587, "grad_norm": "4.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.651e-01", "anc_acc": "5.432e-01", "epoch": 0.03642} {"step": 18215, "loss": 1.2504, "grad_norm": "7.434e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.691e+00", "anc_loss": "1.752e+00", "dlm_acc": "3.781e-01", "anc_acc": "3.631e-01", "epoch": 0.03643} {"step": 18220, "loss": 0.7873, "grad_norm": "1.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.260e+00", "anc_loss": "1.292e+00", "dlm_acc": "4.082e-01", "anc_acc": "4.010e-01", "epoch": 0.03644} {"step": 18225, "loss": 0.6477, "grad_norm": "2.486e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.297e-01", "anc_loss": "6.367e-01", "dlm_acc": "4.904e-01", "anc_acc": "4.862e-01", "epoch": 0.03645} {"step": 18230, "loss": 0.9105, "grad_norm": "5.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.063e-01", "anc_loss": "7.156e-01", "dlm_acc": "4.715e-01", "anc_acc": "4.659e-01", "epoch": 0.03646} {"step": 18235, "loss": 1.0472, "grad_norm": "2.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.793e-01", "anc_acc": "5.606e-01", "epoch": 0.03647} {"step": 18240, "loss": 1.3063, "grad_norm": "6.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.098e+00", "anc_loss": "2.159e+00", "dlm_acc": "3.256e-01", "anc_acc": "3.128e-01", "epoch": 0.03648} {"step": 18245, "loss": 1.2772, "grad_norm": "3.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.468e+00", "anc_loss": "1.556e+00", "dlm_acc": "4.914e-01", "anc_acc": "4.720e-01", "epoch": 0.03649} {"step": 18250, "loss": 1.1272, "grad_norm": "2.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.582e-01", "anc_loss": "9.398e-01", "dlm_acc": "7.087e-01", "anc_acc": "6.906e-01", "epoch": 0.0365} {"step": 18255, "loss": 1.4578, "grad_norm": "3.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.846e-01", "anc_acc": "5.643e-01", "epoch": 0.03651} {"step": 18260, "loss": 1.3272, "grad_norm": "3.732e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.501e-01", "anc_acc": "5.282e-01", "epoch": 0.03652} {"step": 18265, "loss": 1.6119, "grad_norm": "3.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.633e+00", "anc_loss": "1.731e+00", "dlm_acc": "4.986e-01", "anc_acc": "4.796e-01", "epoch": 0.03653} {"step": 18270, "loss": 1.1632, "grad_norm": "3.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.375e+00", "dlm_acc": "5.344e-01", "anc_acc": "5.149e-01", "epoch": 0.03654} {"step": 18275, "loss": 1.3722, "grad_norm": "3.049e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.056e+00", "anc_loss": "1.110e+00", "dlm_acc": "5.786e-01", "anc_acc": "5.648e-01", "epoch": 0.03655} {"step": 18280, "loss": 0.8216, "grad_norm": "2.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.109e-01", "anc_loss": "8.129e-01", "dlm_acc": "6.763e-01", "anc_acc": "6.399e-01", "epoch": 0.03656} {"step": 18285, "loss": 1.3931, "grad_norm": "5.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.547e-01", "anc_loss": "1.040e+00", "dlm_acc": "6.762e-01", "anc_acc": "6.612e-01", "epoch": 0.03657} {"step": 18290, "loss": 1.3987, "grad_norm": "6.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.540e+00", "anc_loss": "1.650e+00", "dlm_acc": "4.763e-01", "anc_acc": "4.561e-01", "epoch": 0.03658} {"step": 18295, "loss": 1.5797, "grad_norm": "4.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.220e+00", "anc_loss": "2.331e+00", "dlm_acc": "2.484e-01", "anc_acc": "2.300e-01", "epoch": 0.03659} {"step": 18300, "loss": 1.152, "grad_norm": "2.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.600e+00", "anc_loss": "1.721e+00", "dlm_acc": "3.391e-01", "anc_acc": "3.107e-01", "epoch": 0.0366} {"step": 18305, "loss": 1.2302, "grad_norm": "3.217e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.421e+00", "anc_loss": "1.502e+00", "dlm_acc": "3.996e-01", "anc_acc": "3.763e-01", "epoch": 0.03661} {"step": 18310, "loss": 1.2135, "grad_norm": "2.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.308e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.632e-01", "anc_acc": "5.445e-01", "epoch": 0.03662} {"step": 18315, "loss": 1.2172, "grad_norm": "2.640e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.113e+00", "dlm_acc": "5.869e-01", "anc_acc": "5.600e-01", "epoch": 0.03663} {"step": 18320, "loss": 1.3708, "grad_norm": "5.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.571e+00", "anc_loss": "1.629e+00", "dlm_acc": "3.843e-01", "anc_acc": "3.713e-01", "epoch": 0.03664} {"step": 18325, "loss": 1.2943, "grad_norm": "3.511e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.506e-01", "anc_acc": "5.283e-01", "epoch": 0.03665} {"step": 18330, "loss": 1.4831, "grad_norm": "2.734e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.179e+00", "dlm_acc": "6.295e-01", "anc_acc": "6.061e-01", "epoch": 0.03666} {"step": 18335, "loss": 1.5599, "grad_norm": "5.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.230e-01", "anc_acc": "5.020e-01", "epoch": 0.03667} {"step": 18340, "loss": 1.5153, "grad_norm": "2.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.534e+00", "anc_loss": "2.556e+00", "dlm_acc": "5.836e-02", "anc_acc": "5.716e-02", "epoch": 0.03668} {"step": 18345, "loss": 1.0952, "grad_norm": "1.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.332e-01", "anc_loss": "9.898e-01", "dlm_acc": "5.332e-01", "anc_acc": "5.157e-01", "epoch": 0.03669} {"step": 18350, "loss": 1.3698, "grad_norm": "3.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.112e+00", "anc_loss": "1.210e+00", "dlm_acc": "6.037e-01", "anc_acc": "5.760e-01", "epoch": 0.0367} {"step": 18355, "loss": 1.0844, "grad_norm": "4.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.413e+00", "dlm_acc": "4.874e-01", "anc_acc": "4.633e-01", "epoch": 0.03671} {"step": 18360, "loss": 1.0907, "grad_norm": "6.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.410e+00", "anc_loss": "1.503e+00", "dlm_acc": "4.928e-01", "anc_acc": "4.732e-01", "epoch": 0.03672} {"step": 18365, "loss": 1.5823, "grad_norm": "4.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.669e+00", "anc_loss": "1.769e+00", "dlm_acc": "4.429e-01", "anc_acc": "4.239e-01", "epoch": 0.03673} {"step": 18370, "loss": 1.2977, "grad_norm": "1.195e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.128e-01", "anc_acc": "4.955e-01", "epoch": 0.03674} {"step": 18375, "loss": 1.1394, "grad_norm": "4.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.487e+00", "dlm_acc": "5.122e-01", "anc_acc": "4.877e-01", "epoch": 0.03675} {"step": 18380, "loss": 0.9895, "grad_norm": "3.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.120e+00", "dlm_acc": "6.067e-01", "anc_acc": "5.816e-01", "epoch": 0.03676} {"step": 18385, "loss": 0.8362, "grad_norm": "3.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.153e+00", "anc_loss": "1.286e+00", "dlm_acc": "6.344e-01", "anc_acc": "6.088e-01", "epoch": 0.03677} {"step": 18390, "loss": 0.9637, "grad_norm": "1.883e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.954e-01", "anc_acc": "5.749e-01", "epoch": 0.03678} {"step": 18395, "loss": 0.9857, "grad_norm": "3.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.402e-01", "anc_loss": "1.028e+00", "dlm_acc": "6.670e-01", "anc_acc": "6.465e-01", "epoch": 0.03679} {"step": 18400, "loss": 0.9039, "grad_norm": "2.986e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.081e-01", "anc_acc": "4.841e-01", "epoch": 0.0368} {"step": 18405, "loss": 0.9783, "grad_norm": "1.911e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.688e-01", "anc_loss": "1.069e+00", "dlm_acc": "6.180e-01", "anc_acc": "5.910e-01", "epoch": 0.03681} {"step": 18410, "loss": 1.3032, "grad_norm": "2.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.608e+00", "dlm_acc": "4.429e-01", "anc_acc": "4.071e-01", "epoch": 0.03682} {"step": 18415, "loss": 1.1931, "grad_norm": "2.019e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e+00", "anc_loss": "1.240e+00", "dlm_acc": "6.169e-01", "anc_acc": "5.897e-01", "epoch": 0.03683} {"step": 18420, "loss": 1.0406, "grad_norm": "2.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.192e+00", "dlm_acc": "5.983e-01", "anc_acc": "5.799e-01", "epoch": 0.03684} {"step": 18425, "loss": 0.7626, "grad_norm": "3.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.184e-01", "anc_loss": "6.969e-01", "dlm_acc": "6.870e-01", "anc_acc": "6.575e-01", "epoch": 0.03685} {"step": 18430, "loss": 0.9659, "grad_norm": "3.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.543e-01", "anc_acc": "5.384e-01", "epoch": 0.03686} {"step": 18435, "loss": 1.0727, "grad_norm": "4.361e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.400e-01", "anc_loss": "9.080e-01", "dlm_acc": "5.912e-01", "anc_acc": "5.698e-01", "epoch": 0.03687} {"step": 18440, "loss": 1.2662, "grad_norm": "4.716e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.206e+00", "anc_loss": "1.346e+00", "dlm_acc": "5.737e-01", "anc_acc": "5.331e-01", "epoch": 0.03688} {"step": 18445, "loss": 1.2327, "grad_norm": "2.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.508e-01", "anc_loss": "9.703e-01", "dlm_acc": "3.745e-01", "anc_acc": "3.671e-01", "epoch": 0.03689} {"step": 18450, "loss": 0.7665, "grad_norm": "3.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.695e-01", "anc_loss": "6.773e-01", "dlm_acc": "4.244e-01", "anc_acc": "4.208e-01", "epoch": 0.0369} {"step": 18455, "loss": 0.9746, "grad_norm": "4.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.820e-01", "anc_loss": "7.883e-01", "dlm_acc": "3.915e-01", "anc_acc": "3.884e-01", "epoch": 0.03691} {"step": 18460, "loss": 0.7862, "grad_norm": "3.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.461e-01", "anc_loss": "7.547e-01", "dlm_acc": "4.005e-01", "anc_acc": "3.968e-01", "epoch": 0.03692} {"step": 18465, "loss": 1.0377, "grad_norm": "2.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.461e-01", "anc_loss": "7.562e-01", "dlm_acc": "4.233e-01", "anc_acc": "4.192e-01", "epoch": 0.03693} {"step": 18470, "loss": 1.0757, "grad_norm": "3.707e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.926e-01", "anc_loss": "7.004e-01", "dlm_acc": "4.276e-01", "anc_acc": "4.218e-01", "epoch": 0.03694} {"step": 18475, "loss": 1.1065, "grad_norm": "3.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.580e+00", "anc_loss": "1.697e+00", "dlm_acc": "5.066e-01", "anc_acc": "4.802e-01", "epoch": 0.03695} {"step": 18480, "loss": 0.8963, "grad_norm": "6.444e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.350e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.263e-01", "anc_acc": "5.072e-01", "epoch": 0.03696} {"step": 18485, "loss": 0.9778, "grad_norm": "4.848e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.365e-01", "anc_acc": "5.150e-01", "epoch": 0.03697} {"step": 18490, "loss": 0.8498, "grad_norm": "6.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.663e+00", "anc_loss": "1.758e+00", "dlm_acc": "4.772e-01", "anc_acc": "4.591e-01", "epoch": 0.03698} {"step": 18495, "loss": 0.9312, "grad_norm": "2.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.984e-01", "anc_loss": "1.101e+00", "dlm_acc": "5.959e-01", "anc_acc": "5.643e-01", "epoch": 0.03699} {"step": 18500, "loss": 1.6411, "grad_norm": "2.984e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.566e+00", "dlm_acc": "5.285e-01", "anc_acc": "5.071e-01", "epoch": 0.037} {"step": 18505, "loss": 1.8453, "grad_norm": "8.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.636e+00", "anc_loss": "1.698e+00", "dlm_acc": "4.417e-01", "anc_acc": "4.311e-01", "epoch": 0.03701} {"step": 18510, "loss": 1.2993, "grad_norm": "2.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.065e+00", "dlm_acc": "6.439e-01", "anc_acc": "6.256e-01", "epoch": 0.03702} {"step": 18515, "loss": 1.5702, "grad_norm": "3.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.611e+00", "dlm_acc": "4.874e-01", "anc_acc": "4.650e-01", "epoch": 0.03703} {"step": 18520, "loss": 1.3211, "grad_norm": "4.244e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.478e+00", "anc_loss": "1.595e+00", "dlm_acc": "4.636e-01", "anc_acc": "4.427e-01", "epoch": 0.03704} {"step": 18525, "loss": 1.1614, "grad_norm": "3.138e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.365e+00", "dlm_acc": "4.886e-01", "anc_acc": "4.634e-01", "epoch": 0.03705} {"step": 18530, "loss": 1.3552, "grad_norm": "3.067e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.151e+00", "anc_loss": "1.259e+00", "dlm_acc": "6.195e-01", "anc_acc": "5.981e-01", "epoch": 0.03706} {"step": 18535, "loss": 1.1024, "grad_norm": "3.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.245e+00", "dlm_acc": "5.834e-01", "anc_acc": "5.609e-01", "epoch": 0.03707} {"step": 18540, "loss": 1.0995, "grad_norm": "5.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.544e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.757e-01", "anc_acc": "4.560e-01", "epoch": 0.03708} {"step": 18545, "loss": 1.104, "grad_norm": "2.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.139e+00", "dlm_acc": "5.834e-01", "anc_acc": "5.639e-01", "epoch": 0.03709} {"step": 18550, "loss": 1.0591, "grad_norm": "3.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.597e+00", "dlm_acc": "4.988e-01", "anc_acc": "4.696e-01", "epoch": 0.0371} {"step": 18555, "loss": 1.5988, "grad_norm": "3.238e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.716e+00", "anc_loss": "1.808e+00", "dlm_acc": "5.040e-01", "anc_acc": "4.849e-01", "epoch": 0.03711} {"step": 18560, "loss": 1.4592, "grad_norm": "3.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.714e+00", "anc_loss": "1.819e+00", "dlm_acc": "4.631e-01", "anc_acc": "4.423e-01", "epoch": 0.03712} {"step": 18565, "loss": 1.1684, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.370e+00", "anc_loss": "1.468e+00", "dlm_acc": "5.577e-01", "anc_acc": "5.354e-01", "epoch": 0.03713} {"step": 18570, "loss": 1.4211, "grad_norm": "3.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.050e-01", "anc_acc": "4.840e-01", "epoch": 0.03714} {"step": 18575, "loss": 1.2688, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.448e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.189e-01", "anc_acc": "5.009e-01", "epoch": 0.03715} {"step": 18580, "loss": 1.2948, "grad_norm": "3.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.946e+00", "anc_loss": "2.014e+00", "dlm_acc": "3.730e-01", "anc_acc": "3.582e-01", "epoch": 0.03716} {"step": 18585, "loss": 1.3175, "grad_norm": "3.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.602e+00", "anc_loss": "1.712e+00", "dlm_acc": "5.013e-01", "anc_acc": "4.798e-01", "epoch": 0.03717} {"step": 18590, "loss": 1.211, "grad_norm": "3.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.197e+00", "anc_loss": "1.296e+00", "dlm_acc": "6.024e-01", "anc_acc": "5.812e-01", "epoch": 0.03718} {"step": 18595, "loss": 1.1065, "grad_norm": "3.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.293e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.444e-01", "epoch": 0.03719} {"step": 18600, "loss": 1.539, "grad_norm": "4.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.429e+00", "dlm_acc": "5.552e-01", "anc_acc": "5.350e-01", "epoch": 0.0372} {"step": 18605, "loss": 1.2545, "grad_norm": "4.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.198e+00", "dlm_acc": "6.199e-01", "anc_acc": "5.977e-01", "epoch": 0.03721} {"step": 18610, "loss": 1.3431, "grad_norm": "4.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.376e+00", "dlm_acc": "5.582e-01", "anc_acc": "5.362e-01", "epoch": 0.03722} {"step": 18615, "loss": 1.5543, "grad_norm": "1.987e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.404e+00", "anc_loss": "1.482e+00", "dlm_acc": "5.361e-01", "anc_acc": "5.184e-01", "epoch": 0.03723} {"step": 18620, "loss": 1.1324, "grad_norm": "1.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.218e+00", "dlm_acc": "5.615e-01", "anc_acc": "5.393e-01", "epoch": 0.03724} {"step": 18625, "loss": 1.8044, "grad_norm": "2.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.788e+00", "anc_loss": "1.891e+00", "dlm_acc": "4.871e-01", "anc_acc": "4.663e-01", "epoch": 0.03725} {"step": 18630, "loss": 1.5104, "grad_norm": "3.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.591e+00", "dlm_acc": "4.943e-01", "anc_acc": "4.772e-01", "epoch": 0.03726} {"step": 18635, "loss": 1.6131, "grad_norm": "3.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.514e+00", "dlm_acc": "5.222e-01", "anc_acc": "5.003e-01", "epoch": 0.03727} {"step": 18640, "loss": 1.334, "grad_norm": "3.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.479e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.068e-01", "anc_acc": "4.869e-01", "epoch": 0.03728} {"step": 18645, "loss": 1.4009, "grad_norm": "3.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.328e+00", "dlm_acc": "5.676e-01", "anc_acc": "5.526e-01", "epoch": 0.03729} {"step": 18650, "loss": 1.609, "grad_norm": "6.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.794e+00", "anc_loss": "1.886e+00", "dlm_acc": "4.907e-01", "anc_acc": "4.716e-01", "epoch": 0.0373} {"step": 18655, "loss": 1.3939, "grad_norm": "2.473e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.428e+00", "dlm_acc": "5.454e-01", "anc_acc": "5.284e-01", "epoch": 0.03731} {"step": 18660, "loss": 1.2328, "grad_norm": "4.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.299e+00", "anc_loss": "1.389e+00", "dlm_acc": "6.057e-01", "anc_acc": "5.899e-01", "epoch": 0.03732} {"step": 18665, "loss": 1.272, "grad_norm": "3.331e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.922e-01", "anc_loss": "6.297e-01", "dlm_acc": "8.074e-01", "anc_acc": "7.999e-01", "epoch": 0.03733} {"step": 18670, "loss": 1.3903, "grad_norm": "2.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.530e-01", "anc_acc": "5.372e-01", "epoch": 0.03734} {"step": 18675, "loss": 0.9034, "grad_norm": "1.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.068e+00", "anc_loss": "1.150e+00", "dlm_acc": "6.185e-01", "anc_acc": "5.998e-01", "epoch": 0.03735} {"step": 18680, "loss": 1.3616, "grad_norm": "4.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.493e+00", "anc_loss": "1.580e+00", "dlm_acc": "5.154e-01", "anc_acc": "4.963e-01", "epoch": 0.03736} {"step": 18685, "loss": 1.4163, "grad_norm": "3.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.304e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.458e-01", "anc_acc": "5.256e-01", "epoch": 0.03737} {"step": 18690, "loss": 2.0583, "grad_norm": "4.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.908e+00", "anc_loss": "2.027e+00", "dlm_acc": "4.435e-01", "anc_acc": "4.246e-01", "epoch": 0.03738} {"step": 18695, "loss": 1.9803, "grad_norm": "5.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.432e+00", "anc_loss": "1.537e+00", "dlm_acc": "5.787e-01", "anc_acc": "5.576e-01", "epoch": 0.03739} {"step": 18700, "loss": 1.5377, "grad_norm": "2.773e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.407e+00", "anc_loss": "1.505e+00", "dlm_acc": "5.260e-01", "anc_acc": "5.043e-01", "epoch": 0.0374} {"step": 18705, "loss": 1.5477, "grad_norm": "3.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.174e-01", "anc_acc": "4.982e-01", "epoch": 0.03741} {"step": 18710, "loss": 1.1054, "grad_norm": "2.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.073e+00", "dlm_acc": "5.549e-01", "anc_acc": "5.354e-01", "epoch": 0.03742} {"step": 18715, "loss": 0.9586, "grad_norm": "2.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.160e+00", "dlm_acc": "5.299e-01", "anc_acc": "5.140e-01", "epoch": 0.03743} {"step": 18720, "loss": 1.29, "grad_norm": "5.523e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.140e+00", "dlm_acc": "3.497e-01", "anc_acc": "3.490e-01", "epoch": 0.03744} {"step": 18725, "loss": 1.4122, "grad_norm": "4.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.467e+00", "anc_loss": "1.509e+00", "dlm_acc": "3.668e-01", "anc_acc": "3.571e-01", "epoch": 0.03745} {"step": 18730, "loss": 1.4152, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.356e-01", "anc_acc": "5.175e-01", "epoch": 0.03746} {"step": 18735, "loss": 1.3684, "grad_norm": "5.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.485e+00", "dlm_acc": "5.464e-01", "anc_acc": "5.290e-01", "epoch": 0.03747} {"step": 18740, "loss": 1.4218, "grad_norm": "3.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.494e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.303e-01", "epoch": 0.03748} {"step": 18745, "loss": 1.5296, "grad_norm": "7.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.594e-01", "anc_loss": "9.688e-01", "dlm_acc": "6.004e-01", "anc_acc": "5.835e-01", "epoch": 0.03749} {"step": 18750, "loss": 1.0177, "grad_norm": "1.183e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.852e-01", "anc_loss": "9.395e-01", "dlm_acc": "5.982e-01", "anc_acc": "5.914e-01", "epoch": 0.0375} {"step": 18755, "loss": 1.7399, "grad_norm": "4.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.407e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.379e-01", "anc_acc": "5.203e-01", "epoch": 0.03751} {"step": 18760, "loss": 1.2764, "grad_norm": "3.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.276e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.373e-01", "anc_acc": "5.171e-01", "epoch": 0.03752} {"step": 18765, "loss": 1.7974, "grad_norm": "4.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.766e+00", "anc_loss": "1.872e+00", "dlm_acc": "4.945e-01", "anc_acc": "4.742e-01", "epoch": 0.03753} {"step": 18770, "loss": 1.5885, "grad_norm": "4.957e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.536e+00", "dlm_acc": "4.810e-01", "anc_acc": "4.646e-01", "epoch": 0.03754} {"step": 18775, "loss": 1.3549, "grad_norm": "1.971e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.446e+00", "dlm_acc": "5.689e-01", "anc_acc": "5.519e-01", "epoch": 0.03755} {"step": 18780, "loss": 1.0582, "grad_norm": "3.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.857e-01", "anc_acc": "5.599e-01", "epoch": 0.03756} {"step": 18785, "loss": 1.5394, "grad_norm": "1.235e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.072e-01", "anc_acc": "4.924e-01", "epoch": 0.03757} {"step": 18790, "loss": 1.7669, "grad_norm": "5.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.619e+00", "anc_loss": "1.709e+00", "dlm_acc": "4.964e-01", "anc_acc": "4.776e-01", "epoch": 0.03758} {"step": 18795, "loss": 1.2667, "grad_norm": "2.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.389e+00", "dlm_acc": "5.421e-01", "anc_acc": "5.221e-01", "epoch": 0.03759} {"step": 18800, "loss": 1.4057, "grad_norm": "4.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.444e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.209e-01", "anc_acc": "4.995e-01", "epoch": 0.0376} {"step": 18805, "loss": 1.618, "grad_norm": "2.131e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e+00", "anc_loss": "1.740e+00", "dlm_acc": "4.743e-01", "anc_acc": "4.555e-01", "epoch": 0.03761} {"step": 18810, "loss": 1.6073, "grad_norm": "3.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.945e+00", "anc_loss": "2.006e+00", "dlm_acc": "3.304e-01", "anc_acc": "3.189e-01", "epoch": 0.03762} {"step": 18815, "loss": 1.3997, "grad_norm": "2.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.271e-01", "anc_loss": "7.883e-01", "dlm_acc": "7.594e-01", "anc_acc": "7.439e-01", "epoch": 0.03763} {"step": 18820, "loss": 1.5747, "grad_norm": "3.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.377e-01", "anc_acc": "5.076e-01", "epoch": 0.03764} {"step": 18825, "loss": 1.4014, "grad_norm": "4.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.077e-01", "anc_acc": "4.822e-01", "epoch": 0.03765} {"step": 18830, "loss": 1.3098, "grad_norm": "3.747e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.067e-01", "anc_loss": "4.301e-01", "dlm_acc": "8.012e-01", "anc_acc": "7.913e-01", "epoch": 0.03766} {"step": 18835, "loss": 1.394, "grad_norm": "3.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.119e-01", "anc_loss": "9.168e-01", "dlm_acc": "6.799e-01", "anc_acc": "6.546e-01", "epoch": 0.03767} {"step": 18840, "loss": 1.1818, "grad_norm": "3.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.451e-01", "anc_loss": "7.199e-01", "dlm_acc": "7.232e-01", "anc_acc": "7.004e-01", "epoch": 0.03768} {"step": 18845, "loss": 1.6309, "grad_norm": "4.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.429e+00", "dlm_acc": "5.753e-01", "anc_acc": "5.542e-01", "epoch": 0.03769} {"step": 18850, "loss": 1.3595, "grad_norm": "3.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.109e-01", "anc_loss": "7.105e-01", "dlm_acc": "7.221e-01", "anc_acc": "6.881e-01", "epoch": 0.0377} {"step": 18855, "loss": 1.3313, "grad_norm": "7.619e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.144e+00", "dlm_acc": "5.228e-01", "anc_acc": "5.019e-01", "epoch": 0.03771} {"step": 18860, "loss": 1.4662, "grad_norm": "3.945e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.693e-01", "anc_acc": "5.475e-01", "epoch": 0.03772} {"step": 18865, "loss": 1.5813, "grad_norm": "7.161e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.349e+00", "anc_loss": "1.421e+00", "dlm_acc": "5.505e-01", "anc_acc": "5.304e-01", "epoch": 0.03773} {"step": 18870, "loss": 1.3342, "grad_norm": "6.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e+00", "anc_loss": "1.735e+00", "dlm_acc": "4.135e-01", "anc_acc": "3.912e-01", "epoch": 0.03774} {"step": 18875, "loss": 1.9313, "grad_norm": "5.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.219e+00", "anc_loss": "2.375e+00", "dlm_acc": "3.970e-01", "anc_acc": "3.781e-01", "epoch": 0.03775} {"step": 18880, "loss": 1.4014, "grad_norm": "2.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.326e+00", "anc_loss": "1.418e+00", "dlm_acc": "5.631e-01", "anc_acc": "5.441e-01", "epoch": 0.03776} {"step": 18885, "loss": 1.4406, "grad_norm": "3.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.368e+00", "dlm_acc": "4.494e-01", "anc_acc": "4.332e-01", "epoch": 0.03777} {"step": 18890, "loss": 1.6767, "grad_norm": "8.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.458e+00", "anc_loss": "1.541e+00", "dlm_acc": "4.590e-01", "anc_acc": "4.406e-01", "epoch": 0.03778} {"step": 18895, "loss": 1.5438, "grad_norm": "4.089e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.552e+00", "anc_loss": "1.659e+00", "dlm_acc": "4.819e-01", "anc_acc": "4.549e-01", "epoch": 0.03779} {"step": 18900, "loss": 1.2696, "grad_norm": "3.220e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.520e+00", "dlm_acc": "5.232e-01", "anc_acc": "5.009e-01", "epoch": 0.0378} {"step": 18905, "loss": 0.9362, "grad_norm": "2.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.664e-01", "anc_loss": "6.098e-01", "dlm_acc": "7.297e-01", "anc_acc": "7.153e-01", "epoch": 0.03781} {"step": 18910, "loss": 0.7155, "grad_norm": "1.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.781e-01", "anc_loss": "6.367e-01", "dlm_acc": "7.286e-01", "anc_acc": "7.079e-01", "epoch": 0.03782} {"step": 18915, "loss": 0.9815, "grad_norm": "3.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.227e+00", "dlm_acc": "6.300e-01", "anc_acc": "6.034e-01", "epoch": 0.03783} {"step": 18920, "loss": 0.8339, "grad_norm": "4.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.953e-01", "anc_loss": "9.859e-01", "dlm_acc": "6.259e-01", "anc_acc": "6.007e-01", "epoch": 0.03784} {"step": 18925, "loss": 1.0986, "grad_norm": "3.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.748e+00", "anc_loss": "1.805e+00", "dlm_acc": "3.748e-01", "anc_acc": "3.606e-01", "epoch": 0.03785} {"step": 18930, "loss": 1.3915, "grad_norm": "7.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.523e-01", "anc_acc": "5.216e-01", "epoch": 0.03786} {"step": 18935, "loss": 1.2281, "grad_norm": "3.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.253e-01", "anc_acc": "5.050e-01", "epoch": 0.03787} {"step": 18940, "loss": 1.1168, "grad_norm": "6.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.703e+00", "anc_loss": "1.782e+00", "dlm_acc": "4.581e-01", "anc_acc": "4.391e-01", "epoch": 0.03788} {"step": 18945, "loss": 0.9492, "grad_norm": "3.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.376e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.307e-01", "anc_acc": "5.037e-01", "epoch": 0.03789} {"step": 18950, "loss": 1.1216, "grad_norm": "3.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.684e+00", "dlm_acc": "4.526e-01", "anc_acc": "4.348e-01", "epoch": 0.0379} {"step": 18955, "loss": 0.9375, "grad_norm": "4.696e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.716e-01", "anc_loss": "5.089e-01", "dlm_acc": "8.305e-01", "anc_acc": "8.242e-01", "epoch": 0.03791} {"step": 18960, "loss": 0.8192, "grad_norm": "2.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.880e-02", "anc_loss": "8.843e-02", "dlm_acc": "9.547e-01", "anc_acc": "9.466e-01", "epoch": 0.03792} {"step": 18965, "loss": 1.0237, "grad_norm": "2.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.071e-01", "anc_loss": "6.417e-01", "dlm_acc": "7.762e-01", "anc_acc": "7.655e-01", "epoch": 0.03793} {"step": 18970, "loss": 0.9917, "grad_norm": "7.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.151e+00", "dlm_acc": "5.738e-01", "anc_acc": "5.546e-01", "epoch": 0.03794} {"step": 18975, "loss": 0.7658, "grad_norm": "3.337e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.141e-01", "anc_loss": "6.352e-01", "dlm_acc": "5.472e-01", "anc_acc": "5.371e-01", "epoch": 0.03795} {"step": 18980, "loss": 0.7047, "grad_norm": "1.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.557e-01", "anc_loss": "9.273e-01", "dlm_acc": "6.241e-01", "anc_acc": "6.057e-01", "epoch": 0.03796} {"step": 18985, "loss": 1.2753, "grad_norm": "4.980e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.351e+00", "anc_loss": "1.458e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.207e-01", "epoch": 0.03797} {"step": 18990, "loss": 0.9946, "grad_norm": "2.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.147e+00", "dlm_acc": "5.871e-01", "anc_acc": "5.605e-01", "epoch": 0.03798} {"step": 18995, "loss": 0.8782, "grad_norm": "3.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.117e-01", "anc_loss": "9.602e-01", "dlm_acc": "5.497e-01", "anc_acc": "5.265e-01", "epoch": 0.03799} {"step": 19000, "loss": 1.0555, "grad_norm": "3.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.281e-01", "anc_loss": "8.836e-01", "dlm_acc": "5.531e-01", "anc_acc": "5.268e-01", "epoch": 0.038} {"step": 19005, "loss": 1.5875, "grad_norm": "7.304e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.820e+00", "anc_loss": "1.922e+00", "dlm_acc": "4.114e-01", "anc_acc": "3.847e-01", "epoch": 0.03801} {"step": 19010, "loss": 1.3459, "grad_norm": "2.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.561e+00", "anc_loss": "1.640e+00", "dlm_acc": "4.363e-01", "anc_acc": "4.157e-01", "epoch": 0.03802} {"step": 19015, "loss": 1.3283, "grad_norm": "4.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.249e+00", "dlm_acc": "4.731e-01", "anc_acc": "4.586e-01", "epoch": 0.03803} {"step": 19020, "loss": 1.0349, "grad_norm": "4.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.375e-01", "anc_loss": "9.742e-01", "dlm_acc": "3.731e-01", "anc_acc": "3.625e-01", "epoch": 0.03804} {"step": 19025, "loss": 1.204, "grad_norm": "8.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.738e-01", "anc_loss": "8.332e-01", "dlm_acc": "6.857e-01", "anc_acc": "6.684e-01", "epoch": 0.03805} {"step": 19030, "loss": 1.4455, "grad_norm": "3.031e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.367e-01", "anc_loss": "9.867e-01", "dlm_acc": "4.816e-01", "anc_acc": "4.626e-01", "epoch": 0.03806} {"step": 19035, "loss": 1.7866, "grad_norm": "4.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.400e+00", "anc_loss": "1.473e+00", "dlm_acc": "4.660e-01", "anc_acc": "4.457e-01", "epoch": 0.03807} {"step": 19040, "loss": 1.1972, "grad_norm": "2.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.276e+00", "anc_loss": "1.390e+00", "dlm_acc": "5.630e-01", "anc_acc": "5.370e-01", "epoch": 0.03808} {"step": 19045, "loss": 0.9772, "grad_norm": "4.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.652e-01", "anc_loss": "7.348e-01", "dlm_acc": "7.013e-01", "anc_acc": "6.782e-01", "epoch": 0.03809} {"step": 19050, "loss": 1.1885, "grad_norm": "2.718e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.041e-01", "anc_acc": "4.807e-01", "epoch": 0.0381} {"step": 19055, "loss": 0.9931, "grad_norm": "2.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.949e-01", "anc_acc": "5.709e-01", "epoch": 0.03811} {"step": 19060, "loss": 1.1578, "grad_norm": "3.132e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.445e+00", "dlm_acc": "4.969e-01", "anc_acc": "4.767e-01", "epoch": 0.03812} {"step": 19065, "loss": 1.0828, "grad_norm": "2.228e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.547e-01", "anc_loss": "1.050e+00", "dlm_acc": "6.500e-01", "anc_acc": "6.219e-01", "epoch": 0.03813} {"step": 19070, "loss": 1.1689, "grad_norm": "2.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.563e+00", "dlm_acc": "5.225e-01", "anc_acc": "4.978e-01", "epoch": 0.03814} {"step": 19075, "loss": 1.1862, "grad_norm": "3.341e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.442e+00", "anc_loss": "1.536e+00", "dlm_acc": "5.236e-01", "anc_acc": "5.049e-01", "epoch": 0.03815} {"step": 19080, "loss": 1.8253, "grad_norm": "6.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.835e+00", "anc_loss": "1.944e+00", "dlm_acc": "4.846e-01", "anc_acc": "4.622e-01", "epoch": 0.03816} {"step": 19085, "loss": 1.3682, "grad_norm": "3.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.759e+00", "anc_loss": "1.800e+00", "dlm_acc": "2.961e-01", "anc_acc": "2.907e-01", "epoch": 0.03817} {"step": 19090, "loss": 1.5074, "grad_norm": "2.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.719e+00", "dlm_acc": "4.278e-01", "anc_acc": "4.090e-01", "epoch": 0.03818} {"step": 19095, "loss": 1.2817, "grad_norm": "3.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.535e+00", "dlm_acc": "5.252e-01", "anc_acc": "5.037e-01", "epoch": 0.03819} {"step": 19100, "loss": 1.2258, "grad_norm": "2.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.501e+00", "anc_loss": "1.605e+00", "dlm_acc": "5.046e-01", "anc_acc": "4.845e-01", "epoch": 0.0382} {"step": 19105, "loss": 1.2886, "grad_norm": "3.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.064e+00", "anc_loss": "1.148e+00", "dlm_acc": "6.366e-01", "anc_acc": "6.197e-01", "epoch": 0.03821} {"step": 19110, "loss": 1.4574, "grad_norm": "2.330e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.700e+00", "anc_loss": "1.787e+00", "dlm_acc": "4.197e-01", "anc_acc": "4.051e-01", "epoch": 0.03822} {"step": 19115, "loss": 1.7204, "grad_norm": "6.109e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.144e+00", "anc_loss": "2.247e+00", "dlm_acc": "3.776e-01", "anc_acc": "3.619e-01", "epoch": 0.03823} {"step": 19120, "loss": 1.1788, "grad_norm": "3.351e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.356e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.254e-01", "anc_acc": "5.075e-01", "epoch": 0.03824} {"step": 19125, "loss": 1.237, "grad_norm": "3.716e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.453e+00", "dlm_acc": "4.769e-01", "anc_acc": "4.669e-01", "epoch": 0.03825} {"step": 19130, "loss": 1.0156, "grad_norm": "3.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.262e+00", "dlm_acc": "4.745e-01", "anc_acc": "4.613e-01", "epoch": 0.03826} {"step": 19135, "loss": 1.1866, "grad_norm": "2.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.318e-01", "anc_acc": "5.179e-01", "epoch": 0.03827} {"step": 19140, "loss": 0.7274, "grad_norm": "4.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.805e-01", "anc_loss": "9.453e-01", "dlm_acc": "6.305e-01", "anc_acc": "6.139e-01", "epoch": 0.03828} {"step": 19145, "loss": 0.9831, "grad_norm": "4.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.158e+00", "dlm_acc": "5.301e-01", "anc_acc": "5.147e-01", "epoch": 0.03829} {"step": 19150, "loss": 1.7917, "grad_norm": "2.184e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.863e+00", "anc_loss": "1.898e+00", "dlm_acc": "2.606e-01", "anc_acc": "2.536e-01", "epoch": 0.0383} {"step": 19155, "loss": 1.3448, "grad_norm": "3.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.862e+00", "anc_loss": "2.894e+00", "dlm_acc": "6.362e-02", "anc_acc": "6.111e-02", "epoch": 0.03831} {"step": 19160, "loss": 1.2743, "grad_norm": "6.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.250e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.546e-01", "anc_acc": "5.257e-01", "epoch": 0.03832} {"step": 19165, "loss": 1.2484, "grad_norm": "3.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.883e-01", "anc_loss": "9.992e-01", "dlm_acc": "6.518e-01", "anc_acc": "6.184e-01", "epoch": 0.03833} {"step": 19170, "loss": 1.1942, "grad_norm": "4.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.111e+00", "dlm_acc": "5.781e-01", "anc_acc": "5.598e-01", "epoch": 0.03834} {"step": 19175, "loss": 0.9342, "grad_norm": "2.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.222e+00", "dlm_acc": "5.954e-01", "anc_acc": "5.716e-01", "epoch": 0.03835} {"step": 19180, "loss": 1.5811, "grad_norm": "3.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.242e-01", "anc_loss": "1.045e+00", "dlm_acc": "6.760e-01", "anc_acc": "6.407e-01", "epoch": 0.03836} {"step": 19185, "loss": 1.3988, "grad_norm": "3.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.476e+00", "dlm_acc": "4.867e-01", "anc_acc": "4.601e-01", "epoch": 0.03837} {"step": 19190, "loss": 1.2451, "grad_norm": "3.382e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.275e+00", "dlm_acc": "5.804e-01", "anc_acc": "5.558e-01", "epoch": 0.03838} {"step": 19195, "loss": 1.2809, "grad_norm": "4.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.750e+00", "anc_loss": "1.836e+00", "dlm_acc": "4.342e-01", "anc_acc": "4.146e-01", "epoch": 0.03839} {"step": 19200, "loss": 1.4641, "grad_norm": "3.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.723e+00", "anc_loss": "1.834e+00", "dlm_acc": "4.519e-01", "anc_acc": "4.281e-01", "epoch": 0.0384} {"step": 19205, "loss": 1.3063, "grad_norm": "4.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.211e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.709e-01", "anc_acc": "5.494e-01", "epoch": 0.03841} {"step": 19210, "loss": 1.326, "grad_norm": "3.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.566e-01", "anc_loss": "1.054e+00", "dlm_acc": "6.121e-01", "anc_acc": "5.823e-01", "epoch": 0.03842} {"step": 19215, "loss": 1.7656, "grad_norm": "4.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.619e+00", "anc_loss": "2.641e+00", "dlm_acc": "1.320e-01", "anc_acc": "1.296e-01", "epoch": 0.03843} {"step": 19220, "loss": 1.2489, "grad_norm": "2.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.859e+00", "anc_loss": "1.925e+00", "dlm_acc": "3.625e-01", "anc_acc": "3.470e-01", "epoch": 0.03844} {"step": 19225, "loss": 1.2585, "grad_norm": "4.300e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.789e-01", "anc_loss": "9.512e-01", "dlm_acc": "6.087e-01", "anc_acc": "5.913e-01", "epoch": 0.03845} {"step": 19230, "loss": 0.8939, "grad_norm": "2.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.523e-01", "anc_loss": "1.080e+00", "dlm_acc": "6.329e-01", "anc_acc": "5.905e-01", "epoch": 0.03846} {"step": 19235, "loss": 1.5362, "grad_norm": "6.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.745e-01", "anc_acc": "5.422e-01", "epoch": 0.03847} {"step": 19240, "loss": 1.5991, "grad_norm": "5.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.313e+00", "anc_loss": "1.390e+00", "dlm_acc": "4.987e-01", "anc_acc": "4.710e-01", "epoch": 0.03848} {"step": 19245, "loss": 1.1104, "grad_norm": "5.280e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.154e+00", "dlm_acc": "6.024e-01", "anc_acc": "5.834e-01", "epoch": 0.03849} {"step": 19250, "loss": 1.0965, "grad_norm": "2.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.597e+00", "dlm_acc": "4.098e-01", "anc_acc": "3.895e-01", "epoch": 0.0385} {"step": 19255, "loss": 1.3708, "grad_norm": "3.271e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.780e-01", "anc_acc": "5.431e-01", "epoch": 0.03851} {"step": 19260, "loss": 1.3829, "grad_norm": "4.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.063e-01", "anc_acc": "5.696e-01", "epoch": 0.03852} {"step": 19265, "loss": 1.2827, "grad_norm": "2.862e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.759e-01", "anc_acc": "5.576e-01", "epoch": 0.03853} {"step": 19270, "loss": 1.7274, "grad_norm": "6.653e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.327e+00", "anc_loss": "2.375e+00", "dlm_acc": "1.908e-01", "anc_acc": "1.815e-01", "epoch": 0.03854} {"step": 19275, "loss": 1.3578, "grad_norm": "4.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.071e+00", "dlm_acc": "6.208e-01", "anc_acc": "6.066e-01", "epoch": 0.03855} {"step": 19280, "loss": 1.8805, "grad_norm": "4.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.859e+00", "anc_loss": "1.969e+00", "dlm_acc": "4.794e-01", "anc_acc": "4.599e-01", "epoch": 0.03856} {"step": 19285, "loss": 1.3274, "grad_norm": "2.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.792e+00", "anc_loss": "1.945e+00", "dlm_acc": "4.325e-01", "anc_acc": "4.112e-01", "epoch": 0.03857} {"step": 19290, "loss": 1.4149, "grad_norm": "7.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.308e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.762e-01", "anc_acc": "5.502e-01", "epoch": 0.03858} {"step": 19295, "loss": 1.4443, "grad_norm": "3.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.256e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.964e-01", "anc_acc": "5.746e-01", "epoch": 0.03859} {"step": 19300, "loss": 1.7657, "grad_norm": "4.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.762e+00", "anc_loss": "1.861e+00", "dlm_acc": "4.614e-01", "anc_acc": "4.413e-01", "epoch": 0.0386} {"step": 19305, "loss": 1.2357, "grad_norm": "2.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.128e+00", "dlm_acc": "5.855e-01", "anc_acc": "5.674e-01", "epoch": 0.03861} {"step": 19310, "loss": 1.4288, "grad_norm": "4.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.659e+00", "anc_loss": "1.769e+00", "dlm_acc": "4.420e-01", "anc_acc": "4.101e-01", "epoch": 0.03862} {"step": 19315, "loss": 1.0215, "grad_norm": "2.518e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.417e-01", "anc_acc": "5.153e-01", "epoch": 0.03863} {"step": 19320, "loss": 1.3698, "grad_norm": "3.222e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.683e-01", "anc_acc": "5.412e-01", "epoch": 0.03864} {"step": 19325, "loss": 1.6882, "grad_norm": "8.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.080e+00", "anc_loss": "2.131e+00", "dlm_acc": "2.759e-01", "anc_acc": "2.637e-01", "epoch": 0.03865} {"step": 19330, "loss": 1.612, "grad_norm": "4.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.543e+00", "anc_loss": "1.641e+00", "dlm_acc": "4.212e-01", "anc_acc": "3.999e-01", "epoch": 0.03866} {"step": 19335, "loss": 0.9425, "grad_norm": "3.365e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.193e+00", "dlm_acc": "5.501e-01", "anc_acc": "5.322e-01", "epoch": 0.03867} {"step": 19340, "loss": 1.0425, "grad_norm": "3.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.013e+00", "anc_loss": "1.080e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.393e-01", "epoch": 0.03868} {"step": 19345, "loss": 1.234, "grad_norm": "4.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.414e+00", "dlm_acc": "5.261e-01", "anc_acc": "5.053e-01", "epoch": 0.03869} {"step": 19350, "loss": 1.1677, "grad_norm": "3.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.183e+00", "dlm_acc": "5.669e-01", "anc_acc": "5.419e-01", "epoch": 0.0387} {"step": 19355, "loss": 1.5259, "grad_norm": "2.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.526e+00", "anc_loss": "1.616e+00", "dlm_acc": "5.216e-01", "anc_acc": "5.036e-01", "epoch": 0.03871} {"step": 19360, "loss": 1.4658, "grad_norm": "4.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.074e-01", "anc_loss": "8.660e-01", "dlm_acc": "6.525e-01", "anc_acc": "6.346e-01", "epoch": 0.03872} {"step": 19365, "loss": 1.2234, "grad_norm": "4.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.645e-01", "anc_loss": "7.188e-01", "dlm_acc": "6.898e-01", "anc_acc": "6.703e-01", "epoch": 0.03873} {"step": 19370, "loss": 1.2966, "grad_norm": "2.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.070e-01", "anc_loss": "8.688e-01", "dlm_acc": "6.520e-01", "anc_acc": "6.304e-01", "epoch": 0.03874} {"step": 19375, "loss": 1.1687, "grad_norm": "3.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.883e-01", "anc_loss": "6.617e-01", "dlm_acc": "7.025e-01", "anc_acc": "6.764e-01", "epoch": 0.03875} {"step": 19380, "loss": 1.0853, "grad_norm": "3.134e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.012e-01", "anc_loss": "8.891e-01", "dlm_acc": "6.909e-01", "anc_acc": "6.653e-01", "epoch": 0.03876} {"step": 19385, "loss": 1.2613, "grad_norm": "3.099e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.210e+00", "dlm_acc": "5.849e-01", "anc_acc": "5.632e-01", "epoch": 0.03877} {"step": 19390, "loss": 1.5569, "grad_norm": "2.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.490e+00", "dlm_acc": "5.279e-01", "anc_acc": "5.001e-01", "epoch": 0.03878} {"step": 19395, "loss": 1.3193, "grad_norm": "2.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.625e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.462e-01", "anc_acc": "6.257e-01", "epoch": 0.03879} {"step": 19400, "loss": 1.3668, "grad_norm": "3.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.207e+00", "dlm_acc": "5.615e-01", "anc_acc": "5.282e-01", "epoch": 0.0388} {"step": 19405, "loss": 1.5748, "grad_norm": "2.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.232e+00", "anc_loss": "1.329e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.446e-01", "epoch": 0.03881} {"step": 19410, "loss": 1.3396, "grad_norm": "3.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.696e-01", "anc_acc": "5.442e-01", "epoch": 0.03882} {"step": 19415, "loss": 1.2159, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.138e+00", "dlm_acc": "5.990e-01", "anc_acc": "5.751e-01", "epoch": 0.03883} {"step": 19420, "loss": 1.5662, "grad_norm": "3.088e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.381e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.405e-01", "anc_acc": "5.215e-01", "epoch": 0.03884} {"step": 19425, "loss": 1.6198, "grad_norm": "3.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.122e+00", "anc_loss": "2.194e+00", "dlm_acc": "3.161e-01", "anc_acc": "3.020e-01", "epoch": 0.03885} {"step": 19430, "loss": 1.2987, "grad_norm": "2.623e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.287e-01", "epoch": 0.03886} {"step": 19435, "loss": 1.9052, "grad_norm": "4.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.653e+00", "dlm_acc": "4.597e-01", "anc_acc": "4.401e-01", "epoch": 0.03887} {"step": 19440, "loss": 0.8772, "grad_norm": "2.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.352e-01", "anc_loss": "9.062e-01", "dlm_acc": "6.163e-01", "anc_acc": "5.957e-01", "epoch": 0.03888} {"step": 19445, "loss": 1.6944, "grad_norm": "3.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.556e+00", "anc_loss": "1.664e+00", "dlm_acc": "5.446e-01", "anc_acc": "5.245e-01", "epoch": 0.03889} {"step": 19450, "loss": 1.3245, "grad_norm": "5.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.910e-01", "anc_loss": "9.453e-01", "dlm_acc": "6.974e-01", "anc_acc": "6.836e-01", "epoch": 0.0389} {"step": 19455, "loss": 1.0281, "grad_norm": "4.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.931e-01", "anc_loss": "8.598e-01", "dlm_acc": "7.134e-01", "anc_acc": "6.969e-01", "epoch": 0.03891} {"step": 19460, "loss": 1.5084, "grad_norm": "4.373e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.244e+00", "dlm_acc": "3.579e-01", "anc_acc": "3.433e-01", "epoch": 0.03892} {"step": 19465, "loss": 1.3341, "grad_norm": "3.690e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.305e-01", "anc_loss": "9.383e-01", "dlm_acc": "2.445e-01", "anc_acc": "2.413e-01", "epoch": 0.03893} {"step": 19470, "loss": 1.2213, "grad_norm": "2.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.202e+00", "dlm_acc": "5.299e-01", "anc_acc": "5.021e-01", "epoch": 0.03894} {"step": 19475, "loss": 1.5357, "grad_norm": "6.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.344e-01", "anc_loss": "8.980e-01", "dlm_acc": "6.939e-01", "anc_acc": "6.783e-01", "epoch": 0.03895} {"step": 19480, "loss": 1.4091, "grad_norm": "5.149e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.441e-01", "anc_acc": "5.203e-01", "epoch": 0.03896} {"step": 19485, "loss": 1.301, "grad_norm": "3.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.880e-01", "anc_acc": "5.647e-01", "epoch": 0.03897} {"step": 19490, "loss": 1.4484, "grad_norm": "3.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.242e-01", "anc_loss": "9.961e-01", "dlm_acc": "5.962e-01", "anc_acc": "5.756e-01", "epoch": 0.03898} {"step": 19495, "loss": 1.5397, "grad_norm": "4.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.942e-01", "anc_acc": "5.729e-01", "epoch": 0.03899} {"step": 19500, "loss": 1.3037, "grad_norm": "3.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.863e-01", "anc_acc": "5.665e-01", "epoch": 0.039} {"step": 19505, "loss": 1.5587, "grad_norm": "3.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.553e+00", "dlm_acc": "5.482e-01", "anc_acc": "5.215e-01", "epoch": 0.03901} {"step": 19510, "loss": 1.3892, "grad_norm": "3.836e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.215e+00", "anc_loss": "1.290e+00", "dlm_acc": "5.830e-01", "anc_acc": "5.674e-01", "epoch": 0.03902} {"step": 19515, "loss": 1.5201, "grad_norm": "2.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.418e-01", "epoch": 0.03903} {"step": 19520, "loss": 1.1744, "grad_norm": "3.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.492e-01", "anc_loss": "7.340e-01", "dlm_acc": "7.581e-01", "anc_acc": "7.385e-01", "epoch": 0.03904} {"step": 19525, "loss": 1.2056, "grad_norm": "3.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.126e+00", "dlm_acc": "6.442e-01", "anc_acc": "6.274e-01", "epoch": 0.03905} {"step": 19530, "loss": 1.2473, "grad_norm": "4.179e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.293e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.445e-01", "epoch": 0.03906} {"step": 19535, "loss": 1.0276, "grad_norm": "2.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.129e-01", "anc_loss": "9.711e-01", "dlm_acc": "6.741e-01", "anc_acc": "6.611e-01", "epoch": 0.03907} {"step": 19540, "loss": 1.0765, "grad_norm": "4.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.252e+00", "dlm_acc": "6.088e-01", "anc_acc": "5.881e-01", "epoch": 0.03908} {"step": 19545, "loss": 0.8959, "grad_norm": "2.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.816e-01", "anc_loss": "7.430e-01", "dlm_acc": "6.921e-01", "anc_acc": "6.755e-01", "epoch": 0.03909} {"step": 19550, "loss": 0.8723, "grad_norm": "1.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.818e-01", "anc_loss": "6.539e-01", "dlm_acc": "7.340e-01", "anc_acc": "7.113e-01", "epoch": 0.0391} {"step": 19555, "loss": 0.8378, "grad_norm": "3.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.325e-01", "anc_loss": "5.839e-01", "dlm_acc": "7.486e-01", "anc_acc": "7.339e-01", "epoch": 0.03911} {"step": 19560, "loss": 0.9921, "grad_norm": "2.403e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.221e-01", "anc_loss": "8.885e-01", "dlm_acc": "6.584e-01", "anc_acc": "6.435e-01", "epoch": 0.03912} {"step": 19565, "loss": 1.0989, "grad_norm": "3.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.861e-01", "anc_acc": "5.652e-01", "epoch": 0.03913} {"step": 19570, "loss": 0.7861, "grad_norm": "2.437e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.558e-01", "anc_loss": "9.359e-01", "dlm_acc": "6.722e-01", "anc_acc": "6.528e-01", "epoch": 0.03914} {"step": 19575, "loss": 0.6225, "grad_norm": "3.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.467e-01", "anc_loss": "5.672e-01", "dlm_acc": "6.619e-01", "anc_acc": "6.566e-01", "epoch": 0.03915} {"step": 19580, "loss": 0.9666, "grad_norm": "3.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.945e-01", "anc_loss": "6.984e-01", "dlm_acc": "5.541e-01", "anc_acc": "5.540e-01", "epoch": 0.03916} {"step": 19585, "loss": 1.2055, "grad_norm": "3.598e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.289e-01", "anc_loss": "7.336e-01", "dlm_acc": "5.454e-01", "anc_acc": "5.460e-01", "epoch": 0.03917} {"step": 19590, "loss": 1.5485, "grad_norm": "5.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.178e+00", "dlm_acc": "5.726e-01", "anc_acc": "5.575e-01", "epoch": 0.03918} {"step": 19595, "loss": 1.2175, "grad_norm": "3.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.523e+00", "dlm_acc": "5.182e-01", "anc_acc": "4.970e-01", "epoch": 0.03919} {"step": 19600, "loss": 0.8162, "grad_norm": "2.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.172e-01", "anc_loss": "7.603e-01", "dlm_acc": "7.691e-01", "anc_acc": "7.563e-01", "epoch": 0.0392} {"step": 19605, "loss": 0.9315, "grad_norm": "4.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.858e-01", "anc_loss": "5.328e-01", "dlm_acc": "8.281e-01", "anc_acc": "8.110e-01", "epoch": 0.03921} {"step": 19610, "loss": 0.7986, "grad_norm": "1.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.177e-01", "anc_loss": "3.515e-01", "dlm_acc": "8.395e-01", "anc_acc": "8.246e-01", "epoch": 0.03922} {"step": 19615, "loss": 0.9452, "grad_norm": "3.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.723e-01", "anc_loss": "5.223e-01", "dlm_acc": "8.388e-01", "anc_acc": "8.250e-01", "epoch": 0.03923} {"step": 19620, "loss": 0.9702, "grad_norm": "5.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.160e-01", "anc_loss": "3.463e-01", "dlm_acc": "8.641e-01", "anc_acc": "8.574e-01", "epoch": 0.03924} {"step": 19625, "loss": 0.9849, "grad_norm": "5.294e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.626e-01", "anc_loss": "7.187e-01", "dlm_acc": "7.677e-01", "anc_acc": "7.505e-01", "epoch": 0.03925} {"step": 19630, "loss": 1.4881, "grad_norm": "4.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.664e+00", "anc_loss": "1.755e+00", "dlm_acc": "5.228e-01", "anc_acc": "5.056e-01", "epoch": 0.03926} {"step": 19635, "loss": 0.9446, "grad_norm": "3.482e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.373e-01", "anc_loss": "9.027e-01", "dlm_acc": "6.425e-01", "anc_acc": "6.230e-01", "epoch": 0.03927} {"step": 19640, "loss": 0.8801, "grad_norm": "4.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.927e-01", "anc_loss": "7.480e-01", "dlm_acc": "7.247e-01", "anc_acc": "7.134e-01", "epoch": 0.03928} {"step": 19645, "loss": 0.8886, "grad_norm": "8.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.376e-01", "anc_loss": "1.527e-01", "dlm_acc": "9.279e-01", "anc_acc": "9.169e-01", "epoch": 0.03929} {"step": 19650, "loss": 0.8273, "grad_norm": "3.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.240e-01", "anc_loss": "3.478e-01", "dlm_acc": "8.567e-01", "anc_acc": "8.503e-01", "epoch": 0.0393} {"step": 19655, "loss": 1.1029, "grad_norm": "2.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.039e-01", "anc_loss": "8.484e-01", "dlm_acc": "6.539e-01", "anc_acc": "6.444e-01", "epoch": 0.03931} {"step": 19660, "loss": 0.9995, "grad_norm": "2.979e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.162e-01", "anc_loss": "6.572e-01", "dlm_acc": "7.888e-01", "anc_acc": "7.759e-01", "epoch": 0.03932} {"step": 19665, "loss": 1.262, "grad_norm": "2.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.265e+00", "dlm_acc": "6.224e-01", "anc_acc": "6.078e-01", "epoch": 0.03933} {"step": 19670, "loss": 0.8488, "grad_norm": "1.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.706e-01", "anc_loss": "8.241e-01", "dlm_acc": "7.520e-01", "anc_acc": "7.394e-01", "epoch": 0.03934} {"step": 19675, "loss": 0.9661, "grad_norm": "3.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.243e+00", "dlm_acc": "6.291e-01", "anc_acc": "6.132e-01", "epoch": 0.03935} {"step": 19680, "loss": 0.8367, "grad_norm": "3.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.340e-01", "anc_loss": "7.779e-01", "dlm_acc": "6.778e-01", "anc_acc": "6.680e-01", "epoch": 0.03936} {"step": 19685, "loss": 0.7501, "grad_norm": "3.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.247e-01", "anc_loss": "5.724e-01", "dlm_acc": "7.551e-01", "anc_acc": "7.412e-01", "epoch": 0.03937} {"step": 19690, "loss": 0.9558, "grad_norm": "5.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.692e+00", "anc_loss": "1.783e+00", "dlm_acc": "5.015e-01", "anc_acc": "4.861e-01", "epoch": 0.03938} {"step": 19695, "loss": 1.1984, "grad_norm": "5.698e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.635e+00", "anc_loss": "1.742e+00", "dlm_acc": "5.190e-01", "anc_acc": "4.993e-01", "epoch": 0.03939} {"step": 19700, "loss": 1.2449, "grad_norm": "4.883e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.323e-01", "epoch": 0.0394} {"step": 19705, "loss": 1.2188, "grad_norm": "2.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.527e-01", "anc_acc": "5.299e-01", "epoch": 0.03941} {"step": 19710, "loss": 0.9872, "grad_norm": "2.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.577e-01", "anc_acc": "5.375e-01", "epoch": 0.03942} {"step": 19715, "loss": 1.1018, "grad_norm": "2.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.688e+00", "anc_loss": "1.783e+00", "dlm_acc": "4.822e-01", "anc_acc": "4.647e-01", "epoch": 0.03943} {"step": 19720, "loss": 0.7952, "grad_norm": "2.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.031e-01", "anc_loss": "9.992e-01", "dlm_acc": "6.521e-01", "anc_acc": "6.258e-01", "epoch": 0.03944} {"step": 19725, "loss": 1.1182, "grad_norm": "2.875e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.451e+00", "anc_loss": "1.555e+00", "dlm_acc": "5.346e-01", "anc_acc": "5.128e-01", "epoch": 0.03945} {"step": 19730, "loss": 0.9823, "grad_norm": "3.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.176e+00", "anc_loss": "1.281e+00", "dlm_acc": "6.156e-01", "anc_acc": "5.964e-01", "epoch": 0.03946} {"step": 19735, "loss": 1.0267, "grad_norm": "2.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.341e+00", "dlm_acc": "6.119e-01", "anc_acc": "5.941e-01", "epoch": 0.03947} {"step": 19740, "loss": 0.7427, "grad_norm": "4.486e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.036e+00", "anc_loss": "1.116e+00", "dlm_acc": "6.150e-01", "anc_acc": "5.941e-01", "epoch": 0.03948} {"step": 19745, "loss": 0.9701, "grad_norm": "4.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.589e+00", "dlm_acc": "5.004e-01", "anc_acc": "4.811e-01", "epoch": 0.03949} {"step": 19750, "loss": 1.1686, "grad_norm": "2.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.313e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.934e-01", "anc_acc": "5.727e-01", "epoch": 0.0395} {"step": 19755, "loss": 1.2168, "grad_norm": "1.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.303e+00", "dlm_acc": "5.975e-01", "anc_acc": "5.715e-01", "epoch": 0.03951} {"step": 19760, "loss": 1.1012, "grad_norm": "4.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.180e+00", "dlm_acc": "5.774e-01", "anc_acc": "5.540e-01", "epoch": 0.03952} {"step": 19765, "loss": 1.022, "grad_norm": "4.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.068e+00", "anc_loss": "1.132e+00", "dlm_acc": "6.317e-01", "anc_acc": "6.183e-01", "epoch": 0.03953} {"step": 19770, "loss": 1.1745, "grad_norm": "3.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.238e-01", "anc_loss": "1.001e+00", "dlm_acc": "6.291e-01", "anc_acc": "6.136e-01", "epoch": 0.03954} {"step": 19775, "loss": 1.3897, "grad_norm": "3.362e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.332e-01", "anc_acc": "5.123e-01", "epoch": 0.03955} {"step": 19780, "loss": 1.263, "grad_norm": "3.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.715e+00", "dlm_acc": "4.609e-01", "anc_acc": "4.355e-01", "epoch": 0.03956} {"step": 19785, "loss": 0.815, "grad_norm": "8.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.473e-01", "anc_loss": "8.063e-01", "dlm_acc": "6.397e-01", "anc_acc": "6.242e-01", "epoch": 0.03957} {"step": 19790, "loss": 1.5061, "grad_norm": "5.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.236e+00", "dlm_acc": "5.521e-01", "anc_acc": "5.244e-01", "epoch": 0.03958} {"step": 19795, "loss": 1.163, "grad_norm": "5.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.258e-01", "anc_acc": "4.969e-01", "epoch": 0.03959} {"step": 19800, "loss": 1.0442, "grad_norm": "5.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.308e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.414e-01", "anc_acc": "5.245e-01", "epoch": 0.0396} {"step": 19805, "loss": 1.1162, "grad_norm": "8.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.105e-01", "anc_loss": "8.586e-01", "dlm_acc": "6.581e-01", "anc_acc": "6.482e-01", "epoch": 0.03961} {"step": 19810, "loss": 1.5203, "grad_norm": "5.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.325e+00", "dlm_acc": "4.667e-01", "anc_acc": "4.495e-01", "epoch": 0.03962} {"step": 19815, "loss": 1.3109, "grad_norm": "4.744e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.479e+00", "dlm_acc": "4.803e-01", "anc_acc": "4.630e-01", "epoch": 0.03963} {"step": 19820, "loss": 1.0936, "grad_norm": "3.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.336e-01", "anc_loss": "7.883e-01", "dlm_acc": "6.395e-01", "anc_acc": "6.227e-01", "epoch": 0.03964} {"step": 19825, "loss": 1.4996, "grad_norm": "3.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.371e+00", "dlm_acc": "5.585e-01", "anc_acc": "5.342e-01", "epoch": 0.03965} {"step": 19830, "loss": 1.2104, "grad_norm": "4.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.233e+00", "anc_loss": "1.317e+00", "dlm_acc": "5.269e-01", "anc_acc": "5.043e-01", "epoch": 0.03966} {"step": 19835, "loss": 1.4219, "grad_norm": "3.676e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.332e-01", "anc_loss": "9.211e-01", "dlm_acc": "7.064e-01", "anc_acc": "6.799e-01", "epoch": 0.03967} {"step": 19840, "loss": 1.3237, "grad_norm": "4.320e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.404e+00", "anc_loss": "1.461e+00", "dlm_acc": "4.725e-01", "anc_acc": "4.575e-01", "epoch": 0.03968} {"step": 19845, "loss": 1.4331, "grad_norm": "2.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.106e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.317e-01", "anc_acc": "5.064e-01", "epoch": 0.03969} {"step": 19850, "loss": 0.9229, "grad_norm": "1.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.552e-01", "anc_loss": "6.301e-01", "dlm_acc": "7.603e-01", "anc_acc": "7.381e-01", "epoch": 0.0397} {"step": 19855, "loss": 0.9367, "grad_norm": "3.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.307e-01", "anc_loss": "9.939e-01", "dlm_acc": "6.296e-01", "anc_acc": "6.121e-01", "epoch": 0.03971} {"step": 19860, "loss": 0.8593, "grad_norm": "4.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.426e-01", "anc_loss": "7.969e-01", "dlm_acc": "6.782e-01", "anc_acc": "6.623e-01", "epoch": 0.03972} {"step": 19865, "loss": 1.2952, "grad_norm": "3.149e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.421e+00", "anc_loss": "1.515e+00", "dlm_acc": "5.640e-01", "anc_acc": "5.402e-01", "epoch": 0.03973} {"step": 19870, "loss": 1.2765, "grad_norm": "4.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.031e+00", "anc_loss": "2.078e+00", "dlm_acc": "2.240e-01", "anc_acc": "2.145e-01", "epoch": 0.03974} {"step": 19875, "loss": 0.8943, "grad_norm": "3.958e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.353e+00", "dlm_acc": "3.868e-01", "anc_acc": "3.646e-01", "epoch": 0.03975} {"step": 19880, "loss": 1.1579, "grad_norm": "4.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.685e+00", "anc_loss": "1.770e+00", "dlm_acc": "4.753e-01", "anc_acc": "4.575e-01", "epoch": 0.03976} {"step": 19885, "loss": 1.0438, "grad_norm": "2.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.434e-01", "anc_acc": "5.286e-01", "epoch": 0.03977} {"step": 19890, "loss": 0.7475, "grad_norm": "3.759e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.838e-01", "anc_loss": "1.964e-01", "dlm_acc": "8.643e-01", "anc_acc": "8.582e-01", "epoch": 0.03978} {"step": 19895, "loss": 1.066, "grad_norm": "3.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.638e-01", "anc_loss": "1.728e-01", "dlm_acc": "8.962e-01", "anc_acc": "8.911e-01", "epoch": 0.03979} {"step": 19900, "loss": 0.9589, "grad_norm": "2.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.020e-01", "anc_loss": "1.128e-01", "dlm_acc": "9.322e-01", "anc_acc": "9.257e-01", "epoch": 0.0398} {"step": 19905, "loss": 0.8626, "grad_norm": "3.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e-01", "anc_loss": "1.272e-01", "dlm_acc": "9.177e-01", "anc_acc": "9.094e-01", "epoch": 0.03981} {"step": 19910, "loss": 0.8265, "grad_norm": "3.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.662e-01", "anc_loss": "1.856e-01", "dlm_acc": "8.862e-01", "anc_acc": "8.770e-01", "epoch": 0.03982} {"step": 19915, "loss": 1.2275, "grad_norm": "3.547e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.250e+00", "dlm_acc": "5.839e-01", "anc_acc": "5.655e-01", "epoch": 0.03983} {"step": 19920, "loss": 1.0412, "grad_norm": "2.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.398e+00", "anc_loss": "1.511e+00", "dlm_acc": "4.934e-01", "anc_acc": "4.632e-01", "epoch": 0.03984} {"step": 19925, "loss": 0.8728, "grad_norm": "2.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.832e-01", "anc_loss": "1.060e+00", "dlm_acc": "6.371e-01", "anc_acc": "6.169e-01", "epoch": 0.03985} {"step": 19930, "loss": 0.7996, "grad_norm": "2.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.045e-01", "anc_loss": "7.746e-01", "dlm_acc": "7.444e-01", "anc_acc": "7.246e-01", "epoch": 0.03986} {"step": 19935, "loss": 1.1096, "grad_norm": "4.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.620e-01", "anc_acc": "5.438e-01", "epoch": 0.03987} {"step": 19940, "loss": 1.2011, "grad_norm": "2.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.471e+00", "anc_loss": "1.551e+00", "dlm_acc": "4.860e-01", "anc_acc": "4.630e-01", "epoch": 0.03988} {"step": 19945, "loss": 1.1675, "grad_norm": "1.072e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.328e-01", "anc_loss": "8.043e-01", "dlm_acc": "6.928e-01", "anc_acc": "6.730e-01", "epoch": 0.03989} {"step": 19950, "loss": 1.6669, "grad_norm": "2.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.260e+00", "anc_loss": "2.281e+00", "dlm_acc": "1.499e-01", "anc_acc": "1.473e-01", "epoch": 0.0399} {"step": 19955, "loss": 2.3087, "grad_norm": "4.728e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.961e+00", "anc_loss": "2.972e+00", "dlm_acc": "2.244e-02", "anc_acc": "2.104e-02", "epoch": 0.03991} {"step": 19960, "loss": 1.5003, "grad_norm": "3.432e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.383e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.286e-01", "anc_acc": "5.103e-01", "epoch": 0.03992} {"step": 19965, "loss": 1.2915, "grad_norm": "1.148e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.914e-01", "anc_loss": "1.091e+00", "dlm_acc": "5.553e-01", "anc_acc": "5.230e-01", "epoch": 0.03993} {"step": 19970, "loss": 1.3166, "grad_norm": "2.846e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.246e+00", "dlm_acc": "4.714e-01", "anc_acc": "4.587e-01", "epoch": 0.03994} {"step": 19975, "loss": 1.2, "grad_norm": "3.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.046e+00", "anc_loss": "1.122e+00", "dlm_acc": "5.699e-01", "anc_acc": "5.519e-01", "epoch": 0.03995} {"step": 19980, "loss": 1.5474, "grad_norm": "2.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.644e+00", "dlm_acc": "5.121e-01", "anc_acc": "4.902e-01", "epoch": 0.03996} {"step": 19985, "loss": 0.9855, "grad_norm": "2.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.688e-01", "anc_loss": "1.047e+00", "dlm_acc": "5.965e-01", "anc_acc": "5.773e-01", "epoch": 0.03997} {"step": 19990, "loss": 1.7031, "grad_norm": "2.928e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.368e-01", "anc_acc": "5.130e-01", "epoch": 0.03998} {"step": 19995, "loss": 1.3195, "grad_norm": "4.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.529e+00", "anc_loss": "1.625e+00", "dlm_acc": "4.852e-01", "anc_acc": "4.646e-01", "epoch": 0.03999} {"step": 20000, "loss": 1.2269, "grad_norm": "5.237e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.520e+00", "dlm_acc": "5.143e-01", "anc_acc": "4.948e-01", "epoch": 0.04} {"step": 20005, "loss": 1.1364, "grad_norm": "2.482e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.538e-01", "anc_acc": "5.315e-01", "epoch": 0.04001} {"step": 20010, "loss": 1.157, "grad_norm": "1.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.343e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.248e-01", "anc_acc": "5.036e-01", "epoch": 0.04002} {"step": 20015, "loss": 1.2644, "grad_norm": "6.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.788e+00", "anc_loss": "1.884e+00", "dlm_acc": "4.663e-01", "anc_acc": "4.477e-01", "epoch": 0.04003} {"step": 20020, "loss": 1.6309, "grad_norm": "4.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.483e+00", "anc_loss": "1.580e+00", "dlm_acc": "5.107e-01", "anc_acc": "4.913e-01", "epoch": 0.04004} {"step": 20025, "loss": 1.0832, "grad_norm": "4.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.350e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.389e-01", "anc_acc": "5.167e-01", "epoch": 0.04005} {"step": 20030, "loss": 1.2219, "grad_norm": "1.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.473e-01", "anc_loss": "9.207e-01", "dlm_acc": "6.665e-01", "anc_acc": "6.453e-01", "epoch": 0.04006} {"step": 20035, "loss": 1.3861, "grad_norm": "5.362e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.397e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.246e-01", "anc_acc": "5.054e-01", "epoch": 0.04007} {"step": 20040, "loss": 1.44, "grad_norm": "3.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.004e-01", "anc_acc": "4.806e-01", "epoch": 0.04008} {"step": 20045, "loss": 1.6433, "grad_norm": "4.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e+00", "anc_loss": "1.759e+00", "dlm_acc": "4.973e-01", "anc_acc": "4.771e-01", "epoch": 0.04009} {"step": 20050, "loss": 1.6333, "grad_norm": "5.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.570e+00", "anc_loss": "1.659e+00", "dlm_acc": "5.138e-01", "anc_acc": "4.969e-01", "epoch": 0.0401} {"step": 20055, "loss": 1.984, "grad_norm": "5.560e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.916e+00", "anc_loss": "2.020e+00", "dlm_acc": "4.228e-01", "anc_acc": "4.023e-01", "epoch": 0.04011} {"step": 20060, "loss": 1.3712, "grad_norm": "1.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.676e-01", "anc_acc": "5.421e-01", "epoch": 0.04012} {"step": 20065, "loss": 1.5862, "grad_norm": "4.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.393e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.223e-01", "anc_acc": "5.027e-01", "epoch": 0.04013} {"step": 20070, "loss": 1.6578, "grad_norm": "2.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.321e+00", "anc_loss": "1.407e+00", "dlm_acc": "5.328e-01", "anc_acc": "5.142e-01", "epoch": 0.04014} {"step": 20075, "loss": 1.6336, "grad_norm": "2.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.446e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.778e-01", "anc_acc": "5.590e-01", "epoch": 0.04015} {"step": 20080, "loss": 1.5349, "grad_norm": "3.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.359e+00", "dlm_acc": "6.091e-01", "anc_acc": "5.856e-01", "epoch": 0.04016} {"step": 20085, "loss": 1.9165, "grad_norm": "5.191e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.618e+00", "anc_loss": "1.725e+00", "dlm_acc": "5.220e-01", "anc_acc": "5.007e-01", "epoch": 0.04017} {"step": 20090, "loss": 1.5208, "grad_norm": "2.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.188e+00", "dlm_acc": "5.267e-01", "anc_acc": "5.058e-01", "epoch": 0.04018} {"step": 20095, "loss": 1.5534, "grad_norm": "3.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.531e+00", "anc_loss": "1.622e+00", "dlm_acc": "5.319e-01", "anc_acc": "5.100e-01", "epoch": 0.04019} {"step": 20100, "loss": 1.5389, "grad_norm": "4.470e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.562e+00", "anc_loss": "1.655e+00", "dlm_acc": "5.080e-01", "anc_acc": "4.898e-01", "epoch": 0.0402} {"step": 20105, "loss": 1.396, "grad_norm": "3.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.248e+00", "dlm_acc": "5.923e-01", "anc_acc": "5.720e-01", "epoch": 0.04021} {"step": 20110, "loss": 1.4824, "grad_norm": "3.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.087e-01", "anc_acc": "4.869e-01", "epoch": 0.04022} {"step": 20115, "loss": 1.5987, "grad_norm": "3.431e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.636e+00", "anc_loss": "1.739e+00", "dlm_acc": "4.780e-01", "anc_acc": "4.600e-01", "epoch": 0.04023} {"step": 20120, "loss": 1.2875, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.520e+00", "anc_loss": "1.603e+00", "dlm_acc": "4.894e-01", "anc_acc": "4.688e-01", "epoch": 0.04024} {"step": 20125, "loss": 1.5374, "grad_norm": "4.462e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.708e+00", "anc_loss": "1.822e+00", "dlm_acc": "4.840e-01", "anc_acc": "4.619e-01", "epoch": 0.04025} {"step": 20130, "loss": 1.6181, "grad_norm": "3.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.689e+00", "anc_loss": "1.792e+00", "dlm_acc": "5.008e-01", "anc_acc": "4.829e-01", "epoch": 0.04026} {"step": 20135, "loss": 1.3863, "grad_norm": "3.333e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.219e+00", "dlm_acc": "5.736e-01", "anc_acc": "5.506e-01", "epoch": 0.04027} {"step": 20140, "loss": 1.574, "grad_norm": "6.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.669e+00", "anc_loss": "1.764e+00", "dlm_acc": "5.001e-01", "anc_acc": "4.831e-01", "epoch": 0.04028} {"step": 20145, "loss": 1.513, "grad_norm": "3.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.600e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.229e-01", "epoch": 0.04029} {"step": 20150, "loss": 1.4626, "grad_norm": "5.450e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.298e-01", "anc_acc": "5.063e-01", "epoch": 0.0403} {"step": 20155, "loss": 1.3915, "grad_norm": "3.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.611e-01", "anc_acc": "5.451e-01", "epoch": 0.04031} {"step": 20160, "loss": 1.6042, "grad_norm": "5.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.698e+00", "dlm_acc": "5.015e-01", "anc_acc": "4.816e-01", "epoch": 0.04032} {"step": 20165, "loss": 1.3365, "grad_norm": "2.911e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.601e-01", "epoch": 0.04033} {"step": 20170, "loss": 1.4634, "grad_norm": "4.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.573e+00", "dlm_acc": "5.537e-01", "anc_acc": "5.360e-01", "epoch": 0.04034} {"step": 20175, "loss": 1.3377, "grad_norm": "3.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.057e-01", "anc_acc": "4.762e-01", "epoch": 0.04035} {"step": 20180, "loss": 1.2697, "grad_norm": "6.559e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.410e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.605e-01", "anc_acc": "5.397e-01", "epoch": 0.04036} {"step": 20185, "loss": 1.1196, "grad_norm": "2.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.151e+00", "anc_loss": "1.246e+00", "dlm_acc": "5.855e-01", "anc_acc": "5.657e-01", "epoch": 0.04037} {"step": 20190, "loss": 1.189, "grad_norm": "2.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.326e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.466e-01", "anc_acc": "5.276e-01", "epoch": 0.04038} {"step": 20195, "loss": 1.4522, "grad_norm": "3.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.687e+00", "dlm_acc": "4.998e-01", "anc_acc": "4.771e-01", "epoch": 0.04039} {"step": 20200, "loss": 1.0079, "grad_norm": "4.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.902e-01", "anc_loss": "1.060e+00", "dlm_acc": "6.004e-01", "anc_acc": "5.820e-01", "epoch": 0.0404} {"step": 20205, "loss": 1.486, "grad_norm": "3.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.716e+00", "dlm_acc": "4.906e-01", "anc_acc": "4.688e-01", "epoch": 0.04041} {"step": 20210, "loss": 1.3178, "grad_norm": "1.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.487e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.236e-01", "epoch": 0.04042} {"step": 20215, "loss": 1.023, "grad_norm": "4.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.024e+00", "anc_loss": "1.115e+00", "dlm_acc": "6.411e-01", "anc_acc": "6.195e-01", "epoch": 0.04043} {"step": 20220, "loss": 1.0748, "grad_norm": "6.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.326e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.613e-01", "anc_acc": "5.408e-01", "epoch": 0.04044} {"step": 20225, "loss": 0.8504, "grad_norm": "3.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.470e-01", "anc_loss": "8.197e-01", "dlm_acc": "7.010e-01", "anc_acc": "6.790e-01", "epoch": 0.04045} {"step": 20230, "loss": 1.2747, "grad_norm": "1.225e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.304e+00", "dlm_acc": "6.142e-01", "anc_acc": "5.910e-01", "epoch": 0.04046} {"step": 20235, "loss": 1.0589, "grad_norm": "2.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.374e+00", "dlm_acc": "5.479e-01", "anc_acc": "5.253e-01", "epoch": 0.04047} {"step": 20240, "loss": 1.2447, "grad_norm": "2.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.260e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.582e-01", "epoch": 0.04048} {"step": 20245, "loss": 0.8994, "grad_norm": "2.880e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.797e-01", "anc_loss": "1.058e+00", "dlm_acc": "6.186e-01", "anc_acc": "5.980e-01", "epoch": 0.04049} {"step": 20250, "loss": 0.9794, "grad_norm": "3.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.539e+00", "dlm_acc": "5.523e-01", "anc_acc": "5.292e-01", "epoch": 0.0405} {"step": 20255, "loss": 1.178, "grad_norm": "1.102e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.522e+00", "dlm_acc": "5.011e-01", "anc_acc": "4.823e-01", "epoch": 0.04051} {"step": 20260, "loss": 0.6447, "grad_norm": "3.395e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.253e+00", "dlm_acc": "5.967e-01", "anc_acc": "5.747e-01", "epoch": 0.04052} {"step": 20265, "loss": 1.1059, "grad_norm": "3.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.497e+00", "anc_loss": "1.591e+00", "dlm_acc": "5.272e-01", "anc_acc": "5.095e-01", "epoch": 0.04053} {"step": 20270, "loss": 1.055, "grad_norm": "2.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.096e+00", "dlm_acc": "6.555e-01", "anc_acc": "6.374e-01", "epoch": 0.04054} {"step": 20275, "loss": 1.0586, "grad_norm": "2.690e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.329e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.229e-01", "epoch": 0.04055} {"step": 20280, "loss": 1.2582, "grad_norm": "3.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.412e+00", "dlm_acc": "5.431e-01", "anc_acc": "5.219e-01", "epoch": 0.04056} {"step": 20285, "loss": 1.6167, "grad_norm": "1.419e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.611e+00", "anc_loss": "1.687e+00", "dlm_acc": "5.646e-01", "anc_acc": "5.497e-01", "epoch": 0.04057} {"step": 20290, "loss": 0.7153, "grad_norm": "4.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.980e-01", "anc_loss": "8.672e-01", "dlm_acc": "6.280e-01", "anc_acc": "6.024e-01", "epoch": 0.04058} {"step": 20295, "loss": 1.1698, "grad_norm": "2.131e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.810e-01", "anc_acc": "5.610e-01", "epoch": 0.04059} {"step": 20300, "loss": 1.2748, "grad_norm": "4.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.231e-01", "anc_loss": "4.448e-01", "dlm_acc": "7.628e-01", "anc_acc": "7.528e-01", "epoch": 0.0406} {"step": 20305, "loss": 1.4913, "grad_norm": "3.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.914e-01", "anc_loss": "8.094e-01", "dlm_acc": "5.933e-01", "anc_acc": "5.895e-01", "epoch": 0.04061} {"step": 20310, "loss": 0.9707, "grad_norm": "2.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.619e-01", "anc_loss": "8.272e-01", "dlm_acc": "6.920e-01", "anc_acc": "6.777e-01", "epoch": 0.04062} {"step": 20315, "loss": 1.5207, "grad_norm": "5.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.360e+00", "anc_loss": "1.444e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.511e-01", "epoch": 0.04063} {"step": 20320, "loss": 1.0922, "grad_norm": "4.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.961e-01", "anc_acc": "5.768e-01", "epoch": 0.04064} {"step": 20325, "loss": 1.1815, "grad_norm": "2.774e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.379e-01", "epoch": 0.04065} {"step": 20330, "loss": 0.9779, "grad_norm": "3.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.281e+00", "dlm_acc": "5.960e-01", "anc_acc": "5.768e-01", "epoch": 0.04066} {"step": 20335, "loss": 1.0994, "grad_norm": "2.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.836e-01", "anc_loss": "1.042e+00", "dlm_acc": "5.154e-01", "anc_acc": "5.020e-01", "epoch": 0.04067} {"step": 20340, "loss": 1.2499, "grad_norm": "3.049e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.834e-01", "anc_acc": "5.632e-01", "epoch": 0.04068} {"step": 20345, "loss": 0.7129, "grad_norm": "3.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.587e-02", "anc_loss": "6.380e-02", "dlm_acc": "9.699e-01", "anc_acc": "9.670e-01", "epoch": 0.04069} {"step": 20350, "loss": 0.9982, "grad_norm": "2.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.058e+00", "anc_loss": "1.128e+00", "dlm_acc": "5.994e-01", "anc_acc": "5.794e-01", "epoch": 0.0407} {"step": 20355, "loss": 1.2703, "grad_norm": "2.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.647e+00", "dlm_acc": "5.018e-01", "anc_acc": "4.823e-01", "epoch": 0.04071} {"step": 20360, "loss": 1.0478, "grad_norm": "1.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.686e-01", "anc_loss": "7.219e-01", "dlm_acc": "7.159e-01", "anc_acc": "7.005e-01", "epoch": 0.04072} {"step": 20365, "loss": 0.9614, "grad_norm": "3.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.750e-01", "anc_loss": "8.371e-01", "dlm_acc": "6.588e-01", "anc_acc": "6.397e-01", "epoch": 0.04073} {"step": 20370, "loss": 1.5629, "grad_norm": "3.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.259e-01", "epoch": 0.04074} {"step": 20375, "loss": 1.5814, "grad_norm": "3.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.060e+00", "dlm_acc": "6.475e-01", "anc_acc": "6.383e-01", "epoch": 0.04075} {"step": 20380, "loss": 1.3215, "grad_norm": "5.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.877e-01", "anc_loss": "7.172e-01", "dlm_acc": "7.545e-01", "anc_acc": "7.452e-01", "epoch": 0.04076} {"step": 20385, "loss": 1.3226, "grad_norm": "9.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.079e+00", "anc_loss": "1.136e+00", "dlm_acc": "6.308e-01", "anc_acc": "6.185e-01", "epoch": 0.04077} {"step": 20390, "loss": 0.8264, "grad_norm": "2.430e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.070e-01", "anc_loss": "9.992e-01", "dlm_acc": "6.415e-01", "anc_acc": "6.197e-01", "epoch": 0.04078} {"step": 20395, "loss": 0.9472, "grad_norm": "2.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.172e-01", "anc_loss": "8.898e-01", "dlm_acc": "6.671e-01", "anc_acc": "6.454e-01", "epoch": 0.04079} {"step": 20400, "loss": 1.1958, "grad_norm": "5.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.500e-01", "anc_loss": "1.011e+00", "dlm_acc": "6.729e-01", "anc_acc": "6.563e-01", "epoch": 0.0408} {"step": 20405, "loss": 0.868, "grad_norm": "3.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.619e-01", "anc_loss": "4.943e-01", "dlm_acc": "7.531e-01", "anc_acc": "7.430e-01", "epoch": 0.04081} {"step": 20410, "loss": 1.0179, "grad_norm": "3.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.332e-01", "anc_loss": "6.379e-01", "dlm_acc": "6.154e-01", "anc_acc": "6.138e-01", "epoch": 0.04082} {"step": 20415, "loss": 0.9979, "grad_norm": "2.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.391e-01", "anc_loss": "5.445e-01", "dlm_acc": "6.376e-01", "anc_acc": "6.340e-01", "epoch": 0.04083} {"step": 20420, "loss": 1.0641, "grad_norm": "3.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.473e-01", "anc_loss": "6.504e-01", "dlm_acc": "6.208e-01", "anc_acc": "6.174e-01", "epoch": 0.04084} {"step": 20425, "loss": 0.905, "grad_norm": "1.837e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.340e-01", "anc_loss": "5.395e-01", "dlm_acc": "6.374e-01", "anc_acc": "6.335e-01", "epoch": 0.04085} {"step": 20430, "loss": 0.5991, "grad_norm": "1.191e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.512e-01", "anc_loss": "5.980e-01", "dlm_acc": "7.282e-01", "anc_acc": "7.167e-01", "epoch": 0.04086} {"step": 20435, "loss": 1.3252, "grad_norm": "4.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.465e-01", "anc_loss": "9.979e-01", "dlm_acc": "6.621e-01", "anc_acc": "6.499e-01", "epoch": 0.04087} {"step": 20440, "loss": 0.9375, "grad_norm": "3.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.512e-01", "anc_loss": "5.797e-01", "dlm_acc": "6.957e-01", "anc_acc": "6.845e-01", "epoch": 0.04088} {"step": 20445, "loss": 1.1196, "grad_norm": "2.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.273e-01", "anc_loss": "9.895e-01", "dlm_acc": "6.226e-01", "anc_acc": "6.037e-01", "epoch": 0.04089} {"step": 20450, "loss": 0.9843, "grad_norm": "2.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.001e-01", "anc_loss": "7.580e-01", "dlm_acc": "7.599e-01", "anc_acc": "7.451e-01", "epoch": 0.0409} {"step": 20455, "loss": 1.0476, "grad_norm": "3.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.398e-01", "anc_loss": "6.609e-01", "dlm_acc": "5.403e-01", "anc_acc": "5.299e-01", "epoch": 0.04091} {"step": 20460, "loss": 0.9185, "grad_norm": "5.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.904e-01", "anc_loss": "8.299e-01", "dlm_acc": "6.320e-01", "anc_acc": "6.201e-01", "epoch": 0.04092} {"step": 20465, "loss": 1.0499, "grad_norm": "2.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.750e-01", "anc_loss": "7.305e-01", "dlm_acc": "7.199e-01", "anc_acc": "7.068e-01", "epoch": 0.04093} {"step": 20470, "loss": 1.3025, "grad_norm": "3.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.056e+00", "dlm_acc": "5.308e-01", "anc_acc": "5.173e-01", "epoch": 0.04094} {"step": 20475, "loss": 0.8348, "grad_norm": "3.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.576e-01", "anc_loss": "4.866e-01", "dlm_acc": "8.284e-01", "anc_acc": "8.198e-01", "epoch": 0.04095} {"step": 20480, "loss": 1.0371, "grad_norm": "3.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.512e-01", "anc_loss": "1.001e+00", "dlm_acc": "6.107e-01", "anc_acc": "5.992e-01", "epoch": 0.04096} {"step": 20485, "loss": 1.0284, "grad_norm": "7.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.523e-01", "anc_loss": "8.128e-01", "dlm_acc": "6.989e-01", "anc_acc": "6.835e-01", "epoch": 0.04097} {"step": 20490, "loss": 1.0758, "grad_norm": "2.379e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.103e-01", "anc_loss": "9.799e-01", "dlm_acc": "6.146e-01", "anc_acc": "5.955e-01", "epoch": 0.04098} {"step": 20495, "loss": 0.9292, "grad_norm": "2.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.352e-01", "anc_loss": "4.628e-01", "dlm_acc": "8.267e-01", "anc_acc": "8.212e-01", "epoch": 0.04099} {"step": 20500, "loss": 1.3967, "grad_norm": "2.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.106e+00", "dlm_acc": "6.654e-01", "anc_acc": "6.541e-01", "epoch": 0.041} {"step": 20505, "loss": 1.679, "grad_norm": "3.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.019e+00", "anc_loss": "2.061e+00", "dlm_acc": "2.861e-01", "anc_acc": "2.754e-01", "epoch": 0.04101} {"step": 20510, "loss": 1.4369, "grad_norm": "2.709e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.190e+00", "dlm_acc": "6.228e-01", "anc_acc": "6.070e-01", "epoch": 0.04102} {"step": 20515, "loss": 1.1645, "grad_norm": "4.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.738e-01", "anc_loss": "1.055e+00", "dlm_acc": "6.475e-01", "anc_acc": "6.262e-01", "epoch": 0.04103} {"step": 20520, "loss": 1.1037, "grad_norm": "3.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.203e-01", "anc_acc": "4.988e-01", "epoch": 0.04104} {"step": 20525, "loss": 1.4142, "grad_norm": "3.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.630e+00", "anc_loss": "1.739e+00", "dlm_acc": "4.939e-01", "anc_acc": "4.720e-01", "epoch": 0.04105} {"step": 20530, "loss": 1.6103, "grad_norm": "3.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.435e+00", "anc_loss": "1.525e+00", "dlm_acc": "5.434e-01", "anc_acc": "5.205e-01", "epoch": 0.04106} {"step": 20535, "loss": 1.2971, "grad_norm": "3.734e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.573e-01", "anc_acc": "5.335e-01", "epoch": 0.04107} {"step": 20540, "loss": 1.0672, "grad_norm": "3.560e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.122e+00", "anc_loss": "1.206e+00", "dlm_acc": "6.245e-01", "anc_acc": "6.071e-01", "epoch": 0.04108} {"step": 20545, "loss": 0.8388, "grad_norm": "2.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.879e-01", "anc_loss": "2.137e-01", "dlm_acc": "8.657e-01", "anc_acc": "8.513e-01", "epoch": 0.04109} {"step": 20550, "loss": 0.9945, "grad_norm": "2.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.451e-01", "anc_loss": "2.852e-01", "dlm_acc": "8.358e-01", "anc_acc": "8.148e-01", "epoch": 0.0411} {"step": 20555, "loss": 1.0754, "grad_norm": "3.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.883e-01", "anc_loss": "6.500e-01", "dlm_acc": "7.586e-01", "anc_acc": "7.422e-01", "epoch": 0.04111} {"step": 20560, "loss": 1.5612, "grad_norm": "4.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.634e+00", "anc_loss": "1.744e+00", "dlm_acc": "4.984e-01", "anc_acc": "4.771e-01", "epoch": 0.04112} {"step": 20565, "loss": 1.2739, "grad_norm": "2.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.613e-01", "anc_acc": "5.408e-01", "epoch": 0.04113} {"step": 20570, "loss": 1.4569, "grad_norm": "1.521e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.510e-01", "anc_acc": "5.306e-01", "epoch": 0.04114} {"step": 20575, "loss": 1.818, "grad_norm": "9.388e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.639e-01", "anc_acc": "5.432e-01", "epoch": 0.04115} {"step": 20580, "loss": 0.7253, "grad_norm": "2.898e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.156e-01", "anc_loss": "5.473e-01", "dlm_acc": "6.153e-01", "anc_acc": "5.967e-01", "epoch": 0.04116} {"step": 20585, "loss": 1.038, "grad_norm": "2.217e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.284e+00", "dlm_acc": "5.621e-01", "anc_acc": "5.360e-01", "epoch": 0.04117} {"step": 20590, "loss": 1.0512, "grad_norm": "2.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.219e+00", "dlm_acc": "6.059e-01", "anc_acc": "5.834e-01", "epoch": 0.04118} {"step": 20595, "loss": 1.2692, "grad_norm": "2.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.556e+00", "anc_loss": "1.580e+00", "dlm_acc": "5.014e-01", "anc_acc": "4.792e-01", "epoch": 0.04119} {"step": 20600, "loss": 1.4364, "grad_norm": "4.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.559e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.850e-01", "epoch": 0.0412} {"step": 20605, "loss": 1.3381, "grad_norm": "3.267e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.407e+00", "anc_loss": "1.522e+00", "dlm_acc": "5.551e-01", "anc_acc": "5.323e-01", "epoch": 0.04121} {"step": 20610, "loss": 0.8942, "grad_norm": "2.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.097e+00", "anc_loss": "1.188e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.276e-01", "epoch": 0.04122} {"step": 20615, "loss": 1.2315, "grad_norm": "2.623e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.301e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.980e-01", "anc_acc": "5.781e-01", "epoch": 0.04123} {"step": 20620, "loss": 1.2994, "grad_norm": "3.678e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.817e+00", "anc_loss": "1.898e+00", "dlm_acc": "3.904e-01", "anc_acc": "3.742e-01", "epoch": 0.04124} {"step": 20625, "loss": 1.2524, "grad_norm": "4.795e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.644e+00", "anc_loss": "1.736e+00", "dlm_acc": "4.771e-01", "anc_acc": "4.567e-01", "epoch": 0.04125} {"step": 20630, "loss": 0.9998, "grad_norm": "3.832e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.258e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.747e-01", "anc_acc": "5.534e-01", "epoch": 0.04126} {"step": 20635, "loss": 0.9936, "grad_norm": "4.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.852e-01", "anc_loss": "7.410e-01", "dlm_acc": "6.365e-01", "anc_acc": "6.182e-01", "epoch": 0.04127} {"step": 20640, "loss": 1.64, "grad_norm": "4.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.293e+00", "dlm_acc": "5.964e-01", "anc_acc": "5.750e-01", "epoch": 0.04128} {"step": 20645, "loss": 1.7706, "grad_norm": "2.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.727e+00", "anc_loss": "1.787e+00", "dlm_acc": "3.221e-01", "anc_acc": "3.128e-01", "epoch": 0.04129} {"step": 20650, "loss": 1.0215, "grad_norm": "2.516e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.229e+00", "dlm_acc": "5.251e-01", "anc_acc": "5.026e-01", "epoch": 0.0413} {"step": 20655, "loss": 1.1329, "grad_norm": "3.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.509e-01", "anc_acc": "5.291e-01", "epoch": 0.04131} {"step": 20660, "loss": 0.8725, "grad_norm": "2.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.758e-01", "anc_loss": "1.061e+00", "dlm_acc": "6.126e-01", "anc_acc": "5.887e-01", "epoch": 0.04132} {"step": 20665, "loss": 1.2509, "grad_norm": "3.431e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.093e+00", "dlm_acc": "6.289e-01", "anc_acc": "6.109e-01", "epoch": 0.04133} {"step": 20670, "loss": 1.8454, "grad_norm": "2.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.459e+00", "anc_loss": "1.555e+00", "dlm_acc": "5.037e-01", "anc_acc": "4.829e-01", "epoch": 0.04134} {"step": 20675, "loss": 1.2871, "grad_norm": "3.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.364e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.322e-01", "anc_acc": "5.099e-01", "epoch": 0.04135} {"step": 20680, "loss": 1.0271, "grad_norm": "3.544e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.479e-01", "anc_loss": "1.037e+00", "dlm_acc": "6.511e-01", "anc_acc": "6.301e-01", "epoch": 0.04136} {"step": 20685, "loss": 1.477, "grad_norm": "2.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.577e+00", "anc_loss": "1.695e+00", "dlm_acc": "5.274e-01", "anc_acc": "5.053e-01", "epoch": 0.04137} {"step": 20690, "loss": 1.1956, "grad_norm": "2.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.875e-01", "anc_acc": "5.678e-01", "epoch": 0.04138} {"step": 20695, "loss": 1.6888, "grad_norm": "7.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.706e-01", "anc_acc": "5.467e-01", "epoch": 0.04139} {"step": 20700, "loss": 1.8469, "grad_norm": "4.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.287e+00", "dlm_acc": "6.074e-01", "anc_acc": "5.843e-01", "epoch": 0.0414} {"step": 20705, "loss": 1.6175, "grad_norm": "4.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.568e+00", "anc_loss": "1.679e+00", "dlm_acc": "5.198e-01", "anc_acc": "4.990e-01", "epoch": 0.04141} {"step": 20710, "loss": 1.2074, "grad_norm": "5.108e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.121e-01", "anc_acc": "4.927e-01", "epoch": 0.04142} {"step": 20715, "loss": 1.0928, "grad_norm": "4.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.141e+00", "dlm_acc": "5.937e-01", "anc_acc": "5.686e-01", "epoch": 0.04143} {"step": 20720, "loss": 1.4739, "grad_norm": "2.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.562e+00", "dlm_acc": "5.082e-01", "anc_acc": "4.867e-01", "epoch": 0.04144} {"step": 20725, "loss": 1.2704, "grad_norm": "2.074e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.346e+00", "anc_loss": "1.446e+00", "dlm_acc": "5.351e-01", "anc_acc": "5.123e-01", "epoch": 0.04145} {"step": 20730, "loss": 0.975, "grad_norm": "2.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.555e-01", "anc_loss": "9.375e-01", "dlm_acc": "6.505e-01", "anc_acc": "6.291e-01", "epoch": 0.04146} {"step": 20735, "loss": 1.2166, "grad_norm": "3.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.175e+00", "dlm_acc": "6.325e-01", "anc_acc": "6.135e-01", "epoch": 0.04147} {"step": 20740, "loss": 0.7462, "grad_norm": "3.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.473e-01", "anc_loss": "8.164e-01", "dlm_acc": "7.012e-01", "anc_acc": "6.802e-01", "epoch": 0.04148} {"step": 20745, "loss": 1.3033, "grad_norm": "2.601e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.226e+00", "anc_loss": "1.335e+00", "dlm_acc": "5.691e-01", "anc_acc": "5.445e-01", "epoch": 0.04149} {"step": 20750, "loss": 1.4583, "grad_norm": "2.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.425e-01", "anc_acc": "5.205e-01", "epoch": 0.0415} {"step": 20755, "loss": 1.1225, "grad_norm": "4.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.938e-01", "anc_acc": "5.716e-01", "epoch": 0.04151} {"step": 20760, "loss": 1.4104, "grad_norm": "3.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.482e+00", "dlm_acc": "5.586e-01", "anc_acc": "5.371e-01", "epoch": 0.04152} {"step": 20765, "loss": 1.7866, "grad_norm": "3.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.442e-01", "anc_acc": "5.218e-01", "epoch": 0.04153} {"step": 20770, "loss": 1.2046, "grad_norm": "5.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.466e-01", "anc_acc": "5.218e-01", "epoch": 0.04154} {"step": 20775, "loss": 0.9435, "grad_norm": "7.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.422e-01", "anc_loss": "9.477e-01", "dlm_acc": "3.539e-01", "anc_acc": "3.536e-01", "epoch": 0.04155} {"step": 20780, "loss": 1.1147, "grad_norm": "4.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.007e+00", "dlm_acc": "3.329e-01", "anc_acc": "3.322e-01", "epoch": 0.04156} {"step": 20785, "loss": 1.3084, "grad_norm": "4.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.122e+00", "dlm_acc": "3.272e-01", "anc_acc": "3.242e-01", "epoch": 0.04157} {"step": 20790, "loss": 1.6485, "grad_norm": "5.508e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.311e+00", "dlm_acc": "3.261e-01", "anc_acc": "3.257e-01", "epoch": 0.04158} {"step": 20795, "loss": 1.309, "grad_norm": "4.953e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.234e+00", "dlm_acc": "3.881e-01", "anc_acc": "3.796e-01", "epoch": 0.04159} {"step": 20800, "loss": 1.9352, "grad_norm": "4.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.472e+00", "anc_loss": "1.580e+00", "dlm_acc": "5.285e-01", "anc_acc": "5.048e-01", "epoch": 0.0416} {"step": 20805, "loss": 1.7627, "grad_norm": "4.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.581e+00", "anc_loss": "1.680e+00", "dlm_acc": "5.213e-01", "anc_acc": "5.016e-01", "epoch": 0.04161} {"step": 20810, "loss": 1.0931, "grad_norm": "2.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.308e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.374e-01", "epoch": 0.04162} {"step": 20815, "loss": 1.3103, "grad_norm": "4.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.170e-01", "anc_acc": "4.967e-01", "epoch": 0.04163} {"step": 20820, "loss": 1.0943, "grad_norm": "3.518e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.604e-01", "anc_acc": "5.419e-01", "epoch": 0.04164} {"step": 20825, "loss": 1.2925, "grad_norm": "5.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.335e+00", "dlm_acc": "5.531e-01", "anc_acc": "5.241e-01", "epoch": 0.04165} {"step": 20830, "loss": 1.0949, "grad_norm": "2.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.454e-01", "anc_acc": "5.213e-01", "epoch": 0.04166} {"step": 20835, "loss": 1.5852, "grad_norm": "5.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.445e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.337e-01", "epoch": 0.04167} {"step": 20840, "loss": 1.2125, "grad_norm": "6.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.225e+00", "dlm_acc": "6.011e-01", "anc_acc": "5.834e-01", "epoch": 0.04168} {"step": 20845, "loss": 1.1889, "grad_norm": "3.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.190e+00", "dlm_acc": "5.496e-01", "anc_acc": "5.266e-01", "epoch": 0.04169} {"step": 20850, "loss": 1.1404, "grad_norm": "2.987e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.233e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.621e-01", "anc_acc": "5.375e-01", "epoch": 0.0417} {"step": 20855, "loss": 1.2146, "grad_norm": "3.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.243e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.729e-01", "anc_acc": "5.505e-01", "epoch": 0.04171} {"step": 20860, "loss": 1.4254, "grad_norm": "3.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.303e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.694e-01", "epoch": 0.04172} {"step": 20865, "loss": 0.9927, "grad_norm": "3.437e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.099e+00", "dlm_acc": "6.377e-01", "anc_acc": "6.153e-01", "epoch": 0.04173} {"step": 20870, "loss": 1.3551, "grad_norm": "3.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.641e+00", "anc_loss": "1.752e+00", "dlm_acc": "5.041e-01", "anc_acc": "4.815e-01", "epoch": 0.04174} {"step": 20875, "loss": 1.109, "grad_norm": "1.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.195e+00", "dlm_acc": "6.305e-01", "anc_acc": "6.043e-01", "epoch": 0.04175} {"step": 20880, "loss": 1.0966, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.260e+00", "dlm_acc": "6.108e-01", "anc_acc": "5.887e-01", "epoch": 0.04176} {"step": 20885, "loss": 1.4553, "grad_norm": "2.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.733e-01", "anc_acc": "5.498e-01", "epoch": 0.04177} {"step": 20890, "loss": 1.4563, "grad_norm": "4.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.769e+00", "anc_loss": "1.873e+00", "dlm_acc": "4.654e-01", "anc_acc": "4.443e-01", "epoch": 0.04178} {"step": 20895, "loss": 1.41, "grad_norm": "4.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.556e+00", "anc_loss": "1.645e+00", "dlm_acc": "5.227e-01", "anc_acc": "5.032e-01", "epoch": 0.04179} {"step": 20900, "loss": 1.2661, "grad_norm": "3.494e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.118e+00", "anc_loss": "1.220e+00", "dlm_acc": "6.266e-01", "anc_acc": "6.022e-01", "epoch": 0.0418} {"step": 20905, "loss": 0.8947, "grad_norm": "2.134e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.941e-01", "anc_loss": "8.898e-01", "dlm_acc": "6.671e-01", "anc_acc": "6.390e-01", "epoch": 0.04181} {"step": 20910, "loss": 1.2035, "grad_norm": "1.744e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.443e-01", "epoch": 0.04182} {"step": 20915, "loss": 1.1658, "grad_norm": "2.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.263e+00", "dlm_acc": "6.182e-01", "anc_acc": "5.922e-01", "epoch": 0.04183} {"step": 20920, "loss": 1.0291, "grad_norm": "2.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.075e+00", "dlm_acc": "6.865e-01", "anc_acc": "6.734e-01", "epoch": 0.04184} {"step": 20925, "loss": 1.0547, "grad_norm": "3.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.750e-01", "anc_loss": "6.117e-01", "dlm_acc": "8.017e-01", "anc_acc": "7.918e-01", "epoch": 0.04185} {"step": 20930, "loss": 1.1908, "grad_norm": "6.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.417e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.411e-01", "anc_acc": "5.202e-01", "epoch": 0.04186} {"step": 20935, "loss": 1.1046, "grad_norm": "2.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.426e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.149e-01", "anc_acc": "4.909e-01", "epoch": 0.04187} {"step": 20940, "loss": 1.3885, "grad_norm": "3.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.271e+00", "dlm_acc": "6.050e-01", "anc_acc": "5.809e-01", "epoch": 0.04188} {"step": 20945, "loss": 1.378, "grad_norm": "4.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.745e+00", "anc_loss": "1.828e+00", "dlm_acc": "4.426e-01", "anc_acc": "4.250e-01", "epoch": 0.04189} {"step": 20950, "loss": 1.4557, "grad_norm": "3.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.664e+00", "anc_loss": "1.759e+00", "dlm_acc": "4.964e-01", "anc_acc": "4.769e-01", "epoch": 0.0419} {"step": 20955, "loss": 1.0901, "grad_norm": "4.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.321e+00", "dlm_acc": "5.408e-01", "anc_acc": "5.189e-01", "epoch": 0.04191} {"step": 20960, "loss": 1.1679, "grad_norm": "5.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.331e+00", "dlm_acc": "3.403e-01", "anc_acc": "3.383e-01", "epoch": 0.04192} {"step": 20965, "loss": 0.9864, "grad_norm": "2.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.953e-01", "anc_loss": "1.000e+00", "dlm_acc": "3.365e-01", "anc_acc": "3.352e-01", "epoch": 0.04193} {"step": 20970, "loss": 0.7695, "grad_norm": "2.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.484e-01", "anc_loss": "9.531e-01", "dlm_acc": "3.452e-01", "anc_acc": "3.436e-01", "epoch": 0.04194} {"step": 20975, "loss": 0.9644, "grad_norm": "3.125e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.081e+00", "dlm_acc": "3.415e-01", "anc_acc": "3.388e-01", "epoch": 0.04195} {"step": 20980, "loss": 0.887, "grad_norm": "1.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.602e-01", "anc_loss": "1.008e+00", "dlm_acc": "4.931e-01", "anc_acc": "4.779e-01", "epoch": 0.04196} {"step": 20985, "loss": 1.4737, "grad_norm": "5.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.602e+00", "dlm_acc": "5.321e-01", "anc_acc": "5.072e-01", "epoch": 0.04197} {"step": 20990, "loss": 0.9802, "grad_norm": "3.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.111e+00", "dlm_acc": "5.966e-01", "anc_acc": "5.749e-01", "epoch": 0.04198} {"step": 20995, "loss": 1.2521, "grad_norm": "4.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.198e+00", "dlm_acc": "6.062e-01", "anc_acc": "5.853e-01", "epoch": 0.04199} {"step": 21000, "loss": 1.4099, "grad_norm": "5.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.611e+00", "anc_loss": "1.667e+00", "dlm_acc": "4.200e-01", "anc_acc": "4.056e-01", "epoch": 0.042} {"step": 21005, "loss": 1.3642, "grad_norm": "3.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.579e+00", "anc_loss": "1.673e+00", "dlm_acc": "5.083e-01", "anc_acc": "4.876e-01", "epoch": 0.04201} {"step": 21010, "loss": 1.5656, "grad_norm": "5.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.522e+00", "dlm_acc": "5.599e-01", "anc_acc": "5.403e-01", "epoch": 0.04202} {"step": 21015, "loss": 1.6831, "grad_norm": "8.900e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.519e-01", "anc_acc": "5.307e-01", "epoch": 0.04203} {"step": 21020, "loss": 1.3456, "grad_norm": "4.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.404e-01", "anc_acc": "5.221e-01", "epoch": 0.04204} {"step": 21025, "loss": 1.0813, "grad_norm": "3.899e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.442e-01", "anc_acc": "5.226e-01", "epoch": 0.04205} {"step": 21030, "loss": 1.2211, "grad_norm": "3.731e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.472e+00", "anc_loss": "1.584e+00", "dlm_acc": "5.247e-01", "anc_acc": "5.019e-01", "epoch": 0.04206} {"step": 21035, "loss": 1.276, "grad_norm": "4.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.587e+00", "dlm_acc": "5.310e-01", "anc_acc": "4.932e-01", "epoch": 0.04207} {"step": 21040, "loss": 1.3543, "grad_norm": "1.984e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.437e+00", "dlm_acc": "5.923e-01", "anc_acc": "5.670e-01", "epoch": 0.04208} {"step": 21045, "loss": 0.8436, "grad_norm": "4.358e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.266e-01", "anc_loss": "1.016e+00", "dlm_acc": "6.106e-01", "anc_acc": "5.849e-01", "epoch": 0.04209} {"step": 21050, "loss": 1.1155, "grad_norm": "2.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.515e+00", "anc_loss": "1.606e+00", "dlm_acc": "4.276e-01", "anc_acc": "4.070e-01", "epoch": 0.0421} {"step": 21055, "loss": 1.2268, "grad_norm": "4.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.518e+00", "anc_loss": "1.598e+00", "dlm_acc": "5.064e-01", "anc_acc": "4.877e-01", "epoch": 0.04211} {"step": 21060, "loss": 1.1774, "grad_norm": "3.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.203e-01", "anc_loss": "8.602e-01", "dlm_acc": "4.869e-01", "anc_acc": "4.653e-01", "epoch": 0.04212} {"step": 21065, "loss": 0.8852, "grad_norm": "5.193e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.375e-01", "anc_loss": "7.531e-01", "dlm_acc": "4.978e-01", "anc_acc": "4.911e-01", "epoch": 0.04213} {"step": 21070, "loss": 0.9383, "grad_norm": "5.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.797e-01", "anc_loss": "6.922e-01", "dlm_acc": "5.121e-01", "anc_acc": "5.052e-01", "epoch": 0.04214} {"step": 21075, "loss": 0.9378, "grad_norm": "3.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.508e-01", "anc_loss": "6.637e-01", "dlm_acc": "5.134e-01", "anc_acc": "5.040e-01", "epoch": 0.04215} {"step": 21080, "loss": 1.1164, "grad_norm": "4.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.664e-01", "anc_loss": "6.828e-01", "dlm_acc": "5.296e-01", "anc_acc": "5.197e-01", "epoch": 0.04216} {"step": 21085, "loss": 1.0649, "grad_norm": "5.696e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.766e-01", "anc_loss": "5.977e-01", "dlm_acc": "6.071e-01", "anc_acc": "5.942e-01", "epoch": 0.04217} {"step": 21090, "loss": 0.7686, "grad_norm": "3.858e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.248e-01", "anc_loss": "8.781e-01", "dlm_acc": "5.921e-01", "anc_acc": "5.740e-01", "epoch": 0.04218} {"step": 21095, "loss": 1.1706, "grad_norm": "4.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.352e-01", "anc_loss": "9.922e-01", "dlm_acc": "6.348e-01", "anc_acc": "6.239e-01", "epoch": 0.04219} {"step": 21100, "loss": 0.7269, "grad_norm": "2.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.463e-01", "anc_loss": "3.998e-01", "dlm_acc": "8.268e-01", "anc_acc": "8.090e-01", "epoch": 0.0422} {"step": 21105, "loss": 1.1227, "grad_norm": "4.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.351e+00", "anc_loss": "1.447e+00", "dlm_acc": "4.799e-01", "anc_acc": "4.617e-01", "epoch": 0.04221} {"step": 21110, "loss": 1.7495, "grad_norm": "4.815e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.591e+00", "anc_loss": "1.698e+00", "dlm_acc": "5.000e-01", "anc_acc": "4.808e-01", "epoch": 0.04222} {"step": 21115, "loss": 1.001, "grad_norm": "2.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.609e-01", "anc_loss": "9.453e-01", "dlm_acc": "6.490e-01", "anc_acc": "6.232e-01", "epoch": 0.04223} {"step": 21120, "loss": 1.6073, "grad_norm": "3.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.464e+00", "anc_loss": "1.581e+00", "dlm_acc": "4.837e-01", "anc_acc": "4.528e-01", "epoch": 0.04224} {"step": 21125, "loss": 1.1642, "grad_norm": "3.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.332e+00", "anc_loss": "1.400e+00", "dlm_acc": "4.761e-01", "anc_acc": "4.505e-01", "epoch": 0.04225} {"step": 21130, "loss": 1.1973, "grad_norm": "4.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.243e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.217e-01", "anc_acc": "4.970e-01", "epoch": 0.04226} {"step": 21135, "loss": 1.3064, "grad_norm": "3.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.153e+00", "dlm_acc": "6.116e-01", "anc_acc": "5.856e-01", "epoch": 0.04227} {"step": 21140, "loss": 1.1914, "grad_norm": "8.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.164e-01", "anc_loss": "1.006e+00", "dlm_acc": "6.216e-01", "anc_acc": "5.897e-01", "epoch": 0.04228} {"step": 21145, "loss": 1.0708, "grad_norm": "1.983e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.226e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.105e-01", "epoch": 0.04229} {"step": 21150, "loss": 1.2097, "grad_norm": "3.719e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.408e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.306e-01", "anc_acc": "5.101e-01", "epoch": 0.0423} {"step": 21155, "loss": 1.2942, "grad_norm": "8.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.465e+00", "anc_loss": "1.551e+00", "dlm_acc": "5.190e-01", "anc_acc": "5.006e-01", "epoch": 0.04231} {"step": 21160, "loss": 1.4047, "grad_norm": "3.173e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.092e+00", "dlm_acc": "5.888e-01", "anc_acc": "5.697e-01", "epoch": 0.04232} {"step": 21165, "loss": 1.5441, "grad_norm": "5.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.251e+00", "anc_loss": "2.289e+00", "dlm_acc": "2.694e-01", "anc_acc": "2.583e-01", "epoch": 0.04233} {"step": 21170, "loss": 1.0433, "grad_norm": "5.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.688e-01", "anc_loss": "8.578e-01", "dlm_acc": "6.719e-01", "anc_acc": "6.448e-01", "epoch": 0.04234} {"step": 21175, "loss": 1.4016, "grad_norm": "1.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.945e+00", "anc_loss": "1.999e+00", "dlm_acc": "3.064e-01", "anc_acc": "2.969e-01", "epoch": 0.04235} {"step": 21180, "loss": 1.3612, "grad_norm": "2.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.149e+00", "anc_loss": "1.243e+00", "dlm_acc": "5.348e-01", "anc_acc": "5.143e-01", "epoch": 0.04236} {"step": 21185, "loss": 1.3528, "grad_norm": "5.444e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.338e+00", "dlm_acc": "5.054e-01", "anc_acc": "4.833e-01", "epoch": 0.04237} {"step": 21190, "loss": 1.4981, "grad_norm": "3.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.464e+00", "anc_loss": "2.498e+00", "dlm_acc": "1.358e-01", "anc_acc": "1.280e-01", "epoch": 0.04238} {"step": 21195, "loss": 1.2874, "grad_norm": "4.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.873e+00", "anc_loss": "1.940e+00", "dlm_acc": "2.809e-01", "anc_acc": "2.720e-01", "epoch": 0.04239} {"step": 21200, "loss": 1.3072, "grad_norm": "2.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.681e+00", "anc_loss": "1.767e+00", "dlm_acc": "4.476e-01", "anc_acc": "4.268e-01", "epoch": 0.0424} {"step": 21205, "loss": 1.2365, "grad_norm": "2.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.735e+00", "anc_loss": "1.775e+00", "dlm_acc": "3.974e-01", "anc_acc": "3.878e-01", "epoch": 0.04241} {"step": 21210, "loss": 1.7459, "grad_norm": "3.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.267e+00", "anc_loss": "2.403e+00", "dlm_acc": "2.646e-01", "anc_acc": "2.429e-01", "epoch": 0.04242} {"step": 21215, "loss": 0.9959, "grad_norm": "3.667e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.084e+00", "dlm_acc": "4.141e-01", "anc_acc": "3.915e-01", "epoch": 0.04243} {"step": 21220, "loss": 1.363, "grad_norm": "2.049e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.662e+00", "dlm_acc": "4.731e-01", "anc_acc": "4.536e-01", "epoch": 0.04244} {"step": 21225, "loss": 0.9834, "grad_norm": "5.149e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.621e-01", "anc_loss": "8.100e-01", "dlm_acc": "6.644e-01", "anc_acc": "6.522e-01", "epoch": 0.04245} {"step": 21230, "loss": 1.0312, "grad_norm": "5.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.471e+00", "anc_loss": "1.585e+00", "dlm_acc": "5.307e-01", "anc_acc": "5.054e-01", "epoch": 0.04246} {"step": 21235, "loss": 1.2962, "grad_norm": "7.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.716e+00", "anc_loss": "1.755e+00", "dlm_acc": "3.459e-01", "anc_acc": "3.324e-01", "epoch": 0.04247} {"step": 21240, "loss": 1.3561, "grad_norm": "5.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.764e+00", "anc_loss": "1.848e+00", "dlm_acc": "3.937e-01", "anc_acc": "3.712e-01", "epoch": 0.04248} {"step": 21245, "loss": 0.8093, "grad_norm": "2.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.428e+00", "anc_loss": "1.591e+00", "dlm_acc": "5.513e-01", "anc_acc": "5.199e-01", "epoch": 0.04249} {"step": 21250, "loss": 0.7078, "grad_norm": "3.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.781e-01", "anc_loss": "9.742e-01", "dlm_acc": "6.295e-01", "anc_acc": "6.039e-01", "epoch": 0.0425} {"step": 21255, "loss": 1.2035, "grad_norm": "6.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.167e+00", "dlm_acc": "5.844e-01", "anc_acc": "5.644e-01", "epoch": 0.04251} {"step": 21260, "loss": 0.8634, "grad_norm": "2.048e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.389e-01", "epoch": 0.04252} {"step": 21265, "loss": 0.9726, "grad_norm": "5.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.878e-01", "anc_acc": "5.627e-01", "epoch": 0.04253} {"step": 21270, "loss": 0.9012, "grad_norm": "3.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.229e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.276e-01", "anc_acc": "5.098e-01", "epoch": 0.04254} {"step": 21275, "loss": 0.535, "grad_norm": "3.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.542e-01", "anc_loss": "9.230e-01", "dlm_acc": "6.639e-01", "anc_acc": "6.420e-01", "epoch": 0.04255} {"step": 21280, "loss": 1.182, "grad_norm": "6.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.487e+00", "dlm_acc": "5.555e-01", "anc_acc": "5.403e-01", "epoch": 0.04256} {"step": 21285, "loss": 0.8966, "grad_norm": "3.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.828e-01", "anc_loss": "9.637e-01", "dlm_acc": "6.296e-01", "anc_acc": "6.067e-01", "epoch": 0.04257} {"step": 21290, "loss": 0.8299, "grad_norm": "1.971e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.650e-01", "anc_acc": "5.424e-01", "epoch": 0.04258} {"step": 21295, "loss": 1.1299, "grad_norm": "2.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.504e+00", "dlm_acc": "5.700e-01", "anc_acc": "5.493e-01", "epoch": 0.04259} {"step": 21300, "loss": 1.0035, "grad_norm": "3.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.618e-01", "anc_acc": "5.418e-01", "epoch": 0.0426} {"step": 21305, "loss": 1.2867, "grad_norm": "5.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.903e+00", "anc_loss": "2.011e+00", "dlm_acc": "4.228e-01", "anc_acc": "4.040e-01", "epoch": 0.04261} {"step": 21310, "loss": 1.3143, "grad_norm": "2.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.186e+00", "dlm_acc": "6.421e-01", "anc_acc": "6.218e-01", "epoch": 0.04262} {"step": 21315, "loss": 1.2531, "grad_norm": "2.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.210e-01", "anc_acc": "4.991e-01", "epoch": 0.04263} {"step": 21320, "loss": 1.2669, "grad_norm": "6.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.002e+00", "anc_loss": "2.065e+00", "dlm_acc": "3.529e-01", "anc_acc": "3.407e-01", "epoch": 0.04264} {"step": 21325, "loss": 0.9697, "grad_norm": "2.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.720e+00", "dlm_acc": "5.051e-01", "anc_acc": "4.816e-01", "epoch": 0.04265} {"step": 21330, "loss": 0.6528, "grad_norm": "7.160e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.500e-01", "anc_loss": "9.223e-01", "dlm_acc": "6.612e-01", "anc_acc": "6.418e-01", "epoch": 0.04266} {"step": 21335, "loss": 0.8672, "grad_norm": "5.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.000e+00", "anc_loss": "1.098e+00", "dlm_acc": "6.521e-01", "anc_acc": "6.292e-01", "epoch": 0.04267} {"step": 21340, "loss": 1.7568, "grad_norm": "7.274e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.028e+00", "anc_loss": "2.189e+00", "dlm_acc": "3.909e-01", "anc_acc": "3.711e-01", "epoch": 0.04268} {"step": 21345, "loss": 1.2691, "grad_norm": "6.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.819e+00", "anc_loss": "2.002e+00", "dlm_acc": "3.895e-01", "anc_acc": "3.647e-01", "epoch": 0.04269} {"step": 21350, "loss": 1.3317, "grad_norm": "4.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.025e+00", "anc_loss": "2.138e+00", "dlm_acc": "2.854e-01", "anc_acc": "2.648e-01", "epoch": 0.0427} {"step": 21355, "loss": 1.2848, "grad_norm": "5.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.386e+00", "anc_loss": "2.444e+00", "dlm_acc": "1.938e-01", "anc_acc": "1.860e-01", "epoch": 0.04271} {"step": 21360, "loss": 0.957, "grad_norm": "2.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.111e+00", "dlm_acc": "3.776e-01", "anc_acc": "3.729e-01", "epoch": 0.04272} {"step": 21365, "loss": 0.9286, "grad_norm": "1.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.088e+00", "dlm_acc": "5.068e-01", "anc_acc": "4.898e-01", "epoch": 0.04273} {"step": 21370, "loss": 1.0272, "grad_norm": "2.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.211e-01", "anc_loss": "1.002e+00", "dlm_acc": "6.326e-01", "anc_acc": "6.112e-01", "epoch": 0.04274} {"step": 21375, "loss": 0.9979, "grad_norm": "3.385e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.345e-01", "anc_acc": "5.141e-01", "epoch": 0.04275} {"step": 21380, "loss": 0.9236, "grad_norm": "3.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.277e-01", "anc_loss": "9.947e-01", "dlm_acc": "6.565e-01", "anc_acc": "6.413e-01", "epoch": 0.04276} {"step": 21385, "loss": 0.9791, "grad_norm": "2.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.166e+00", "dlm_acc": "5.730e-01", "anc_acc": "5.523e-01", "epoch": 0.04277} {"step": 21390, "loss": 1.2217, "grad_norm": "4.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.828e-01", "anc_loss": "8.984e-01", "dlm_acc": "5.471e-01", "anc_acc": "5.444e-01", "epoch": 0.04278} {"step": 21395, "loss": 1.2164, "grad_norm": "3.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.047e-01", "anc_loss": "9.801e-01", "dlm_acc": "6.494e-01", "anc_acc": "6.355e-01", "epoch": 0.04279} {"step": 21400, "loss": 1.106, "grad_norm": "3.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.220e+00", "dlm_acc": "5.880e-01", "anc_acc": "5.675e-01", "epoch": 0.0428} {"step": 21405, "loss": 1.0512, "grad_norm": "4.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.648e-01", "anc_loss": "6.977e-01", "dlm_acc": "6.437e-01", "anc_acc": "6.367e-01", "epoch": 0.04281} {"step": 21410, "loss": 1.194, "grad_norm": "3.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.141e-01", "anc_loss": "9.805e-01", "dlm_acc": "6.644e-01", "anc_acc": "6.488e-01", "epoch": 0.04282} {"step": 21415, "loss": 1.3075, "grad_norm": "2.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.539e+00", "anc_loss": "1.663e+00", "dlm_acc": "5.449e-01", "anc_acc": "5.198e-01", "epoch": 0.04283} {"step": 21420, "loss": 0.9881, "grad_norm": "2.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.708e-01", "anc_acc": "5.571e-01", "epoch": 0.04284} {"step": 21425, "loss": 0.8357, "grad_norm": "6.875e-02", "learning_rate": "1.000e-04", "dlm_loss": "7.164e-01", "anc_loss": "7.430e-01", "dlm_acc": "5.814e-01", "anc_acc": "5.724e-01", "epoch": 0.04285} {"step": 21430, "loss": 1.2278, "grad_norm": "3.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.362e+00", "dlm_acc": "4.942e-01", "anc_acc": "4.828e-01", "epoch": 0.04286} {"step": 21435, "loss": 0.8217, "grad_norm": "1.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.484e-01", "anc_loss": "9.797e-01", "dlm_acc": "4.291e-01", "anc_acc": "4.224e-01", "epoch": 0.04287} {"step": 21440, "loss": 1.3277, "grad_norm": "5.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.208e+00", "dlm_acc": "5.675e-01", "anc_acc": "5.471e-01", "epoch": 0.04288} {"step": 21445, "loss": 1.2885, "grad_norm": "3.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.436e+00", "dlm_acc": "5.485e-01", "anc_acc": "5.222e-01", "epoch": 0.04289} {"step": 21450, "loss": 0.9036, "grad_norm": "3.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.215e+00", "dlm_acc": "3.053e-01", "anc_acc": "2.980e-01", "epoch": 0.0429} {"step": 21455, "loss": 1.1451, "grad_norm": "8.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.898e-01", "anc_loss": "8.273e-01", "dlm_acc": "5.747e-01", "anc_acc": "5.634e-01", "epoch": 0.04291} {"step": 21460, "loss": 0.7398, "grad_norm": "3.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.609e-01", "anc_loss": "5.641e-01", "dlm_acc": "5.819e-01", "anc_acc": "5.808e-01", "epoch": 0.04292} {"step": 21465, "loss": 1.1156, "grad_norm": "6.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.062e-01", "anc_loss": "9.828e-01", "dlm_acc": "5.658e-01", "anc_acc": "5.474e-01", "epoch": 0.04293} {"step": 21470, "loss": 1.5302, "grad_norm": "2.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.438e+00", "dlm_acc": "6.016e-01", "anc_acc": "5.689e-01", "epoch": 0.04294} {"step": 21475, "loss": 1.1378, "grad_norm": "3.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.941e-01", "anc_loss": "9.480e-01", "dlm_acc": "5.997e-01", "anc_acc": "5.800e-01", "epoch": 0.04295} {"step": 21480, "loss": 1.1136, "grad_norm": "5.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.465e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.640e-01", "anc_acc": "6.444e-01", "epoch": 0.04296} {"step": 21485, "loss": 1.1459, "grad_norm": "4.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.702e-02", "anc_loss": "1.057e-01", "dlm_acc": "9.315e-01", "anc_acc": "9.291e-01", "epoch": 0.04297} {"step": 21490, "loss": 0.9996, "grad_norm": "1.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.424e-01", "anc_loss": "1.538e-01", "dlm_acc": "8.927e-01", "anc_acc": "8.904e-01", "epoch": 0.04298} {"step": 21495, "loss": 0.762, "grad_norm": "5.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.568e-01", "anc_loss": "1.680e-01", "dlm_acc": "8.812e-01", "anc_acc": "8.762e-01", "epoch": 0.04299} {"step": 21500, "loss": 0.9881, "grad_norm": "3.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e-01", "anc_loss": "1.593e-01", "dlm_acc": "9.014e-01", "anc_acc": "8.952e-01", "epoch": 0.043} {"step": 21505, "loss": 0.4708, "grad_norm": "2.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.125e-02", "anc_loss": "6.807e-02", "dlm_acc": "9.455e-01", "anc_acc": "9.425e-01", "epoch": 0.04301} {"step": 21510, "loss": 0.6292, "grad_norm": "2.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.510e-02", "anc_loss": "8.826e-02", "dlm_acc": "9.346e-01", "anc_acc": "9.290e-01", "epoch": 0.04302} {"step": 21515, "loss": 0.7328, "grad_norm": "1.733e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.259e-01", "anc_loss": "7.560e-01", "dlm_acc": "6.480e-01", "anc_acc": "6.431e-01", "epoch": 0.04303} {"step": 21520, "loss": 0.7367, "grad_norm": "2.905e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.891e-01", "anc_loss": "5.925e-01", "dlm_acc": "6.258e-01", "anc_acc": "6.241e-01", "epoch": 0.04304} {"step": 21525, "loss": 0.7652, "grad_norm": "3.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.977e-01", "anc_loss": "9.977e-01", "dlm_acc": "6.806e-01", "anc_acc": "6.561e-01", "epoch": 0.04305} {"step": 21530, "loss": 0.9322, "grad_norm": "3.748e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.103e+00", "dlm_acc": "6.204e-01", "anc_acc": "5.976e-01", "epoch": 0.04306} {"step": 21535, "loss": 1.2656, "grad_norm": "5.315e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.221e+00", "dlm_acc": "5.851e-01", "anc_acc": "5.650e-01", "epoch": 0.04307} {"step": 21540, "loss": 1.3824, "grad_norm": "3.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.132e+00", "dlm_acc": "5.798e-01", "anc_acc": "5.603e-01", "epoch": 0.04308} {"step": 21545, "loss": 1.1143, "grad_norm": "4.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.850e-01", "anc_acc": "5.631e-01", "epoch": 0.04309} {"step": 21550, "loss": 1.4185, "grad_norm": "3.676e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.400e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.498e-01", "anc_acc": "5.274e-01", "epoch": 0.0431} {"step": 21555, "loss": 1.2307, "grad_norm": "4.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.089e+00", "dlm_acc": "5.177e-01", "anc_acc": "4.934e-01", "epoch": 0.04311} {"step": 21560, "loss": 1.454, "grad_norm": "3.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.152e-01", "anc_loss": "8.645e-01", "dlm_acc": "5.825e-01", "anc_acc": "5.685e-01", "epoch": 0.04312} {"step": 21565, "loss": 1.9083, "grad_norm": "5.560e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.529e+00", "dlm_acc": "4.127e-01", "anc_acc": "4.011e-01", "epoch": 0.04313} {"step": 21570, "loss": 1.1515, "grad_norm": "4.038e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.656e-01", "anc_loss": "9.742e-01", "dlm_acc": "6.618e-01", "anc_acc": "6.297e-01", "epoch": 0.04314} {"step": 21575, "loss": 0.9893, "grad_norm": "3.694e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.110e+00", "dlm_acc": "6.237e-01", "anc_acc": "6.024e-01", "epoch": 0.04315} {"step": 21580, "loss": 1.2257, "grad_norm": "5.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.812e-01", "anc_loss": "1.097e+00", "dlm_acc": "6.424e-01", "anc_acc": "6.155e-01", "epoch": 0.04316} {"step": 21585, "loss": 1.1497, "grad_norm": "3.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.225e+00", "dlm_acc": "6.003e-01", "anc_acc": "5.820e-01", "epoch": 0.04317} {"step": 21590, "loss": 1.481, "grad_norm": "7.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.517e+00", "anc_loss": "1.586e+00", "dlm_acc": "3.803e-01", "anc_acc": "3.663e-01", "epoch": 0.04318} {"step": 21595, "loss": 1.3061, "grad_norm": "3.388e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.905e+00", "anc_loss": "1.970e+00", "dlm_acc": "3.001e-01", "anc_acc": "2.880e-01", "epoch": 0.04319} {"step": 21600, "loss": 1.0787, "grad_norm": "3.183e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.711e-01", "anc_loss": "8.203e-01", "dlm_acc": "6.659e-01", "anc_acc": "6.529e-01", "epoch": 0.0432} {"step": 21605, "loss": 1.0399, "grad_norm": "4.220e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.703e-01", "anc_loss": "7.086e-01", "dlm_acc": "6.160e-01", "anc_acc": "6.032e-01", "epoch": 0.04321} {"step": 21610, "loss": 1.1269, "grad_norm": "4.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.188e-01", "anc_loss": "7.023e-01", "dlm_acc": "6.310e-01", "anc_acc": "6.075e-01", "epoch": 0.04322} {"step": 21615, "loss": 0.8793, "grad_norm": "3.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.348e-01", "anc_loss": "8.121e-01", "dlm_acc": "6.547e-01", "anc_acc": "6.266e-01", "epoch": 0.04323} {"step": 21620, "loss": 1.4478, "grad_norm": "4.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.481e+00", "anc_loss": "1.558e+00", "dlm_acc": "4.729e-01", "anc_acc": "4.530e-01", "epoch": 0.04324} {"step": 21625, "loss": 1.5897, "grad_norm": "3.156e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.552e+00", "anc_loss": "1.684e+00", "dlm_acc": "5.069e-01", "anc_acc": "4.738e-01", "epoch": 0.04325} {"step": 21630, "loss": 1.3503, "grad_norm": "3.725e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.715e-01", "anc_acc": "5.469e-01", "epoch": 0.04326} {"step": 21635, "loss": 1.3608, "grad_norm": "2.737e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.189e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.512e-01", "epoch": 0.04327} {"step": 21640, "loss": 0.8905, "grad_norm": "6.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.111e-01", "anc_loss": "6.004e-01", "dlm_acc": "7.789e-01", "anc_acc": "7.460e-01", "epoch": 0.04328} {"step": 21645, "loss": 1.3862, "grad_norm": "7.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.610e-01", "anc_acc": "5.408e-01", "epoch": 0.04329} {"step": 21650, "loss": 1.3677, "grad_norm": "3.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.021e-01", "anc_acc": "4.705e-01", "epoch": 0.0433} {"step": 21655, "loss": 1.1646, "grad_norm": "3.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.586e-01", "anc_loss": "9.328e-01", "dlm_acc": "6.279e-01", "anc_acc": "6.023e-01", "epoch": 0.04331} {"step": 21660, "loss": 1.3333, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.867e-01", "anc_loss": "1.006e+00", "dlm_acc": "5.891e-01", "anc_acc": "5.471e-01", "epoch": 0.04332} {"step": 21665, "loss": 1.5851, "grad_norm": "3.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.953e-01", "anc_loss": "9.336e-01", "dlm_acc": "5.229e-01", "anc_acc": "5.101e-01", "epoch": 0.04333} {"step": 21670, "loss": 1.1754, "grad_norm": "5.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.711e-01", "anc_loss": "6.281e-01", "dlm_acc": "6.201e-01", "anc_acc": "5.852e-01", "epoch": 0.04334} {"step": 21675, "loss": 0.704, "grad_norm": "2.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.934e-01", "anc_loss": "5.035e-01", "dlm_acc": "5.937e-01", "anc_acc": "5.895e-01", "epoch": 0.04335} {"step": 21680, "loss": 0.8454, "grad_norm": "4.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.383e-01", "anc_loss": "4.203e-01", "dlm_acc": "7.484e-01", "anc_acc": "6.955e-01", "epoch": 0.04336} {"step": 21685, "loss": 0.9743, "grad_norm": "8.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.082e-01", "anc_loss": "3.885e-01", "dlm_acc": "7.926e-01", "anc_acc": "7.407e-01", "epoch": 0.04337} {"step": 21690, "loss": 0.7452, "grad_norm": "3.877e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.977e-01", "anc_loss": "4.221e-01", "dlm_acc": "6.698e-01", "anc_acc": "6.504e-01", "epoch": 0.04338} {"step": 21695, "loss": 1.0881, "grad_norm": "6.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.164e-01", "anc_loss": "5.752e-01", "dlm_acc": "7.975e-01", "anc_acc": "7.689e-01", "epoch": 0.04339} {"step": 21700, "loss": 1.1484, "grad_norm": "2.953e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.133e-01", "epoch": 0.0434} {"step": 21705, "loss": 1.2858, "grad_norm": "2.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.493e+00", "dlm_acc": "4.611e-01", "anc_acc": "4.382e-01", "epoch": 0.04341} {"step": 21710, "loss": 1.3663, "grad_norm": "3.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.347e+00", "dlm_acc": "5.629e-01", "anc_acc": "5.303e-01", "epoch": 0.04342} {"step": 21715, "loss": 1.2053, "grad_norm": "3.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.853e-01", "anc_acc": "5.586e-01", "epoch": 0.04343} {"step": 21720, "loss": 1.416, "grad_norm": "5.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.410e-01", "anc_loss": "9.305e-01", "dlm_acc": "6.808e-01", "anc_acc": "6.587e-01", "epoch": 0.04344} {"step": 21725, "loss": 1.6575, "grad_norm": "3.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.428e+00", "anc_loss": "1.529e+00", "dlm_acc": "5.025e-01", "anc_acc": "4.855e-01", "epoch": 0.04345} {"step": 21730, "loss": 1.4277, "grad_norm": "3.003e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.853e+00", "anc_loss": "1.911e+00", "dlm_acc": "3.236e-01", "anc_acc": "3.108e-01", "epoch": 0.04346} {"step": 21735, "loss": 1.5199, "grad_norm": "5.494e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.459e+00", "anc_loss": "1.625e+00", "dlm_acc": "5.232e-01", "anc_acc": "4.925e-01", "epoch": 0.04347} {"step": 21740, "loss": 1.1209, "grad_norm": "3.877e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.096e+00", "dlm_acc": "5.527e-01", "anc_acc": "5.396e-01", "epoch": 0.04348} {"step": 21745, "loss": 1.4802, "grad_norm": "9.928e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.372e-01", "epoch": 0.04349} {"step": 21750, "loss": 0.9404, "grad_norm": "3.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.841e-01", "anc_loss": "4.267e-01", "dlm_acc": "8.071e-01", "anc_acc": "7.894e-01", "epoch": 0.0435} {"step": 21755, "loss": 1.4656, "grad_norm": "3.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.217e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.663e-01", "anc_acc": "5.380e-01", "epoch": 0.04351} {"step": 21760, "loss": 1.2302, "grad_norm": "3.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.063e-01", "anc_loss": "8.648e-01", "dlm_acc": "7.184e-01", "anc_acc": "7.059e-01", "epoch": 0.04352} {"step": 21765, "loss": 1.0103, "grad_norm": "2.731e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.437e-01", "anc_loss": "3.036e-01", "dlm_acc": "8.945e-01", "anc_acc": "8.773e-01", "epoch": 0.04353} {"step": 21770, "loss": 1.1497, "grad_norm": "2.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.502e-01", "anc_loss": "9.400e-01", "dlm_acc": "6.499e-01", "anc_acc": "6.241e-01", "epoch": 0.04354} {"step": 21775, "loss": 1.4267, "grad_norm": "8.059e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.089e+00", "anc_loss": "1.193e+00", "dlm_acc": "5.758e-01", "anc_acc": "5.505e-01", "epoch": 0.04355} {"step": 21780, "loss": 1.3815, "grad_norm": "4.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.010e+00", "anc_loss": "1.104e+00", "dlm_acc": "6.312e-01", "anc_acc": "6.068e-01", "epoch": 0.04356} {"step": 21785, "loss": 1.2067, "grad_norm": "7.281e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.186e-01", "anc_acc": "4.951e-01", "epoch": 0.04357} {"step": 21790, "loss": 1.2811, "grad_norm": "3.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.481e+00", "anc_loss": "1.555e+00", "dlm_acc": "4.691e-01", "anc_acc": "4.520e-01", "epoch": 0.04358} {"step": 21795, "loss": 1.7417, "grad_norm": "2.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.156e+00", "anc_loss": "2.233e+00", "dlm_acc": "3.245e-01", "anc_acc": "3.107e-01", "epoch": 0.04359} {"step": 21800, "loss": 1.5294, "grad_norm": "3.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.269e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.757e-01", "anc_acc": "5.579e-01", "epoch": 0.0436} {"step": 21805, "loss": 1.5054, "grad_norm": "4.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.829e-01", "anc_acc": "5.585e-01", "epoch": 0.04361} {"step": 21810, "loss": 1.5021, "grad_norm": "3.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.251e+00", "anc_loss": "1.332e+00", "dlm_acc": "5.881e-01", "anc_acc": "5.671e-01", "epoch": 0.04362} {"step": 21815, "loss": 1.4886, "grad_norm": "4.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.870e-01", "anc_acc": "5.651e-01", "epoch": 0.04363} {"step": 21820, "loss": 1.3212, "grad_norm": "2.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.727e-01", "anc_loss": "1.068e+00", "dlm_acc": "6.257e-01", "anc_acc": "6.015e-01", "epoch": 0.04364} {"step": 21825, "loss": 1.2234, "grad_norm": "2.531e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.037e-01", "anc_acc": "5.802e-01", "epoch": 0.04365} {"step": 21830, "loss": 1.238, "grad_norm": "5.109e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.411e+00", "dlm_acc": "5.498e-01", "anc_acc": "5.261e-01", "epoch": 0.04366} {"step": 21835, "loss": 1.1354, "grad_norm": "3.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.131e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.783e-01", "epoch": 0.04367} {"step": 21840, "loss": 1.1681, "grad_norm": "3.167e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.448e+00", "anc_loss": "1.558e+00", "dlm_acc": "5.465e-01", "anc_acc": "5.240e-01", "epoch": 0.04368} {"step": 21845, "loss": 1.1268, "grad_norm": "4.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.446e-01", "anc_acc": "5.252e-01", "epoch": 0.04369} {"step": 21850, "loss": 1.3672, "grad_norm": "4.333e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.795e+00", "anc_loss": "1.908e+00", "dlm_acc": "4.693e-01", "anc_acc": "4.469e-01", "epoch": 0.0437} {"step": 21855, "loss": 1.2655, "grad_norm": "5.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.431e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.199e-01", "anc_acc": "4.971e-01", "epoch": 0.04371} {"step": 21860, "loss": 1.4553, "grad_norm": "5.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.605e+00", "anc_loss": "1.698e+00", "dlm_acc": "5.051e-01", "anc_acc": "4.884e-01", "epoch": 0.04372} {"step": 21865, "loss": 1.1101, "grad_norm": "2.813e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.216e+00", "dlm_acc": "5.929e-01", "anc_acc": "5.730e-01", "epoch": 0.04373} {"step": 21870, "loss": 1.3827, "grad_norm": "3.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.429e+00", "anc_loss": "1.534e+00", "dlm_acc": "5.301e-01", "anc_acc": "5.052e-01", "epoch": 0.04374} {"step": 21875, "loss": 1.2195, "grad_norm": "2.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.363e+00", "dlm_acc": "4.626e-01", "anc_acc": "4.264e-01", "epoch": 0.04375} {"step": 21880, "loss": 1.3453, "grad_norm": "4.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.214e+00", "dlm_acc": "5.744e-01", "anc_acc": "5.523e-01", "epoch": 0.04376} {"step": 21885, "loss": 1.373, "grad_norm": "3.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.816e-01", "anc_loss": "7.020e-01", "dlm_acc": "5.448e-01", "anc_acc": "5.327e-01", "epoch": 0.04377} {"step": 21890, "loss": 1.5665, "grad_norm": "2.943e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.418e-01", "anc_loss": "6.586e-01", "dlm_acc": "5.736e-01", "anc_acc": "5.663e-01", "epoch": 0.04378} {"step": 21895, "loss": 1.0491, "grad_norm": "3.874e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.805e-01", "anc_loss": "5.980e-01", "dlm_acc": "5.733e-01", "anc_acc": "5.635e-01", "epoch": 0.04379} {"step": 21900, "loss": 1.198, "grad_norm": "4.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.395e-01", "anc_loss": "6.621e-01", "dlm_acc": "5.754e-01", "anc_acc": "5.645e-01", "epoch": 0.0438} {"step": 21905, "loss": 1.0215, "grad_norm": "2.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.340e-01", "anc_loss": "5.504e-01", "dlm_acc": "5.931e-01", "anc_acc": "5.844e-01", "epoch": 0.04381} {"step": 21910, "loss": 1.1979, "grad_norm": "5.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.523e-01", "anc_loss": "8.957e-01", "dlm_acc": "5.644e-01", "anc_acc": "5.541e-01", "epoch": 0.04382} {"step": 21915, "loss": 1.1926, "grad_norm": "6.717e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.249e+00", "dlm_acc": "5.957e-01", "anc_acc": "5.721e-01", "epoch": 0.04383} {"step": 21920, "loss": 1.3994, "grad_norm": "4.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.634e+00", "anc_loss": "1.745e+00", "dlm_acc": "4.700e-01", "anc_acc": "4.517e-01", "epoch": 0.04384} {"step": 21925, "loss": 1.1675, "grad_norm": "4.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.207e+00", "dlm_acc": "5.734e-01", "anc_acc": "5.393e-01", "epoch": 0.04385} {"step": 21930, "loss": 1.3671, "grad_norm": "4.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.177e+00", "dlm_acc": "5.517e-01", "anc_acc": "5.206e-01", "epoch": 0.04386} {"step": 21935, "loss": 1.5209, "grad_norm": "3.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.239e+00", "dlm_acc": "5.837e-01", "anc_acc": "5.482e-01", "epoch": 0.04387} {"step": 21940, "loss": 1.3443, "grad_norm": "3.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.625e-01", "anc_loss": "1.007e+00", "dlm_acc": "5.408e-01", "anc_acc": "5.310e-01", "epoch": 0.04388} {"step": 21945, "loss": 1.381, "grad_norm": "4.915e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.536e+00", "dlm_acc": "4.928e-01", "anc_acc": "4.656e-01", "epoch": 0.04389} {"step": 21950, "loss": 1.7932, "grad_norm": "3.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.501e+00", "anc_loss": "1.584e+00", "dlm_acc": "4.929e-01", "anc_acc": "4.753e-01", "epoch": 0.0439} {"step": 21955, "loss": 1.6368, "grad_norm": "5.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.656e-01", "anc_loss": "1.046e+00", "dlm_acc": "6.114e-01", "anc_acc": "5.900e-01", "epoch": 0.04391} {"step": 21960, "loss": 1.7558, "grad_norm": "2.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.044e+00", "anc_loss": "2.142e+00", "dlm_acc": "3.232e-01", "anc_acc": "2.971e-01", "epoch": 0.04392} {"step": 21965, "loss": 1.1339, "grad_norm": "2.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.533e-01", "anc_acc": "5.053e-01", "epoch": 0.04393} {"step": 21970, "loss": 1.4585, "grad_norm": "4.909e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.536e+00", "dlm_acc": "5.232e-01", "anc_acc": "4.958e-01", "epoch": 0.04394} {"step": 21975, "loss": 1.3052, "grad_norm": "3.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.281e+00", "dlm_acc": "5.463e-01", "anc_acc": "5.198e-01", "epoch": 0.04395} {"step": 21980, "loss": 1.1605, "grad_norm": "6.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.578e-01", "anc_loss": "8.844e-01", "dlm_acc": "4.436e-01", "anc_acc": "4.300e-01", "epoch": 0.04396} {"step": 21985, "loss": 0.9992, "grad_norm": "6.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.013e+00", "anc_loss": "1.097e+00", "dlm_acc": "5.637e-01", "anc_acc": "5.369e-01", "epoch": 0.04397} {"step": 21990, "loss": 1.5983, "grad_norm": "4.050e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.667e+00", "dlm_acc": "4.961e-01", "anc_acc": "4.670e-01", "epoch": 0.04398} {"step": 21995, "loss": 1.3937, "grad_norm": "1.578e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.396e+00", "dlm_acc": "5.736e-01", "anc_acc": "5.485e-01", "epoch": 0.04399} {"step": 22000, "loss": 1.7548, "grad_norm": "5.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.944e+00", "anc_loss": "2.043e+00", "dlm_acc": "3.879e-01", "anc_acc": "3.653e-01", "epoch": 0.044} {"step": 22005, "loss": 1.0299, "grad_norm": "3.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.711e-01", "anc_loss": "8.434e-01", "dlm_acc": "6.419e-01", "anc_acc": "6.140e-01", "epoch": 0.04401} {"step": 22010, "loss": 1.4868, "grad_norm": "2.951e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.409e+00", "dlm_acc": "4.744e-01", "anc_acc": "4.540e-01", "epoch": 0.04402} {"step": 22015, "loss": 1.6573, "grad_norm": "5.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.664e+00", "anc_loss": "1.775e+00", "dlm_acc": "4.894e-01", "anc_acc": "4.660e-01", "epoch": 0.04403} {"step": 22020, "loss": 1.151, "grad_norm": "3.481e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.098e+00", "dlm_acc": "5.502e-01", "anc_acc": "5.234e-01", "epoch": 0.04404} {"step": 22025, "loss": 1.3877, "grad_norm": "3.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.574e+00", "anc_loss": "1.672e+00", "dlm_acc": "4.292e-01", "anc_acc": "4.050e-01", "epoch": 0.04405} {"step": 22030, "loss": 1.3347, "grad_norm": "4.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.094e-01", "anc_loss": "8.680e-01", "dlm_acc": "5.959e-01", "anc_acc": "5.710e-01", "epoch": 0.04406} {"step": 22035, "loss": 1.1172, "grad_norm": "2.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.256e+00", "dlm_acc": "5.904e-01", "anc_acc": "5.669e-01", "epoch": 0.04407} {"step": 22040, "loss": 1.2173, "grad_norm": "2.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.210e+00", "dlm_acc": "5.797e-01", "anc_acc": "5.524e-01", "epoch": 0.04408} {"step": 22045, "loss": 1.1033, "grad_norm": "3.537e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.688e-01", "anc_loss": "9.113e-01", "dlm_acc": "6.252e-01", "anc_acc": "6.088e-01", "epoch": 0.04409} {"step": 22050, "loss": 1.1836, "grad_norm": "2.986e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.090e+00", "anc_loss": "1.228e+00", "dlm_acc": "6.025e-01", "anc_acc": "5.665e-01", "epoch": 0.0441} {"step": 22055, "loss": 1.0226, "grad_norm": "3.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.797e-01", "anc_loss": "7.566e-01", "dlm_acc": "7.150e-01", "anc_acc": "6.904e-01", "epoch": 0.04411} {"step": 22060, "loss": 1.4924, "grad_norm": "4.752e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.691e+00", "anc_loss": "1.816e+00", "dlm_acc": "5.132e-01", "anc_acc": "4.929e-01", "epoch": 0.04412} {"step": 22065, "loss": 1.52, "grad_norm": "4.601e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.545e+00", "dlm_acc": "4.861e-01", "anc_acc": "4.665e-01", "epoch": 0.04413} {"step": 22070, "loss": 1.2532, "grad_norm": "3.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.006e+00", "anc_loss": "1.120e+00", "dlm_acc": "6.098e-01", "anc_acc": "5.810e-01", "epoch": 0.04414} {"step": 22075, "loss": 1.1362, "grad_norm": "3.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.035e-01", "anc_loss": "9.492e-01", "dlm_acc": "6.226e-01", "anc_acc": "6.108e-01", "epoch": 0.04415} {"step": 22080, "loss": 1.1387, "grad_norm": "3.531e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.316e-01", "anc_loss": "8.180e-01", "dlm_acc": "7.151e-01", "anc_acc": "6.944e-01", "epoch": 0.04416} {"step": 22085, "loss": 1.042, "grad_norm": "5.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.947e-01", "anc_loss": "1.076e+00", "dlm_acc": "6.863e-01", "anc_acc": "6.685e-01", "epoch": 0.04417} {"step": 22090, "loss": 1.1311, "grad_norm": "5.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.961e-01", "anc_loss": "1.074e+00", "dlm_acc": "6.439e-01", "anc_acc": "6.285e-01", "epoch": 0.04418} {"step": 22095, "loss": 0.6916, "grad_norm": "1.820e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.207e-01", "anc_loss": "1.500e-01", "dlm_acc": "9.129e-01", "anc_acc": "8.977e-01", "epoch": 0.04419} {"step": 22100, "loss": 1.1373, "grad_norm": "3.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.928e-01", "anc_loss": "8.711e-01", "dlm_acc": "6.942e-01", "anc_acc": "6.709e-01", "epoch": 0.0442} {"step": 22105, "loss": 1.5749, "grad_norm": "3.432e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.196e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.922e-01", "anc_acc": "5.702e-01", "epoch": 0.04421} {"step": 22110, "loss": 1.0937, "grad_norm": "7.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.727e-01", "anc_loss": "1.083e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.299e-01", "epoch": 0.04422} {"step": 22115, "loss": 1.3348, "grad_norm": "2.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.727e-01", "anc_loss": "6.941e-01", "dlm_acc": "5.348e-01", "anc_acc": "5.223e-01", "epoch": 0.04423} {"step": 22120, "loss": 1.4114, "grad_norm": "3.108e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.238e+00", "dlm_acc": "5.610e-01", "anc_acc": "5.369e-01", "epoch": 0.04424} {"step": 22125, "loss": 1.3521, "grad_norm": "4.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.176e-01", "epoch": 0.04425} {"step": 22130, "loss": 1.0064, "grad_norm": "3.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.175e+00", "dlm_acc": "6.091e-01", "anc_acc": "5.898e-01", "epoch": 0.04426} {"step": 22135, "loss": 1.1167, "grad_norm": "3.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.318e-01", "anc_acc": "5.125e-01", "epoch": 0.04427} {"step": 22140, "loss": 1.0212, "grad_norm": "1.914e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.241e-01", "anc_acc": "5.071e-01", "epoch": 0.04428} {"step": 22145, "loss": 1.1877, "grad_norm": "2.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.428e+00", "dlm_acc": "5.551e-01", "anc_acc": "5.312e-01", "epoch": 0.04429} {"step": 22150, "loss": 0.9328, "grad_norm": "8.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.836e-01", "anc_loss": "1.062e+00", "dlm_acc": "6.463e-01", "anc_acc": "6.306e-01", "epoch": 0.0443} {"step": 22155, "loss": 0.8844, "grad_norm": "3.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.578e-01", "anc_loss": "9.359e-01", "dlm_acc": "6.887e-01", "anc_acc": "6.781e-01", "epoch": 0.04431} {"step": 22160, "loss": 1.3698, "grad_norm": "1.047e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.097e+00", "dlm_acc": "6.249e-01", "anc_acc": "6.095e-01", "epoch": 0.04432} {"step": 22165, "loss": 1.3759, "grad_norm": "3.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.642e+00", "dlm_acc": "5.104e-01", "anc_acc": "4.892e-01", "epoch": 0.04433} {"step": 22170, "loss": 0.9302, "grad_norm": "3.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.621e-01", "anc_loss": "8.238e-01", "dlm_acc": "6.900e-01", "anc_acc": "6.735e-01", "epoch": 0.04434} {"step": 22175, "loss": 1.1574, "grad_norm": "3.855e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.000e-01", "anc_acc": "4.770e-01", "epoch": 0.04435} {"step": 22180, "loss": 1.3109, "grad_norm": "3.021e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.076e+00", "anc_loss": "1.181e+00", "dlm_acc": "5.936e-01", "anc_acc": "5.686e-01", "epoch": 0.04436} {"step": 22185, "loss": 1.5914, "grad_norm": "4.237e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.658e+00", "anc_loss": "1.769e+00", "dlm_acc": "5.020e-01", "anc_acc": "4.806e-01", "epoch": 0.04437} {"step": 22190, "loss": 0.9722, "grad_norm": "2.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.797e-01", "anc_loss": "1.067e+00", "dlm_acc": "5.886e-01", "anc_acc": "5.637e-01", "epoch": 0.04438} {"step": 22195, "loss": 1.5554, "grad_norm": "7.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.953e+00", "anc_loss": "2.058e+00", "dlm_acc": "4.194e-01", "anc_acc": "4.016e-01", "epoch": 0.04439} {"step": 22200, "loss": 1.5301, "grad_norm": "3.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.717e+00", "dlm_acc": "4.972e-01", "anc_acc": "4.727e-01", "epoch": 0.0444} {"step": 22205, "loss": 1.7365, "grad_norm": "2.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.531e+00", "anc_loss": "1.654e+00", "dlm_acc": "5.376e-01", "anc_acc": "5.098e-01", "epoch": 0.04441} {"step": 22210, "loss": 1.5588, "grad_norm": "4.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.421e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.127e-01", "epoch": 0.04442} {"step": 22215, "loss": 1.3046, "grad_norm": "2.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.279e+00", "dlm_acc": "5.792e-01", "anc_acc": "5.583e-01", "epoch": 0.04443} {"step": 22220, "loss": 0.7949, "grad_norm": "3.486e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.684e-01", "anc_loss": "9.672e-01", "dlm_acc": "6.724e-01", "anc_acc": "6.434e-01", "epoch": 0.04444} {"step": 22225, "loss": 1.1131, "grad_norm": "2.389e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.236e-01", "anc_acc": "5.006e-01", "epoch": 0.04445} {"step": 22230, "loss": 0.8718, "grad_norm": "4.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.252e+00", "dlm_acc": "6.000e-01", "anc_acc": "5.786e-01", "epoch": 0.04446} {"step": 22235, "loss": 1.0789, "grad_norm": "3.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.271e-01", "anc_acc": "4.986e-01", "epoch": 0.04447} {"step": 22240, "loss": 1.9569, "grad_norm": "4.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.708e+00", "anc_loss": "1.794e+00", "dlm_acc": "4.939e-01", "anc_acc": "4.758e-01", "epoch": 0.04448} {"step": 22245, "loss": 1.4207, "grad_norm": "3.540e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.188e+00", "dlm_acc": "5.500e-01", "anc_acc": "5.261e-01", "epoch": 0.04449} {"step": 22250, "loss": 1.1475, "grad_norm": "3.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.664e-01", "anc_loss": "1.032e+00", "dlm_acc": "5.987e-01", "anc_acc": "5.809e-01", "epoch": 0.0445} {"step": 22255, "loss": 1.3208, "grad_norm": "4.157e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.564e-01", "anc_acc": "5.216e-01", "epoch": 0.04451} {"step": 22260, "loss": 0.872, "grad_norm": "2.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.205e+00", "dlm_acc": "5.981e-01", "anc_acc": "5.628e-01", "epoch": 0.04452} {"step": 22265, "loss": 1.6929, "grad_norm": "3.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.521e-01", "anc_acc": "5.383e-01", "epoch": 0.04453} {"step": 22270, "loss": 0.9544, "grad_norm": "5.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.922e-01", "anc_loss": "1.071e+00", "dlm_acc": "5.833e-01", "anc_acc": "5.565e-01", "epoch": 0.04454} {"step": 22275, "loss": 1.2209, "grad_norm": "3.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.207e+00", "dlm_acc": "5.689e-01", "anc_acc": "5.557e-01", "epoch": 0.04455} {"step": 22280, "loss": 0.9033, "grad_norm": "2.984e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.523e-01", "anc_loss": "9.660e-01", "dlm_acc": "6.725e-01", "anc_acc": "6.412e-01", "epoch": 0.04456} {"step": 22285, "loss": 1.2834, "grad_norm": "2.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.398e-01", "anc_loss": "1.078e+00", "dlm_acc": "7.110e-01", "anc_acc": "6.852e-01", "epoch": 0.04457} {"step": 22290, "loss": 1.0623, "grad_norm": "3.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.680e-01", "anc_loss": "9.852e-01", "dlm_acc": "5.893e-01", "anc_acc": "5.516e-01", "epoch": 0.04458} {"step": 22295, "loss": 0.6524, "grad_norm": "1.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.395e-01", "anc_loss": "5.477e-01", "dlm_acc": "5.039e-01", "anc_acc": "5.002e-01", "epoch": 0.04459} {"step": 22300, "loss": 0.9166, "grad_norm": "3.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.383e-01", "anc_loss": "7.562e-01", "dlm_acc": "5.125e-01", "anc_acc": "5.056e-01", "epoch": 0.0446} {"step": 22305, "loss": 0.5629, "grad_norm": "2.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.844e-01", "anc_loss": "5.918e-01", "dlm_acc": "5.088e-01", "anc_acc": "5.036e-01", "epoch": 0.04461} {"step": 22310, "loss": 0.9142, "grad_norm": "2.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.922e-01", "anc_loss": "7.039e-01", "dlm_acc": "5.032e-01", "anc_acc": "4.967e-01", "epoch": 0.04462} {"step": 22315, "loss": 0.731, "grad_norm": "1.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.695e-01", "anc_loss": "5.773e-01", "dlm_acc": "5.249e-01", "anc_acc": "5.212e-01", "epoch": 0.04463} {"step": 22320, "loss": 0.6887, "grad_norm": "3.629e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.242e-01", "anc_loss": "7.633e-01", "dlm_acc": "5.482e-01", "anc_acc": "5.355e-01", "epoch": 0.04464} {"step": 22325, "loss": 1.0015, "grad_norm": "5.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.092e+00", "anc_loss": "1.181e+00", "dlm_acc": "5.278e-01", "anc_acc": "5.039e-01", "epoch": 0.04465} {"step": 22330, "loss": 0.9822, "grad_norm": "3.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.208e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.796e-01", "anc_acc": "5.560e-01", "epoch": 0.04466} {"step": 22335, "loss": 0.9843, "grad_norm": "5.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.734e-01", "anc_loss": "3.047e-01", "dlm_acc": "9.091e-01", "anc_acc": "9.024e-01", "epoch": 0.04467} {"step": 22340, "loss": 1.228, "grad_norm": "3.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.979e+00", "anc_loss": "2.050e+00", "dlm_acc": "3.325e-01", "anc_acc": "3.177e-01", "epoch": 0.04468} {"step": 22345, "loss": 1.2896, "grad_norm": "3.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.981e+00", "anc_loss": "2.047e+00", "dlm_acc": "3.440e-01", "anc_acc": "3.314e-01", "epoch": 0.04469} {"step": 22350, "loss": 1.035, "grad_norm": "2.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.556e-01", "anc_acc": "5.238e-01", "epoch": 0.0447} {"step": 22355, "loss": 1.3062, "grad_norm": "5.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.526e+00", "anc_loss": "1.639e+00", "dlm_acc": "5.107e-01", "anc_acc": "4.829e-01", "epoch": 0.04471} {"step": 22360, "loss": 0.8725, "grad_norm": "4.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.211e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.645e-01", "anc_acc": "5.384e-01", "epoch": 0.04472} {"step": 22365, "loss": 1.0322, "grad_norm": "4.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.016e+00", "anc_loss": "2.052e+00", "dlm_acc": "2.351e-01", "anc_acc": "2.266e-01", "epoch": 0.04473} {"step": 22370, "loss": 0.9415, "grad_norm": "1.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.213e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.521e-01", "anc_acc": "5.282e-01", "epoch": 0.04474} {"step": 22375, "loss": 0.8672, "grad_norm": "2.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.908e-01", "anc_loss": "8.469e-01", "dlm_acc": "7.019e-01", "anc_acc": "6.853e-01", "epoch": 0.04475} {"step": 22380, "loss": 0.7081, "grad_norm": "4.518e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.967e-01", "anc_loss": "3.363e-01", "dlm_acc": "8.172e-01", "anc_acc": "8.018e-01", "epoch": 0.04476} {"step": 22385, "loss": 0.9908, "grad_norm": "3.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.063e+00", "anc_loss": "1.171e+00", "dlm_acc": "6.251e-01", "anc_acc": "5.932e-01", "epoch": 0.04477} {"step": 22390, "loss": 0.7631, "grad_norm": "3.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.449e-01", "anc_loss": "8.113e-01", "dlm_acc": "7.016e-01", "anc_acc": "6.847e-01", "epoch": 0.04478} {"step": 22395, "loss": 0.9102, "grad_norm": "4.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.253e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.328e-01", "epoch": 0.04479} {"step": 22400, "loss": 1.0847, "grad_norm": "4.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.257e+00", "dlm_acc": "6.099e-01", "anc_acc": "5.915e-01", "epoch": 0.0448} {"step": 22405, "loss": 1.0315, "grad_norm": "3.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.213e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.661e-01", "anc_acc": "5.451e-01", "epoch": 0.04481} {"step": 22410, "loss": 1.3315, "grad_norm": "3.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.947e-01", "anc_acc": "5.773e-01", "epoch": 0.04482} {"step": 22415, "loss": 0.8376, "grad_norm": "1.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.875e-01", "anc_loss": "1.063e+00", "dlm_acc": "6.119e-01", "anc_acc": "5.932e-01", "epoch": 0.04483} {"step": 22420, "loss": 1.0131, "grad_norm": "3.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.562e+00", "anc_loss": "1.664e+00", "dlm_acc": "5.007e-01", "anc_acc": "4.805e-01", "epoch": 0.04484} {"step": 22425, "loss": 1.1202, "grad_norm": "3.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.463e+00", "anc_loss": "1.571e+00", "dlm_acc": "5.298e-01", "anc_acc": "5.077e-01", "epoch": 0.04485} {"step": 22430, "loss": 1.2433, "grad_norm": "3.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.323e-01", "epoch": 0.04486} {"step": 22435, "loss": 1.1196, "grad_norm": "4.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.367e-01", "anc_acc": "5.152e-01", "epoch": 0.04487} {"step": 22440, "loss": 1.6713, "grad_norm": "3.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.534e+00", "anc_loss": "1.639e+00", "dlm_acc": "5.305e-01", "anc_acc": "5.102e-01", "epoch": 0.04488} {"step": 22445, "loss": 1.1755, "grad_norm": "5.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.556e+00", "dlm_acc": "5.124e-01", "anc_acc": "4.928e-01", "epoch": 0.04489} {"step": 22450, "loss": 1.0695, "grad_norm": "2.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.969e-01", "anc_loss": "8.773e-01", "dlm_acc": "6.718e-01", "anc_acc": "6.485e-01", "epoch": 0.0449} {"step": 22455, "loss": 0.9512, "grad_norm": "3.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.063e+00", "anc_loss": "1.156e+00", "dlm_acc": "5.755e-01", "anc_acc": "5.511e-01", "epoch": 0.04491} {"step": 22460, "loss": 0.9915, "grad_norm": "3.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.746e-01", "anc_loss": "7.262e-01", "dlm_acc": "6.877e-01", "anc_acc": "6.722e-01", "epoch": 0.04492} {"step": 22465, "loss": 1.1519, "grad_norm": "3.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.555e-01", "anc_acc": "5.314e-01", "epoch": 0.04493} {"step": 22470, "loss": 1.3946, "grad_norm": "2.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.630e+00", "dlm_acc": "5.154e-01", "anc_acc": "4.874e-01", "epoch": 0.04494} {"step": 22475, "loss": 1.1583, "grad_norm": "3.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.462e+00", "dlm_acc": "4.656e-01", "anc_acc": "4.512e-01", "epoch": 0.04495} {"step": 22480, "loss": 1.2928, "grad_norm": "3.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.738e+00", "anc_loss": "1.830e+00", "dlm_acc": "4.580e-01", "anc_acc": "4.373e-01", "epoch": 0.04496} {"step": 22485, "loss": 1.3, "grad_norm": "2.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.759e-01", "anc_acc": "5.564e-01", "epoch": 0.04497} {"step": 22490, "loss": 1.4386, "grad_norm": "3.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.758e-01", "anc_acc": "5.520e-01", "epoch": 0.04498} {"step": 22495, "loss": 1.4209, "grad_norm": "3.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.556e-01", "anc_acc": "5.317e-01", "epoch": 0.04499} {"step": 22500, "loss": 1.6181, "grad_norm": "1.785e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.377e-01", "anc_acc": "5.164e-01", "epoch": 0.045} {"step": 22505, "loss": 1.0929, "grad_norm": "2.855e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.130e+00", "dlm_acc": "5.701e-01", "anc_acc": "5.552e-01", "epoch": 0.04501} {"step": 22510, "loss": 1.1686, "grad_norm": "5.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.448e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.224e-01", "epoch": 0.04502} {"step": 22515, "loss": 1.0597, "grad_norm": "3.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.395e-01", "anc_loss": "7.967e-01", "dlm_acc": "7.187e-01", "anc_acc": "7.062e-01", "epoch": 0.04503} {"step": 22520, "loss": 1.1616, "grad_norm": "2.858e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.551e-01", "anc_loss": "9.258e-01", "dlm_acc": "6.947e-01", "anc_acc": "6.786e-01", "epoch": 0.04504} {"step": 22525, "loss": 1.2072, "grad_norm": "3.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.498e-01", "anc_loss": "9.205e-01", "dlm_acc": "7.088e-01", "anc_acc": "6.924e-01", "epoch": 0.04505} {"step": 22530, "loss": 1.2958, "grad_norm": "3.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.102e-01", "anc_loss": "9.633e-01", "dlm_acc": "6.377e-01", "anc_acc": "6.240e-01", "epoch": 0.04506} {"step": 22535, "loss": 1.4142, "grad_norm": "5.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.572e-01", "anc_acc": "5.405e-01", "epoch": 0.04507} {"step": 22540, "loss": 1.3837, "grad_norm": "4.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.592e+00", "anc_loss": "1.683e+00", "dlm_acc": "4.857e-01", "anc_acc": "4.675e-01", "epoch": 0.04508} {"step": 22545, "loss": 0.8488, "grad_norm": "3.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.472e+00", "anc_loss": "1.559e+00", "dlm_acc": "4.583e-01", "anc_acc": "4.397e-01", "epoch": 0.04509} {"step": 22550, "loss": 1.0231, "grad_norm": "3.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.095e+00", "dlm_acc": "6.239e-01", "anc_acc": "6.035e-01", "epoch": 0.0451} {"step": 22555, "loss": 1.0931, "grad_norm": "2.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.450e+00", "dlm_acc": "4.958e-01", "anc_acc": "4.749e-01", "epoch": 0.04511} {"step": 22560, "loss": 1.071, "grad_norm": "2.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.444e+00", "dlm_acc": "5.658e-01", "anc_acc": "5.421e-01", "epoch": 0.04512} {"step": 22565, "loss": 0.949, "grad_norm": "3.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.369e+00", "dlm_acc": "5.725e-01", "anc_acc": "5.512e-01", "epoch": 0.04513} {"step": 22570, "loss": 0.9832, "grad_norm": "3.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.729e+00", "dlm_acc": "4.321e-01", "anc_acc": "4.151e-01", "epoch": 0.04514} {"step": 22575, "loss": 0.883, "grad_norm": "2.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.708e+00", "dlm_acc": "5.140e-01", "anc_acc": "4.943e-01", "epoch": 0.04515} {"step": 22580, "loss": 1.396, "grad_norm": "4.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.630e+00", "anc_loss": "1.725e+00", "dlm_acc": "4.849e-01", "anc_acc": "4.671e-01", "epoch": 0.04516} {"step": 22585, "loss": 0.9194, "grad_norm": "2.765e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.177e+00", "dlm_acc": "6.199e-01", "anc_acc": "5.954e-01", "epoch": 0.04517} {"step": 22590, "loss": 0.8726, "grad_norm": "2.259e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.083e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.944e-01", "anc_acc": "5.737e-01", "epoch": 0.04518} {"step": 22595, "loss": 1.1906, "grad_norm": "2.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.520e+00", "dlm_acc": "5.447e-01", "anc_acc": "5.233e-01", "epoch": 0.04519} {"step": 22600, "loss": 1.0128, "grad_norm": "5.061e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.321e+00", "dlm_acc": "5.839e-01", "anc_acc": "5.609e-01", "epoch": 0.0452} {"step": 22605, "loss": 1.3573, "grad_norm": "3.187e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.578e+00", "anc_loss": "1.673e+00", "dlm_acc": "4.981e-01", "anc_acc": "4.771e-01", "epoch": 0.04521} {"step": 22610, "loss": 1.153, "grad_norm": "3.795e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.250e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.931e-01", "anc_acc": "5.678e-01", "epoch": 0.04522} {"step": 22615, "loss": 1.3227, "grad_norm": "2.662e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.579e+00", "dlm_acc": "5.318e-01", "anc_acc": "5.036e-01", "epoch": 0.04523} {"step": 22620, "loss": 1.1514, "grad_norm": "3.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.625e-01", "anc_acc": "5.413e-01", "epoch": 0.04524} {"step": 22625, "loss": 1.14, "grad_norm": "3.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.818e-01", "anc_acc": "5.570e-01", "epoch": 0.04525} {"step": 22630, "loss": 0.9953, "grad_norm": "4.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.041e+00", "anc_loss": "1.123e+00", "dlm_acc": "6.022e-01", "anc_acc": "5.812e-01", "epoch": 0.04526} {"step": 22635, "loss": 1.5965, "grad_norm": "2.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.748e-01", "anc_acc": "5.532e-01", "epoch": 0.04527} {"step": 22640, "loss": 0.927, "grad_norm": "3.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.146e+00", "anc_loss": "1.248e+00", "dlm_acc": "6.086e-01", "anc_acc": "5.832e-01", "epoch": 0.04528} {"step": 22645, "loss": 0.9876, "grad_norm": "2.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.646e-01", "anc_acc": "5.443e-01", "epoch": 0.04529} {"step": 22650, "loss": 1.232, "grad_norm": "5.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.444e+00", "dlm_acc": "5.365e-01", "anc_acc": "5.175e-01", "epoch": 0.0453} {"step": 22655, "loss": 1.1858, "grad_norm": "3.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.895e-01", "anc_loss": "8.945e-01", "dlm_acc": "6.998e-01", "anc_acc": "6.695e-01", "epoch": 0.04531} {"step": 22660, "loss": 1.0453, "grad_norm": "3.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.202e-01", "anc_acc": "5.081e-01", "epoch": 0.04532} {"step": 22665, "loss": 1.363, "grad_norm": "3.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.375e+00", "dlm_acc": "5.675e-01", "anc_acc": "5.488e-01", "epoch": 0.04533} {"step": 22670, "loss": 1.0561, "grad_norm": "4.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.547e-01", "anc_acc": "5.303e-01", "epoch": 0.04534} {"step": 22675, "loss": 1.466, "grad_norm": "4.869e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.530e+00", "dlm_acc": "4.655e-01", "anc_acc": "4.433e-01", "epoch": 0.04535} {"step": 22680, "loss": 1.0849, "grad_norm": "7.748e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.944e-01", "anc_loss": "1.087e+00", "dlm_acc": "6.728e-01", "anc_acc": "6.475e-01", "epoch": 0.04536} {"step": 22685, "loss": 1.2663, "grad_norm": "3.348e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.417e+00", "dlm_acc": "5.515e-01", "anc_acc": "5.274e-01", "epoch": 0.04537} {"step": 22690, "loss": 0.9646, "grad_norm": "4.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.053e-01", "anc_acc": "4.837e-01", "epoch": 0.04538} {"step": 22695, "loss": 1.0725, "grad_norm": "4.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.648e+00", "anc_loss": "1.715e+00", "dlm_acc": "4.005e-01", "anc_acc": "3.849e-01", "epoch": 0.04539} {"step": 22700, "loss": 1.369, "grad_norm": "4.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.791e+00", "anc_loss": "2.819e+00", "dlm_acc": "4.795e-02", "anc_acc": "4.486e-02", "epoch": 0.0454} {"step": 22705, "loss": 1.1299, "grad_norm": "4.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.906e+00", "anc_loss": "1.980e+00", "dlm_acc": "3.396e-01", "anc_acc": "3.248e-01", "epoch": 0.04541} {"step": 22710, "loss": 1.3067, "grad_norm": "4.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.622e+00", "anc_loss": "1.825e+00", "dlm_acc": "5.056e-01", "anc_acc": "4.597e-01", "epoch": 0.04542} {"step": 22715, "loss": 1.1525, "grad_norm": "5.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.875e-01", "anc_loss": "8.176e-01", "dlm_acc": "5.765e-01", "anc_acc": "5.660e-01", "epoch": 0.04543} {"step": 22720, "loss": 1.2957, "grad_norm": "7.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.695e-01", "anc_loss": "8.945e-01", "dlm_acc": "4.321e-01", "anc_acc": "4.252e-01", "epoch": 0.04544} {"step": 22725, "loss": 0.7904, "grad_norm": "3.485e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.477e-01", "anc_loss": "6.625e-01", "dlm_acc": "4.783e-01", "anc_acc": "4.698e-01", "epoch": 0.04545} {"step": 22730, "loss": 0.7478, "grad_norm": "3.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.562e-01", "anc_loss": "7.695e-01", "dlm_acc": "4.433e-01", "anc_acc": "4.367e-01", "epoch": 0.04546} {"step": 22735, "loss": 0.8157, "grad_norm": "5.267e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.336e-01", "anc_loss": "7.508e-01", "dlm_acc": "4.287e-01", "anc_acc": "4.222e-01", "epoch": 0.04547} {"step": 22740, "loss": 0.6913, "grad_norm": "4.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.754e-01", "anc_loss": "8.035e-01", "dlm_acc": "4.713e-01", "anc_acc": "4.573e-01", "epoch": 0.04548} {"step": 22745, "loss": 0.895, "grad_norm": "5.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.730e-01", "anc_loss": "8.398e-01", "dlm_acc": "6.040e-01", "anc_acc": "5.846e-01", "epoch": 0.04549} {"step": 22750, "loss": 1.2651, "grad_norm": "7.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.524e+00", "anc_loss": "1.682e+00", "dlm_acc": "5.203e-01", "anc_acc": "4.869e-01", "epoch": 0.0455} {"step": 22755, "loss": 1.4218, "grad_norm": "4.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.360e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.049e-01", "anc_acc": "4.830e-01", "epoch": 0.04551} {"step": 22760, "loss": 1.6655, "grad_norm": "6.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.734e+00", "anc_loss": "2.741e+00", "dlm_acc": "5.041e-02", "anc_acc": "5.210e-02", "epoch": 0.04552} {"step": 22765, "loss": 1.6669, "grad_norm": "5.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.997e+00", "anc_loss": "3.000e+00", "dlm_acc": "2.109e-02", "anc_acc": "2.094e-02", "epoch": 0.04553} {"step": 22770, "loss": 1.5767, "grad_norm": "3.056e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.775e+00", "anc_loss": "2.778e+00", "dlm_acc": "2.231e-02", "anc_acc": "2.271e-02", "epoch": 0.04554} {"step": 22775, "loss": 1.4235, "grad_norm": "2.300e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.568e+00", "anc_loss": "2.593e+00", "dlm_acc": "1.554e-01", "anc_acc": "1.503e-01", "epoch": 0.04555} {"step": 22780, "loss": 1.1656, "grad_norm": "4.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.869e-01", "anc_acc": "5.648e-01", "epoch": 0.04556} {"step": 22785, "loss": 1.5966, "grad_norm": "4.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.092e+00", "anc_loss": "1.193e+00", "dlm_acc": "5.645e-01", "anc_acc": "5.446e-01", "epoch": 0.04557} {"step": 22790, "loss": 1.0744, "grad_norm": "3.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.879e-01", "anc_loss": "7.863e-01", "dlm_acc": "7.279e-01", "anc_acc": "6.968e-01", "epoch": 0.04558} {"step": 22795, "loss": 1.1465, "grad_norm": "7.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.263e+00", "dlm_acc": "5.875e-01", "anc_acc": "5.609e-01", "epoch": 0.04559} {"step": 22800, "loss": 1.2332, "grad_norm": "4.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.289e-01", "anc_loss": "9.922e-01", "dlm_acc": "6.198e-01", "anc_acc": "6.039e-01", "epoch": 0.0456} {"step": 22805, "loss": 1.3169, "grad_norm": "5.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.531e+00", "anc_loss": "1.615e+00", "dlm_acc": "4.743e-01", "anc_acc": "4.549e-01", "epoch": 0.04561} {"step": 22810, "loss": 1.1791, "grad_norm": "3.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.504e+00", "dlm_acc": "5.155e-01", "anc_acc": "4.843e-01", "epoch": 0.04562} {"step": 22815, "loss": 1.0218, "grad_norm": "2.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.150e-01", "anc_acc": "4.929e-01", "epoch": 0.04563} {"step": 22820, "loss": 1.3134, "grad_norm": "3.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.330e+00", "dlm_acc": "4.690e-01", "anc_acc": "4.550e-01", "epoch": 0.04564} {"step": 22825, "loss": 1.2247, "grad_norm": "3.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.516e-01", "anc_loss": "9.891e-01", "dlm_acc": "4.976e-01", "anc_acc": "4.861e-01", "epoch": 0.04565} {"step": 22830, "loss": 1.5353, "grad_norm": "4.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.581e+00", "anc_loss": "1.675e+00", "dlm_acc": "4.812e-01", "anc_acc": "4.631e-01", "epoch": 0.04566} {"step": 22835, "loss": 1.1149, "grad_norm": "4.629e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.206e+00", "anc_loss": "1.292e+00", "dlm_acc": "4.890e-01", "anc_acc": "4.696e-01", "epoch": 0.04567} {"step": 22840, "loss": 1.0689, "grad_norm": "2.836e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.105e+00", "dlm_acc": "5.686e-01", "anc_acc": "5.416e-01", "epoch": 0.04568} {"step": 22845, "loss": 0.9379, "grad_norm": "4.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.250e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.048e-01", "anc_acc": "5.705e-01", "epoch": 0.04569} {"step": 22850, "loss": 0.6546, "grad_norm": "3.510e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.477e-01", "anc_loss": "8.496e-01", "dlm_acc": "6.631e-01", "anc_acc": "6.329e-01", "epoch": 0.0457} {"step": 22855, "loss": 1.2234, "grad_norm": "4.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.737e-01", "anc_acc": "5.441e-01", "epoch": 0.04571} {"step": 22860, "loss": 1.1277, "grad_norm": "3.487e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.441e-01", "anc_loss": "9.688e-01", "dlm_acc": "6.524e-01", "anc_acc": "6.160e-01", "epoch": 0.04572} {"step": 22865, "loss": 1.0775, "grad_norm": "9.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.479e+00", "anc_loss": "1.573e+00", "dlm_acc": "4.936e-01", "anc_acc": "4.742e-01", "epoch": 0.04573} {"step": 22870, "loss": 1.3782, "grad_norm": "1.735e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.716e+00", "anc_loss": "1.791e+00", "dlm_acc": "4.376e-01", "anc_acc": "4.196e-01", "epoch": 0.04574} {"step": 22875, "loss": 1.2793, "grad_norm": "2.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.480e+00", "anc_loss": "1.556e+00", "dlm_acc": "4.353e-01", "anc_acc": "4.179e-01", "epoch": 0.04575} {"step": 22880, "loss": 1.2373, "grad_norm": "3.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.041e-01", "anc_loss": "9.969e-01", "dlm_acc": "6.313e-01", "anc_acc": "6.031e-01", "epoch": 0.04576} {"step": 22885, "loss": 1.1663, "grad_norm": "4.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.267e+00", "dlm_acc": "5.240e-01", "anc_acc": "5.054e-01", "epoch": 0.04577} {"step": 22890, "loss": 1.4316, "grad_norm": "3.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.249e+00", "dlm_acc": "5.505e-01", "anc_acc": "5.318e-01", "epoch": 0.04578} {"step": 22895, "loss": 0.9719, "grad_norm": "2.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.918e-01", "anc_loss": "6.574e-01", "dlm_acc": "6.655e-01", "anc_acc": "6.397e-01", "epoch": 0.04579} {"step": 22900, "loss": 1.3207, "grad_norm": "2.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.316e-01", "anc_loss": "9.859e-01", "dlm_acc": "5.601e-01", "anc_acc": "5.457e-01", "epoch": 0.0458} {"step": 22905, "loss": 1.0799, "grad_norm": "2.649e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.409e-01", "anc_acc": "5.229e-01", "epoch": 0.04581} {"step": 22910, "loss": 0.8418, "grad_norm": "2.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.656e-01", "anc_loss": "4.023e-01", "dlm_acc": "7.294e-01", "anc_acc": "7.076e-01", "epoch": 0.04582} {"step": 22915, "loss": 1.0428, "grad_norm": "2.365e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.919e-01", "anc_loss": "8.471e-01", "dlm_acc": "6.357e-01", "anc_acc": "6.167e-01", "epoch": 0.04583} {"step": 22920, "loss": 1.1678, "grad_norm": "4.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.012e-01", "anc_loss": "5.332e-01", "dlm_acc": "6.323e-01", "anc_acc": "6.104e-01", "epoch": 0.04584} {"step": 22925, "loss": 1.2748, "grad_norm": "2.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.504e-01", "anc_loss": "6.676e-01", "dlm_acc": "6.083e-01", "anc_acc": "5.986e-01", "epoch": 0.04585} {"step": 22930, "loss": 1.5228, "grad_norm": "4.341e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.375e+00", "dlm_acc": "5.267e-01", "anc_acc": "5.051e-01", "epoch": 0.04586} {"step": 22935, "loss": 1.4078, "grad_norm": "6.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.816e-01", "anc_loss": "1.054e+00", "dlm_acc": "6.093e-01", "anc_acc": "5.924e-01", "epoch": 0.04587} {"step": 22940, "loss": 1.1516, "grad_norm": "2.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.418e-01", "anc_loss": "8.117e-01", "dlm_acc": "7.015e-01", "anc_acc": "6.773e-01", "epoch": 0.04588} {"step": 22945, "loss": 1.3555, "grad_norm": "3.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.443e-01", "anc_loss": "4.879e-01", "dlm_acc": "8.110e-01", "anc_acc": "7.942e-01", "epoch": 0.04589} {"step": 22950, "loss": 1.4096, "grad_norm": "3.583e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.202e+00", "dlm_acc": "5.548e-01", "anc_acc": "5.360e-01", "epoch": 0.0459} {"step": 22955, "loss": 1.0529, "grad_norm": "3.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.461e-01", "anc_loss": "6.152e-01", "dlm_acc": "7.410e-01", "anc_acc": "7.139e-01", "epoch": 0.04591} {"step": 22960, "loss": 1.4479, "grad_norm": "3.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.016e-01", "anc_loss": "9.812e-01", "dlm_acc": "6.512e-01", "anc_acc": "6.282e-01", "epoch": 0.04592} {"step": 22965, "loss": 1.6083, "grad_norm": "4.598e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.037e-01", "anc_loss": "9.951e-01", "dlm_acc": "6.395e-01", "anc_acc": "6.182e-01", "epoch": 0.04593} {"step": 22970, "loss": 1.1837, "grad_norm": "3.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.534e-01", "anc_loss": "6.015e-01", "dlm_acc": "8.068e-01", "anc_acc": "7.935e-01", "epoch": 0.04594} {"step": 22975, "loss": 1.2484, "grad_norm": "1.324e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.125e-01", "anc_loss": "8.930e-01", "dlm_acc": "6.729e-01", "anc_acc": "6.516e-01", "epoch": 0.04595} {"step": 22980, "loss": 1.4086, "grad_norm": "3.385e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.114e+00", "dlm_acc": "5.189e-01", "anc_acc": "5.030e-01", "epoch": 0.04596} {"step": 22985, "loss": 1.1514, "grad_norm": "3.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.685e-01", "anc_acc": "5.464e-01", "epoch": 0.04597} {"step": 22990, "loss": 1.1099, "grad_norm": "2.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.699e-01", "anc_loss": "2.811e-01", "dlm_acc": "8.342e-01", "anc_acc": "8.281e-01", "epoch": 0.04598} {"step": 22995, "loss": 1.156, "grad_norm": "2.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.156e-01", "anc_loss": "5.713e-01", "dlm_acc": "7.297e-01", "anc_acc": "7.059e-01", "epoch": 0.04599} {"step": 23000, "loss": 1.2744, "grad_norm": "3.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.922e-01", "anc_loss": "4.324e-01", "dlm_acc": "7.191e-01", "anc_acc": "6.931e-01", "epoch": 0.046} {"step": 23005, "loss": 0.9181, "grad_norm": "3.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.320e-01", "anc_loss": "4.775e-01", "dlm_acc": "7.450e-01", "anc_acc": "7.202e-01", "epoch": 0.04601} {"step": 23010, "loss": 1.5058, "grad_norm": "8.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.251e-01", "anc_loss": "1.002e+00", "dlm_acc": "6.346e-01", "anc_acc": "6.164e-01", "epoch": 0.04602} {"step": 23015, "loss": 1.4753, "grad_norm": "7.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.183e+00", "dlm_acc": "5.586e-01", "anc_acc": "5.384e-01", "epoch": 0.04603} {"step": 23020, "loss": 1.2093, "grad_norm": "2.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.781e-01", "anc_loss": "1.047e+00", "dlm_acc": "5.557e-01", "anc_acc": "5.329e-01", "epoch": 0.04604} {"step": 23025, "loss": 1.4532, "grad_norm": "3.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.984e-01", "anc_loss": "8.453e-01", "dlm_acc": "4.876e-01", "anc_acc": "4.612e-01", "epoch": 0.04605} {"step": 23030, "loss": 0.9139, "grad_norm": "1.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.250e-01", "anc_loss": "5.832e-01", "dlm_acc": "5.581e-01", "anc_acc": "5.102e-01", "epoch": 0.04606} {"step": 23035, "loss": 1.5714, "grad_norm": "2.794e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.516e-01", "anc_loss": "8.141e-01", "dlm_acc": "5.899e-01", "anc_acc": "5.664e-01", "epoch": 0.04607} {"step": 23040, "loss": 1.0966, "grad_norm": "2.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.371e-01", "anc_loss": "8.051e-01", "dlm_acc": "6.473e-01", "anc_acc": "6.295e-01", "epoch": 0.04608} {"step": 23045, "loss": 1.161, "grad_norm": "2.436e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.971e-01", "anc_loss": "4.354e-01", "dlm_acc": "6.946e-01", "anc_acc": "6.719e-01", "epoch": 0.04609} {"step": 23050, "loss": 1.1774, "grad_norm": "3.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.730e-01", "anc_loss": "6.129e-01", "dlm_acc": "6.371e-01", "anc_acc": "6.132e-01", "epoch": 0.0461} {"step": 23055, "loss": 1.4128, "grad_norm": "2.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.816e-01", "anc_loss": "7.031e-01", "dlm_acc": "5.432e-01", "anc_acc": "5.325e-01", "epoch": 0.04611} {"step": 23060, "loss": 1.1601, "grad_norm": "5.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.078e-01", "anc_loss": "7.484e-01", "dlm_acc": "5.680e-01", "anc_acc": "5.527e-01", "epoch": 0.04612} {"step": 23065, "loss": 1.5356, "grad_norm": "4.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.660e-01", "anc_loss": "8.047e-01", "dlm_acc": "5.658e-01", "anc_acc": "5.527e-01", "epoch": 0.04613} {"step": 23070, "loss": 0.9293, "grad_norm": "1.294e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.961e-01", "anc_loss": "7.211e-01", "dlm_acc": "5.612e-01", "anc_acc": "5.546e-01", "epoch": 0.04614} {"step": 23075, "loss": 1.4165, "grad_norm": "4.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.680e-01", "anc_loss": "9.164e-01", "dlm_acc": "5.639e-01", "anc_acc": "5.462e-01", "epoch": 0.04615} {"step": 23080, "loss": 1.2162, "grad_norm": "3.862e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.079e+00", "dlm_acc": "5.732e-01", "anc_acc": "5.532e-01", "epoch": 0.04616} {"step": 23085, "loss": 1.2496, "grad_norm": "7.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.123e-01", "anc_loss": "8.689e-01", "dlm_acc": "6.063e-01", "anc_acc": "5.887e-01", "epoch": 0.04617} {"step": 23090, "loss": 0.9654, "grad_norm": "3.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.996e-01", "anc_loss": "8.695e-01", "dlm_acc": "6.595e-01", "anc_acc": "6.392e-01", "epoch": 0.04618} {"step": 23095, "loss": 1.0206, "grad_norm": "2.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.754e-01", "anc_acc": "5.508e-01", "epoch": 0.04619} {"step": 23100, "loss": 0.9839, "grad_norm": "3.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.043e-01", "anc_loss": "9.938e-01", "dlm_acc": "6.518e-01", "anc_acc": "6.261e-01", "epoch": 0.0462} {"step": 23105, "loss": 1.3767, "grad_norm": "3.780e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.660e-01", "anc_loss": "1.050e+00", "dlm_acc": "6.198e-01", "anc_acc": "5.950e-01", "epoch": 0.04621} {"step": 23110, "loss": 1.3662, "grad_norm": "4.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.068e-01", "anc_loss": "4.324e-01", "dlm_acc": "7.126e-01", "anc_acc": "6.995e-01", "epoch": 0.04622} {"step": 23115, "loss": 1.4128, "grad_norm": "3.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.590e-01", "anc_loss": "8.820e-01", "dlm_acc": "4.697e-01", "anc_acc": "4.613e-01", "epoch": 0.04623} {"step": 23120, "loss": 1.1806, "grad_norm": "3.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.215e-01", "anc_loss": "9.949e-01", "dlm_acc": "6.388e-01", "anc_acc": "6.175e-01", "epoch": 0.04624} {"step": 23125, "loss": 0.9948, "grad_norm": "3.182e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.244e-01", "epoch": 0.04625} {"step": 23130, "loss": 1.1214, "grad_norm": "2.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.914e-01", "anc_loss": "9.844e-01", "dlm_acc": "6.552e-01", "anc_acc": "6.348e-01", "epoch": 0.04626} {"step": 23135, "loss": 0.9724, "grad_norm": "4.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.350e-01", "anc_loss": "7.145e-01", "dlm_acc": "7.077e-01", "anc_acc": "6.845e-01", "epoch": 0.04627} {"step": 23140, "loss": 1.1658, "grad_norm": "7.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.629e-01", "anc_loss": "9.305e-01", "dlm_acc": "5.979e-01", "anc_acc": "5.731e-01", "epoch": 0.04628} {"step": 23145, "loss": 1.1878, "grad_norm": "3.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.118e+00", "dlm_acc": "5.375e-01", "anc_acc": "5.182e-01", "epoch": 0.04629} {"step": 23150, "loss": 1.139, "grad_norm": "6.968e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.508e-01", "anc_loss": "6.703e-01", "dlm_acc": "5.556e-01", "anc_acc": "5.439e-01", "epoch": 0.0463} {"step": 23155, "loss": 1.1944, "grad_norm": "3.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.039e-01", "anc_loss": "7.367e-01", "dlm_acc": "5.715e-01", "anc_acc": "5.561e-01", "epoch": 0.04631} {"step": 23160, "loss": 0.8014, "grad_norm": "3.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.828e-01", "anc_loss": "7.383e-01", "dlm_acc": "6.536e-01", "anc_acc": "6.355e-01", "epoch": 0.04632} {"step": 23165, "loss": 0.8906, "grad_norm": "2.696e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.133e+00", "anc_loss": "1.213e+00", "dlm_acc": "6.272e-01", "anc_acc": "6.090e-01", "epoch": 0.04633} {"step": 23170, "loss": 1.1486, "grad_norm": "2.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.246e+00", "dlm_acc": "6.268e-01", "anc_acc": "6.030e-01", "epoch": 0.04634} {"step": 23175, "loss": 0.9614, "grad_norm": "9.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.381e+00", "anc_loss": "1.483e+00", "dlm_acc": "5.293e-01", "anc_acc": "5.079e-01", "epoch": 0.04635} {"step": 23180, "loss": 1.0337, "grad_norm": "3.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.573e+00", "dlm_acc": "5.201e-01", "anc_acc": "4.995e-01", "epoch": 0.04636} {"step": 23185, "loss": 0.8324, "grad_norm": "1.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.129e+00", "dlm_acc": "5.183e-01", "anc_acc": "5.020e-01", "epoch": 0.04637} {"step": 23190, "loss": 0.7599, "grad_norm": "2.678e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.415e-01", "epoch": 0.04638} {"step": 23195, "loss": 0.5674, "grad_norm": "2.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.047e-01", "anc_loss": "9.754e-01", "dlm_acc": "5.578e-01", "anc_acc": "5.355e-01", "epoch": 0.04639} {"step": 23200, "loss": 0.6826, "grad_norm": "3.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.422e-01", "anc_loss": "7.918e-01", "dlm_acc": "5.887e-01", "anc_acc": "5.650e-01", "epoch": 0.0464} {"step": 23205, "loss": 0.6328, "grad_norm": "3.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.500e-01", "anc_loss": "6.137e-01", "dlm_acc": "6.619e-01", "anc_acc": "6.355e-01", "epoch": 0.04641} {"step": 23210, "loss": 0.7782, "grad_norm": "2.728e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.066e-01", "anc_loss": "5.359e-01", "dlm_acc": "5.895e-01", "anc_acc": "5.699e-01", "epoch": 0.04642} {"step": 23215, "loss": 0.8954, "grad_norm": "4.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.684e-01", "anc_acc": "5.457e-01", "epoch": 0.04643} {"step": 23220, "loss": 0.9685, "grad_norm": "4.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.707e-01", "anc_loss": "8.135e-01", "dlm_acc": "6.492e-01", "anc_acc": "6.356e-01", "epoch": 0.04644} {"step": 23225, "loss": 0.9573, "grad_norm": "3.842e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.716e-01", "anc_loss": "5.123e-01", "dlm_acc": "7.689e-01", "anc_acc": "7.532e-01", "epoch": 0.04645} {"step": 23230, "loss": 0.9648, "grad_norm": "3.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.547e-01", "anc_loss": "1.045e+00", "dlm_acc": "6.514e-01", "anc_acc": "6.276e-01", "epoch": 0.04646} {"step": 23235, "loss": 1.1273, "grad_norm": "3.352e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.777e-01", "anc_loss": "9.555e-01", "dlm_acc": "6.451e-01", "anc_acc": "6.229e-01", "epoch": 0.04647} {"step": 23240, "loss": 0.6764, "grad_norm": "1.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.824e-01", "anc_loss": "7.297e-01", "dlm_acc": "6.045e-01", "anc_acc": "5.873e-01", "epoch": 0.04648} {"step": 23245, "loss": 1.0083, "grad_norm": "6.271e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.359e-01", "anc_loss": "9.750e-01", "dlm_acc": "5.125e-01", "anc_acc": "4.987e-01", "epoch": 0.04649} {"step": 23250, "loss": 0.7748, "grad_norm": "5.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.910e-01", "anc_loss": "5.301e-01", "dlm_acc": "7.010e-01", "anc_acc": "6.813e-01", "epoch": 0.0465} {"step": 23255, "loss": 0.8717, "grad_norm": "3.538e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.767e-01", "anc_loss": "2.186e-01", "dlm_acc": "8.732e-01", "anc_acc": "8.468e-01", "epoch": 0.04651} {"step": 23260, "loss": 0.819, "grad_norm": "5.440e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e-01", "anc_loss": "2.021e-01", "dlm_acc": "8.944e-01", "anc_acc": "8.503e-01", "epoch": 0.04652} {"step": 23265, "loss": 0.9842, "grad_norm": "2.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.394e-01", "anc_loss": "3.771e-01", "dlm_acc": "7.746e-01", "anc_acc": "7.506e-01", "epoch": 0.04653} {"step": 23270, "loss": 1.1525, "grad_norm": "3.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.092e+00", "dlm_acc": "6.714e-01", "anc_acc": "6.582e-01", "epoch": 0.04654} {"step": 23275, "loss": 1.2224, "grad_norm": "2.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.797e-01", "anc_loss": "1.065e+00", "dlm_acc": "6.586e-01", "anc_acc": "6.359e-01", "epoch": 0.04655} {"step": 23280, "loss": 1.2783, "grad_norm": "2.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.805e-01", "anc_loss": "1.087e+00", "dlm_acc": "5.796e-01", "anc_acc": "5.551e-01", "epoch": 0.04656} {"step": 23285, "loss": 1.4424, "grad_norm": "2.518e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e+00", "anc_loss": "1.247e+00", "dlm_acc": "5.649e-01", "anc_acc": "5.416e-01", "epoch": 0.04657} {"step": 23290, "loss": 1.2705, "grad_norm": "4.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.239e+00", "dlm_acc": "6.040e-01", "anc_acc": "5.835e-01", "epoch": 0.04658} {"step": 23295, "loss": 1.0784, "grad_norm": "3.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.717e+00", "dlm_acc": "4.858e-01", "anc_acc": "4.634e-01", "epoch": 0.04659} {"step": 23300, "loss": 0.9225, "grad_norm": "4.161e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.642e-01", "anc_loss": "3.990e-01", "dlm_acc": "8.523e-01", "anc_acc": "8.434e-01", "epoch": 0.0466} {"step": 23305, "loss": 1.1219, "grad_norm": "2.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.109e+00", "dlm_acc": "5.925e-01", "anc_acc": "5.730e-01", "epoch": 0.04661} {"step": 23310, "loss": 1.1172, "grad_norm": "3.019e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.988e-01", "anc_acc": "5.749e-01", "epoch": 0.04662} {"step": 23315, "loss": 0.922, "grad_norm": "2.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.281e-01", "anc_loss": "7.922e-01", "dlm_acc": "6.347e-01", "anc_acc": "6.124e-01", "epoch": 0.04663} {"step": 23320, "loss": 1.0367, "grad_norm": "3.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.457e-01", "anc_loss": "8.922e-01", "dlm_acc": "5.408e-01", "anc_acc": "5.186e-01", "epoch": 0.04664} {"step": 23325, "loss": 1.0643, "grad_norm": "2.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.200e+00", "dlm_acc": "6.107e-01", "anc_acc": "5.887e-01", "epoch": 0.04665} {"step": 23330, "loss": 0.7381, "grad_norm": "2.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.531e-01", "anc_loss": "4.855e-01", "dlm_acc": "6.889e-01", "anc_acc": "6.692e-01", "epoch": 0.04666} {"step": 23335, "loss": 1.371, "grad_norm": "5.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.279e+00", "dlm_acc": "6.160e-01", "anc_acc": "5.920e-01", "epoch": 0.04667} {"step": 23340, "loss": 1.3536, "grad_norm": "2.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.151e-01", "anc_acc": "4.969e-01", "epoch": 0.04668} {"step": 23345, "loss": 1.0929, "grad_norm": "5.244e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.279e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.497e-01", "anc_acc": "5.266e-01", "epoch": 0.04669} {"step": 23350, "loss": 0.9126, "grad_norm": "2.740e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.160e-01", "anc_loss": "5.609e-01", "dlm_acc": "6.578e-01", "anc_acc": "6.341e-01", "epoch": 0.0467} {"step": 23355, "loss": 1.666, "grad_norm": "8.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.923e+00", "anc_loss": "2.019e+00", "dlm_acc": "4.620e-01", "anc_acc": "4.459e-01", "epoch": 0.04671} {"step": 23360, "loss": 0.949, "grad_norm": "3.294e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.203e-01", "anc_loss": "1.021e+00", "dlm_acc": "6.499e-01", "anc_acc": "6.241e-01", "epoch": 0.04672} {"step": 23365, "loss": 0.935, "grad_norm": "5.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.277e-01", "anc_loss": "5.863e-01", "dlm_acc": "7.178e-01", "anc_acc": "6.971e-01", "epoch": 0.04673} {"step": 23370, "loss": 0.9071, "grad_norm": "2.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.840e-01", "anc_loss": "9.805e-01", "dlm_acc": "6.858e-01", "anc_acc": "6.631e-01", "epoch": 0.04674} {"step": 23375, "loss": 1.077, "grad_norm": "5.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.051e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.494e-01", "anc_acc": "5.303e-01", "epoch": 0.04675} {"step": 23380, "loss": 0.7418, "grad_norm": "2.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.566e-01", "anc_loss": "6.910e-01", "dlm_acc": "6.347e-01", "anc_acc": "6.214e-01", "epoch": 0.04676} {"step": 23385, "loss": 1.1052, "grad_norm": "3.261e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.922e-01", "anc_loss": "5.051e-01", "dlm_acc": "6.430e-01", "anc_acc": "6.356e-01", "epoch": 0.04677} {"step": 23390, "loss": 0.9536, "grad_norm": "1.390e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.578e-01", "anc_loss": "6.914e-01", "dlm_acc": "6.602e-01", "anc_acc": "6.488e-01", "epoch": 0.04678} {"step": 23395, "loss": 0.8732, "grad_norm": "1.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.129e-01", "anc_loss": "7.805e-01", "dlm_acc": "6.704e-01", "anc_acc": "6.498e-01", "epoch": 0.04679} {"step": 23400, "loss": 0.6561, "grad_norm": "3.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.957e-01", "anc_loss": "6.379e-01", "dlm_acc": "5.987e-01", "anc_acc": "5.780e-01", "epoch": 0.0468} {"step": 23405, "loss": 0.8969, "grad_norm": "2.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.242e-01", "anc_loss": "6.631e-01", "dlm_acc": "6.597e-01", "anc_acc": "6.441e-01", "epoch": 0.04681} {"step": 23410, "loss": 1.3658, "grad_norm": "4.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.174e+00", "dlm_acc": "5.487e-01", "anc_acc": "5.216e-01", "epoch": 0.04682} {"step": 23415, "loss": 0.9127, "grad_norm": "3.765e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.077e+00", "dlm_acc": "5.077e-01", "anc_acc": "4.945e-01", "epoch": 0.04683} {"step": 23420, "loss": 0.9807, "grad_norm": "2.732e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.184e+00", "dlm_acc": "4.105e-01", "anc_acc": "4.017e-01", "epoch": 0.04684} {"step": 23425, "loss": 0.7061, "grad_norm": "8.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.594e-01", "anc_loss": "9.551e-01", "dlm_acc": "6.376e-01", "anc_acc": "6.126e-01", "epoch": 0.04685} {"step": 23430, "loss": 1.0602, "grad_norm": "3.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.451e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.047e-01", "anc_acc": "4.836e-01", "epoch": 0.04686} {"step": 23435, "loss": 0.8122, "grad_norm": "4.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.637e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.368e-01", "anc_acc": "6.245e-01", "epoch": 0.04687} {"step": 23440, "loss": 1.2688, "grad_norm": "8.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.469e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.418e-01", "anc_acc": "5.237e-01", "epoch": 0.04688} {"step": 23445, "loss": 1.0985, "grad_norm": "9.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.155e+00", "dlm_acc": "5.671e-01", "anc_acc": "5.497e-01", "epoch": 0.04689} {"step": 23450, "loss": 0.7571, "grad_norm": "2.794e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.741e-01", "anc_loss": "2.270e-01", "dlm_acc": "9.290e-01", "anc_acc": "9.161e-01", "epoch": 0.0469} {"step": 23455, "loss": 0.8624, "grad_norm": "2.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.630e-01", "anc_loss": "2.168e-01", "dlm_acc": "9.399e-01", "anc_acc": "9.257e-01", "epoch": 0.04691} {"step": 23460, "loss": 0.89, "grad_norm": "1.640e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.659e-01", "anc_loss": "2.164e-01", "dlm_acc": "9.411e-01", "anc_acc": "9.251e-01", "epoch": 0.04692} {"step": 23465, "loss": 1.3411, "grad_norm": "3.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.336e+00", "dlm_acc": "5.758e-01", "anc_acc": "5.543e-01", "epoch": 0.04693} {"step": 23470, "loss": 1.5165, "grad_norm": "2.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.436e+00", "dlm_acc": "5.828e-01", "anc_acc": "5.513e-01", "epoch": 0.04694} {"step": 23475, "loss": 1.6243, "grad_norm": "3.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.648e+00", "anc_loss": "1.758e+00", "dlm_acc": "4.862e-01", "anc_acc": "4.645e-01", "epoch": 0.04695} {"step": 23480, "loss": 1.3374, "grad_norm": "5.813e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.557e-01", "anc_acc": "5.325e-01", "epoch": 0.04696} {"step": 23485, "loss": 0.9827, "grad_norm": "2.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.980e-01", "anc_loss": "1.082e+00", "dlm_acc": "6.191e-01", "anc_acc": "5.976e-01", "epoch": 0.04697} {"step": 23490, "loss": 1.3422, "grad_norm": "3.653e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.325e+00", "dlm_acc": "6.148e-01", "anc_acc": "5.899e-01", "epoch": 0.04698} {"step": 23495, "loss": 1.5021, "grad_norm": "4.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.397e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.405e-01", "anc_acc": "5.171e-01", "epoch": 0.04699} {"step": 23500, "loss": 1.1581, "grad_norm": "4.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.687e-01", "anc_acc": "5.466e-01", "epoch": 0.047} {"step": 23505, "loss": 1.5514, "grad_norm": "2.580e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.799e+00", "dlm_acc": "4.657e-01", "anc_acc": "4.476e-01", "epoch": 0.04701} {"step": 23510, "loss": 1.019, "grad_norm": "2.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.237e+00", "anc_loss": "1.332e+00", "dlm_acc": "5.633e-01", "anc_acc": "5.421e-01", "epoch": 0.04702} {"step": 23515, "loss": 1.4178, "grad_norm": "4.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.662e+00", "dlm_acc": "5.076e-01", "anc_acc": "4.818e-01", "epoch": 0.04703} {"step": 23520, "loss": 1.4673, "grad_norm": "4.842e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.507e+00", "anc_loss": "1.603e+00", "dlm_acc": "4.827e-01", "anc_acc": "4.653e-01", "epoch": 0.04704} {"step": 23525, "loss": 1.1372, "grad_norm": "4.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.546e+00", "dlm_acc": "5.428e-01", "anc_acc": "5.212e-01", "epoch": 0.04705} {"step": 23530, "loss": 0.9595, "grad_norm": "2.422e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.456e+00", "anc_loss": "1.562e+00", "dlm_acc": "5.241e-01", "anc_acc": "5.009e-01", "epoch": 0.04706} {"step": 23535, "loss": 1.1785, "grad_norm": "3.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.484e+00", "anc_loss": "1.587e+00", "dlm_acc": "5.113e-01", "anc_acc": "4.902e-01", "epoch": 0.04707} {"step": 23540, "loss": 1.3281, "grad_norm": "3.331e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.591e-01", "anc_acc": "5.383e-01", "epoch": 0.04708} {"step": 23545, "loss": 1.0624, "grad_norm": "2.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.506e+00", "dlm_acc": "5.060e-01", "anc_acc": "4.839e-01", "epoch": 0.04709} {"step": 23550, "loss": 1.1856, "grad_norm": "2.931e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.443e+00", "dlm_acc": "5.418e-01", "anc_acc": "5.189e-01", "epoch": 0.0471} {"step": 23555, "loss": 0.9708, "grad_norm": "4.119e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.304e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.378e-01", "anc_acc": "5.174e-01", "epoch": 0.04711} {"step": 23560, "loss": 1.1653, "grad_norm": "4.576e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.523e+00", "dlm_acc": "5.104e-01", "anc_acc": "4.906e-01", "epoch": 0.04712} {"step": 23565, "loss": 1.1145, "grad_norm": "4.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.629e-01", "anc_acc": "5.360e-01", "epoch": 0.04713} {"step": 23570, "loss": 1.4343, "grad_norm": "6.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.510e+00", "anc_loss": "1.633e+00", "dlm_acc": "5.484e-01", "anc_acc": "5.233e-01", "epoch": 0.04714} {"step": 23575, "loss": 0.9449, "grad_norm": "1.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.144e+00", "dlm_acc": "6.188e-01", "anc_acc": "6.037e-01", "epoch": 0.04715} {"step": 23580, "loss": 1.0038, "grad_norm": "2.709e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.165e+00", "dlm_acc": "5.545e-01", "anc_acc": "5.325e-01", "epoch": 0.04716} {"step": 23585, "loss": 0.6186, "grad_norm": "2.472e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.328e-01", "anc_loss": "4.719e-01", "dlm_acc": "6.820e-01", "anc_acc": "6.587e-01", "epoch": 0.04717} {"step": 23590, "loss": 0.7322, "grad_norm": "3.234e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.633e-01", "anc_loss": "5.051e-01", "dlm_acc": "6.782e-01", "anc_acc": "6.532e-01", "epoch": 0.04718} {"step": 23595, "loss": 0.7778, "grad_norm": "2.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.941e-01", "anc_loss": "4.324e-01", "dlm_acc": "7.035e-01", "anc_acc": "6.770e-01", "epoch": 0.04719} {"step": 23600, "loss": 0.9787, "grad_norm": "3.053e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.643e-01", "anc_loss": "5.016e-01", "dlm_acc": "6.721e-01", "anc_acc": "6.470e-01", "epoch": 0.0472} {"step": 23605, "loss": 0.76, "grad_norm": "4.707e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.332e-01", "anc_loss": "4.773e-01", "dlm_acc": "6.746e-01", "anc_acc": "6.474e-01", "epoch": 0.04721} {"step": 23610, "loss": 0.7147, "grad_norm": "2.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.219e-01", "anc_loss": "4.656e-01", "dlm_acc": "6.659e-01", "anc_acc": "6.386e-01", "epoch": 0.04722} {"step": 23615, "loss": 0.7386, "grad_norm": "2.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.855e-01", "anc_loss": "5.297e-01", "dlm_acc": "6.512e-01", "anc_acc": "6.237e-01", "epoch": 0.04723} {"step": 23620, "loss": 1.0349, "grad_norm": "5.581e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.867e-01", "anc_loss": "9.488e-01", "dlm_acc": "6.110e-01", "anc_acc": "5.898e-01", "epoch": 0.04724} {"step": 23625, "loss": 0.9628, "grad_norm": "2.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.335e+00", "dlm_acc": "5.781e-01", "anc_acc": "5.537e-01", "epoch": 0.04725} {"step": 23630, "loss": 1.0901, "grad_norm": "3.820e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.750e-01", "anc_acc": "5.494e-01", "epoch": 0.04726} {"step": 23635, "loss": 0.9527, "grad_norm": "2.373e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.269e+00", "dlm_acc": "5.652e-01", "anc_acc": "5.390e-01", "epoch": 0.04727} {"step": 23640, "loss": 0.8225, "grad_norm": "3.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.254e+00", "dlm_acc": "5.547e-01", "anc_acc": "5.347e-01", "epoch": 0.04728} {"step": 23645, "loss": 0.741, "grad_norm": "2.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.281e-01", "anc_loss": "1.033e+00", "dlm_acc": "6.221e-01", "anc_acc": "5.969e-01", "epoch": 0.04729} {"step": 23650, "loss": 1.4568, "grad_norm": "3.322e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.725e+00", "anc_loss": "1.823e+00", "dlm_acc": "4.520e-01", "anc_acc": "4.337e-01", "epoch": 0.0473} {"step": 23655, "loss": 1.0224, "grad_norm": "2.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.670e+00", "dlm_acc": "5.159e-01", "anc_acc": "4.913e-01", "epoch": 0.04731} {"step": 23660, "loss": 1.0822, "grad_norm": "6.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.695e-01", "anc_loss": "1.056e+00", "dlm_acc": "6.847e-01", "anc_acc": "6.666e-01", "epoch": 0.04732} {"step": 23665, "loss": 1.1651, "grad_norm": "5.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.591e+00", "anc_loss": "1.702e+00", "dlm_acc": "4.933e-01", "anc_acc": "4.706e-01", "epoch": 0.04733} {"step": 23670, "loss": 1.1561, "grad_norm": "4.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.607e+00", "anc_loss": "1.722e+00", "dlm_acc": "4.978e-01", "anc_acc": "4.731e-01", "epoch": 0.04734} {"step": 23675, "loss": 1.0822, "grad_norm": "3.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.475e-01", "anc_acc": "5.286e-01", "epoch": 0.04735} {"step": 23680, "loss": 1.2624, "grad_norm": "3.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.759e+00", "anc_loss": "2.791e+00", "dlm_acc": "2.390e-02", "anc_acc": "2.378e-02", "epoch": 0.04736} {"step": 23685, "loss": 0.8891, "grad_norm": "1.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.816e-01", "anc_acc": "5.594e-01", "epoch": 0.04737} {"step": 23690, "loss": 0.8814, "grad_norm": "4.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.525e+00", "dlm_acc": "5.332e-01", "anc_acc": "5.107e-01", "epoch": 0.04738} {"step": 23695, "loss": 0.9413, "grad_norm": "3.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.341e+00", "dlm_acc": "6.035e-01", "anc_acc": "5.773e-01", "epoch": 0.04739} {"step": 23700, "loss": 0.8537, "grad_norm": "3.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.123e+00", "dlm_acc": "6.094e-01", "anc_acc": "5.830e-01", "epoch": 0.0474} {"step": 23705, "loss": 1.1467, "grad_norm": "4.943e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.179e+00", "anc_loss": "1.280e+00", "dlm_acc": "6.327e-01", "anc_acc": "6.048e-01", "epoch": 0.04741} {"step": 23710, "loss": 0.7452, "grad_norm": "2.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.307e+00", "dlm_acc": "5.268e-01", "anc_acc": "5.052e-01", "epoch": 0.04742} {"step": 23715, "loss": 1.3444, "grad_norm": "3.320e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.913e+00", "anc_loss": "2.030e+00", "dlm_acc": "4.488e-01", "anc_acc": "4.280e-01", "epoch": 0.04743} {"step": 23720, "loss": 0.7647, "grad_norm": "2.537e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.268e+00", "dlm_acc": "5.704e-01", "anc_acc": "5.471e-01", "epoch": 0.04744} {"step": 23725, "loss": 1.0737, "grad_norm": "2.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.673e+00", "anc_loss": "1.780e+00", "dlm_acc": "4.766e-01", "anc_acc": "4.549e-01", "epoch": 0.04745} {"step": 23730, "loss": 0.6732, "grad_norm": "4.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.994e-01", "anc_loss": "8.777e-01", "dlm_acc": "6.855e-01", "anc_acc": "6.632e-01", "epoch": 0.04746} {"step": 23735, "loss": 0.9231, "grad_norm": "4.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.185e+00", "dlm_acc": "6.166e-01", "anc_acc": "5.947e-01", "epoch": 0.04747} {"step": 23740, "loss": 0.9478, "grad_norm": "4.187e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.112e+00", "anc_loss": "1.204e+00", "dlm_acc": "5.861e-01", "anc_acc": "5.616e-01", "epoch": 0.04748} {"step": 23745, "loss": 1.0475, "grad_norm": "3.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.202e-01", "anc_acc": "4.992e-01", "epoch": 0.04749} {"step": 23750, "loss": 1.6665, "grad_norm": "4.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.870e+00", "anc_loss": "1.970e+00", "dlm_acc": "4.373e-01", "anc_acc": "4.202e-01", "epoch": 0.0475} {"step": 23755, "loss": 1.218, "grad_norm": "4.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.411e+00", "dlm_acc": "5.627e-01", "anc_acc": "5.382e-01", "epoch": 0.04751} {"step": 23760, "loss": 0.8586, "grad_norm": "4.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.051e+00", "anc_loss": "1.147e+00", "dlm_acc": "5.749e-01", "anc_acc": "5.494e-01", "epoch": 0.04752} {"step": 23765, "loss": 1.0563, "grad_norm": "2.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.177e+00", "dlm_acc": "6.067e-01", "anc_acc": "5.807e-01", "epoch": 0.04753} {"step": 23770, "loss": 0.9844, "grad_norm": "2.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.223e+00", "dlm_acc": "6.042e-01", "anc_acc": "5.767e-01", "epoch": 0.04754} {"step": 23775, "loss": 1.007, "grad_norm": "1.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.078e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.392e-01", "epoch": 0.04755} {"step": 23780, "loss": 1.3589, "grad_norm": "2.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.522e+00", "dlm_acc": "5.397e-01", "anc_acc": "5.170e-01", "epoch": 0.04756} {"step": 23785, "loss": 1.0789, "grad_norm": "3.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.089e+00", "dlm_acc": "6.268e-01", "anc_acc": "6.018e-01", "epoch": 0.04757} {"step": 23790, "loss": 1.0824, "grad_norm": "2.770e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.050e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.634e-01", "anc_acc": "5.446e-01", "epoch": 0.04758} {"step": 23795, "loss": 1.215, "grad_norm": "2.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.132e-01", "anc_acc": "4.930e-01", "epoch": 0.04759} {"step": 23800, "loss": 0.881, "grad_norm": "2.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.055e-01", "anc_loss": "1.011e+00", "dlm_acc": "6.558e-01", "anc_acc": "6.282e-01", "epoch": 0.0476} {"step": 23805, "loss": 1.7678, "grad_norm": "3.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.087e+00", "anc_loss": "2.203e+00", "dlm_acc": "4.791e-01", "anc_acc": "4.613e-01", "epoch": 0.04761} {"step": 23810, "loss": 1.1926, "grad_norm": "3.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.431e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.288e-01", "anc_acc": "5.066e-01", "epoch": 0.04762} {"step": 23815, "loss": 1.3639, "grad_norm": "2.617e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.766e-01", "anc_loss": "1.070e+00", "dlm_acc": "6.756e-01", "anc_acc": "6.533e-01", "epoch": 0.04763} {"step": 23820, "loss": 0.948, "grad_norm": "1.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.867e-01", "anc_loss": "9.754e-01", "dlm_acc": "6.264e-01", "anc_acc": "6.018e-01", "epoch": 0.04764} {"step": 23825, "loss": 1.4312, "grad_norm": "6.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.660e-01", "anc_acc": "5.400e-01", "epoch": 0.04765} {"step": 23830, "loss": 1.9397, "grad_norm": "5.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.800e+00", "anc_loss": "1.908e+00", "dlm_acc": "4.693e-01", "anc_acc": "4.505e-01", "epoch": 0.04766} {"step": 23835, "loss": 1.7562, "grad_norm": "4.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.981e-01", "anc_acc": "5.739e-01", "epoch": 0.04767} {"step": 23840, "loss": 1.4049, "grad_norm": "2.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.268e-01", "anc_loss": "1.018e+00", "dlm_acc": "6.592e-01", "anc_acc": "6.361e-01", "epoch": 0.04768} {"step": 23845, "loss": 1.5892, "grad_norm": "3.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.511e+00", "dlm_acc": "5.585e-01", "anc_acc": "5.320e-01", "epoch": 0.04769} {"step": 23850, "loss": 1.4776, "grad_norm": "2.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.383e+00", "anc_loss": "1.483e+00", "dlm_acc": "5.202e-01", "anc_acc": "4.978e-01", "epoch": 0.0477} {"step": 23855, "loss": 1.1151, "grad_norm": "1.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.250e+00", "dlm_acc": "5.588e-01", "anc_acc": "5.365e-01", "epoch": 0.04771} {"step": 23860, "loss": 1.3512, "grad_norm": "3.003e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.674e-01", "anc_acc": "5.422e-01", "epoch": 0.04772} {"step": 23865, "loss": 0.8535, "grad_norm": "2.401e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.047e-01", "anc_loss": "8.727e-01", "dlm_acc": "6.366e-01", "anc_acc": "6.177e-01", "epoch": 0.04773} {"step": 23870, "loss": 1.1564, "grad_norm": "1.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.801e-01", "anc_loss": "1.077e+00", "dlm_acc": "6.221e-01", "anc_acc": "5.992e-01", "epoch": 0.04774} {"step": 23875, "loss": 1.2296, "grad_norm": "6.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.046e+00", "anc_loss": "1.122e+00", "dlm_acc": "6.263e-01", "anc_acc": "6.104e-01", "epoch": 0.04775} {"step": 23880, "loss": 1.1487, "grad_norm": "2.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.836e-01", "anc_loss": "8.758e-01", "dlm_acc": "6.685e-01", "anc_acc": "6.390e-01", "epoch": 0.04776} {"step": 23885, "loss": 1.112, "grad_norm": "5.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.777e-01", "anc_loss": "8.516e-01", "dlm_acc": "6.385e-01", "anc_acc": "6.200e-01", "epoch": 0.04777} {"step": 23890, "loss": 1.4362, "grad_norm": "3.156e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.103e+00", "anc_loss": "1.225e+00", "dlm_acc": "6.101e-01", "anc_acc": "5.806e-01", "epoch": 0.04778} {"step": 23895, "loss": 1.0073, "grad_norm": "2.333e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.074e-01", "anc_loss": "7.965e-01", "dlm_acc": "6.834e-01", "anc_acc": "6.595e-01", "epoch": 0.04779} {"step": 23900, "loss": 1.1015, "grad_norm": "4.430e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.263e+00", "dlm_acc": "5.523e-01", "anc_acc": "5.254e-01", "epoch": 0.0478} {"step": 23905, "loss": 1.3352, "grad_norm": "4.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.290e+00", "dlm_acc": "5.686e-01", "anc_acc": "5.413e-01", "epoch": 0.04781} {"step": 23910, "loss": 1.3999, "grad_norm": "5.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.356e+00", "anc_loss": "1.442e+00", "dlm_acc": "4.951e-01", "anc_acc": "4.753e-01", "epoch": 0.04782} {"step": 23915, "loss": 0.9885, "grad_norm": "1.214e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.924e-01", "anc_loss": "8.691e-01", "dlm_acc": "6.784e-01", "anc_acc": "6.560e-01", "epoch": 0.04783} {"step": 23920, "loss": 1.422, "grad_norm": "3.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.260e+00", "anc_loss": "1.383e+00", "dlm_acc": "5.734e-01", "anc_acc": "5.482e-01", "epoch": 0.04784} {"step": 23925, "loss": 1.1984, "grad_norm": "8.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.336e-01", "anc_loss": "6.937e-01", "dlm_acc": "7.253e-01", "anc_acc": "7.037e-01", "epoch": 0.04785} {"step": 23930, "loss": 1.1077, "grad_norm": "3.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.355e-01", "anc_loss": "8.059e-01", "dlm_acc": "6.753e-01", "anc_acc": "6.497e-01", "epoch": 0.04786} {"step": 23935, "loss": 1.5445, "grad_norm": "4.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.492e-01", "anc_loss": "1.023e+00", "dlm_acc": "6.346e-01", "anc_acc": "6.124e-01", "epoch": 0.04787} {"step": 23940, "loss": 0.9635, "grad_norm": "3.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.384e-01", "epoch": 0.04788} {"step": 23945, "loss": 1.084, "grad_norm": "4.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.362e+00", "dlm_acc": "5.326e-01", "anc_acc": "4.966e-01", "epoch": 0.04789} {"step": 23950, "loss": 1.6136, "grad_norm": "7.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.441e-01", "epoch": 0.0479} {"step": 23955, "loss": 1.5479, "grad_norm": "3.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.231e+00", "anc_loss": "2.272e+00", "dlm_acc": "1.627e-01", "anc_acc": "1.545e-01", "epoch": 0.04791} {"step": 23960, "loss": 1.0572, "grad_norm": "3.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.977e+00", "anc_loss": "2.020e+00", "dlm_acc": "3.001e-01", "anc_acc": "2.891e-01", "epoch": 0.04792} {"step": 23965, "loss": 0.8728, "grad_norm": "2.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.367e-01", "anc_loss": "1.018e+00", "dlm_acc": "6.164e-01", "anc_acc": "5.943e-01", "epoch": 0.04793} {"step": 23970, "loss": 1.5026, "grad_norm": "5.875e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.636e+00", "anc_loss": "1.722e+00", "dlm_acc": "4.394e-01", "anc_acc": "4.225e-01", "epoch": 0.04794} {"step": 23975, "loss": 1.6216, "grad_norm": "5.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.615e+00", "anc_loss": "1.763e+00", "dlm_acc": "5.153e-01", "anc_acc": "4.936e-01", "epoch": 0.04795} {"step": 23980, "loss": 1.2364, "grad_norm": "3.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.945e-01", "anc_loss": "9.633e-01", "dlm_acc": "6.076e-01", "anc_acc": "5.896e-01", "epoch": 0.04796} {"step": 23985, "loss": 1.6395, "grad_norm": "4.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.516e+00", "anc_loss": "1.584e+00", "dlm_acc": "4.307e-01", "anc_acc": "4.153e-01", "epoch": 0.04797} {"step": 23990, "loss": 0.939, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.840e-01", "anc_loss": "7.676e-01", "dlm_acc": "7.072e-01", "anc_acc": "6.815e-01", "epoch": 0.04798} {"step": 23995, "loss": 1.4571, "grad_norm": "5.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.428e+00", "anc_loss": "1.515e+00", "dlm_acc": "4.859e-01", "anc_acc": "4.673e-01", "epoch": 0.04799} {"step": 24000, "loss": 1.0831, "grad_norm": "6.388e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.023e-01", "anc_loss": "5.375e-01", "dlm_acc": "6.884e-01", "anc_acc": "6.724e-01", "epoch": 0.048} {"step": 24005, "loss": 0.9722, "grad_norm": "4.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.105e+00", "dlm_acc": "3.633e-01", "anc_acc": "3.554e-01", "epoch": 0.04801} {"step": 24010, "loss": 1.128, "grad_norm": "5.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.142e+00", "dlm_acc": "5.880e-01", "anc_acc": "5.750e-01", "epoch": 0.04802} {"step": 24015, "loss": 1.1403, "grad_norm": "2.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.405e+00", "dlm_acc": "4.681e-01", "anc_acc": "4.424e-01", "epoch": 0.04803} {"step": 24020, "loss": 0.998, "grad_norm": "3.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.491e-01", "anc_acc": "5.202e-01", "epoch": 0.04804} {"step": 24025, "loss": 0.9176, "grad_norm": "5.122e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.106e-01", "anc_acc": "4.922e-01", "epoch": 0.04805} {"step": 24030, "loss": 1.0481, "grad_norm": "3.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.331e+00", "dlm_acc": "4.683e-01", "anc_acc": "4.410e-01", "epoch": 0.04806} {"step": 24035, "loss": 0.9881, "grad_norm": "1.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.128e-01", "anc_loss": "5.471e-01", "dlm_acc": "7.601e-01", "anc_acc": "7.508e-01", "epoch": 0.04807} {"step": 24040, "loss": 0.8364, "grad_norm": "3.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.518e-01", "anc_loss": "8.281e-01", "dlm_acc": "6.768e-01", "anc_acc": "6.547e-01", "epoch": 0.04808} {"step": 24045, "loss": 1.0615, "grad_norm": "1.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.049e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.105e-01", "anc_acc": "5.851e-01", "epoch": 0.04809} {"step": 24050, "loss": 1.4215, "grad_norm": "3.279e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.080e+00", "anc_loss": "2.145e+00", "dlm_acc": "3.033e-01", "anc_acc": "2.898e-01", "epoch": 0.0481} {"step": 24055, "loss": 1.1665, "grad_norm": "2.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.134e+00", "dlm_acc": "6.211e-01", "anc_acc": "5.970e-01", "epoch": 0.04811} {"step": 24060, "loss": 1.3192, "grad_norm": "1.712e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.351e-01", "anc_acc": "5.127e-01", "epoch": 0.04812} {"step": 24065, "loss": 1.2375, "grad_norm": "3.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.344e+00", "dlm_acc": "6.214e-01", "anc_acc": "5.992e-01", "epoch": 0.04813} {"step": 24070, "loss": 1.3645, "grad_norm": "3.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.506e+00", "anc_loss": "1.617e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.771e-01", "epoch": 0.04814} {"step": 24075, "loss": 1.106, "grad_norm": "3.880e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.222e+00", "dlm_acc": "5.825e-01", "anc_acc": "5.609e-01", "epoch": 0.04815} {"step": 24080, "loss": 1.3968, "grad_norm": "4.868e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.414e+00", "dlm_acc": "5.583e-01", "anc_acc": "5.412e-01", "epoch": 0.04816} {"step": 24085, "loss": 1.1261, "grad_norm": "2.791e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.206e+00", "dlm_acc": "5.942e-01", "anc_acc": "5.671e-01", "epoch": 0.04817} {"step": 24090, "loss": 1.1847, "grad_norm": "2.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.048e-01", "anc_acc": "4.832e-01", "epoch": 0.04818} {"step": 24095, "loss": 1.5018, "grad_norm": "5.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.518e+00", "dlm_acc": "5.695e-01", "anc_acc": "5.463e-01", "epoch": 0.04819} {"step": 24100, "loss": 1.4322, "grad_norm": "3.951e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.509e-01", "anc_acc": "5.240e-01", "epoch": 0.0482} {"step": 24105, "loss": 1.0711, "grad_norm": "2.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.296e+00", "dlm_acc": "5.805e-01", "anc_acc": "5.605e-01", "epoch": 0.04821} {"step": 24110, "loss": 1.3456, "grad_norm": "1.078e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.500e+00", "dlm_acc": "5.561e-01", "anc_acc": "5.315e-01", "epoch": 0.04822} {"step": 24115, "loss": 1.0316, "grad_norm": "2.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.329e+00", "dlm_acc": "5.776e-01", "anc_acc": "5.520e-01", "epoch": 0.04823} {"step": 24120, "loss": 1.0167, "grad_norm": "2.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.000e-01", "anc_loss": "8.277e-01", "dlm_acc": "6.150e-01", "anc_acc": "6.060e-01", "epoch": 0.04824} {"step": 24125, "loss": 1.4145, "grad_norm": "2.540e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.896e-01", "anc_loss": "4.098e-01", "dlm_acc": "7.905e-01", "anc_acc": "7.815e-01", "epoch": 0.04825} {"step": 24130, "loss": 0.7512, "grad_norm": "2.339e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.553e-01", "anc_loss": "9.209e-01", "dlm_acc": "6.328e-01", "anc_acc": "6.125e-01", "epoch": 0.04826} {"step": 24135, "loss": 0.626, "grad_norm": "3.276e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.877e-02", "anc_loss": "9.985e-02", "dlm_acc": "9.492e-01", "anc_acc": "9.286e-01", "epoch": 0.04827} {"step": 24140, "loss": 0.8503, "grad_norm": "6.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.879e-01", "anc_loss": "2.282e-01", "dlm_acc": "8.818e-01", "anc_acc": "8.595e-01", "epoch": 0.04828} {"step": 24145, "loss": 1.2507, "grad_norm": "5.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.631e+00", "dlm_acc": "4.736e-01", "anc_acc": "4.501e-01", "epoch": 0.04829} {"step": 24150, "loss": 0.9406, "grad_norm": "2.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.465e-01", "anc_loss": "6.129e-01", "dlm_acc": "7.069e-01", "anc_acc": "6.856e-01", "epoch": 0.0483} {"step": 24155, "loss": 1.0186, "grad_norm": "3.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.098e-01", "anc_loss": "9.324e-01", "dlm_acc": "5.388e-01", "anc_acc": "5.329e-01", "epoch": 0.04831} {"step": 24160, "loss": 0.8988, "grad_norm": "3.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.882e-01", "anc_acc": "5.694e-01", "epoch": 0.04832} {"step": 24165, "loss": 1.1117, "grad_norm": "2.022e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.180e-01", "anc_loss": "9.898e-01", "dlm_acc": "6.311e-01", "anc_acc": "6.101e-01", "epoch": 0.04833} {"step": 24170, "loss": 1.0134, "grad_norm": "4.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.832e-01", "anc_loss": "7.332e-01", "dlm_acc": "6.170e-01", "anc_acc": "5.974e-01", "epoch": 0.04834} {"step": 24175, "loss": 0.9249, "grad_norm": "4.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.875e-01", "anc_loss": "7.078e-01", "dlm_acc": "5.534e-01", "anc_acc": "5.443e-01", "epoch": 0.04835} {"step": 24180, "loss": 0.892, "grad_norm": "5.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.232e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.389e-01", "epoch": 0.04836} {"step": 24185, "loss": 0.9784, "grad_norm": "3.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.237e+00", "dlm_acc": "5.375e-01", "anc_acc": "5.156e-01", "epoch": 0.04837} {"step": 24190, "loss": 0.8827, "grad_norm": "2.620e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.386e-01", "anc_loss": "4.903e-01", "dlm_acc": "7.614e-01", "anc_acc": "7.422e-01", "epoch": 0.04838} {"step": 24195, "loss": 0.8477, "grad_norm": "2.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.204e-01", "anc_loss": "2.423e-01", "dlm_acc": "8.986e-01", "anc_acc": "8.924e-01", "epoch": 0.04839} {"step": 24200, "loss": 0.8943, "grad_norm": "2.908e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.463e-01", "anc_loss": "1.564e-01", "dlm_acc": "9.147e-01", "anc_acc": "9.111e-01", "epoch": 0.0484} {"step": 24205, "loss": 0.8469, "grad_norm": "5.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.787e-01", "anc_loss": "1.859e-01", "dlm_acc": "8.976e-01", "anc_acc": "8.938e-01", "epoch": 0.04841} {"step": 24210, "loss": 0.7088, "grad_norm": "3.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.287e-01", "anc_loss": "3.410e-01", "dlm_acc": "7.876e-01", "anc_acc": "7.825e-01", "epoch": 0.04842} {"step": 24215, "loss": 0.8607, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.156e-01", "anc_loss": "4.297e-01", "dlm_acc": "7.170e-01", "anc_acc": "7.093e-01", "epoch": 0.04843} {"step": 24220, "loss": 0.6565, "grad_norm": "1.737e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.465e-01", "anc_loss": "6.937e-01", "dlm_acc": "6.256e-01", "anc_acc": "6.079e-01", "epoch": 0.04844} {"step": 24225, "loss": 0.7652, "grad_norm": "5.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.664e-01", "anc_loss": "9.242e-01", "dlm_acc": "5.398e-01", "anc_acc": "5.178e-01", "epoch": 0.04845} {"step": 24230, "loss": 0.59, "grad_norm": "2.516e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.367e-01", "anc_loss": "8.953e-01", "dlm_acc": "5.089e-01", "anc_acc": "4.879e-01", "epoch": 0.04846} {"step": 24235, "loss": 0.9318, "grad_norm": "2.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.172e-01", "anc_loss": "9.570e-01", "dlm_acc": "4.298e-01", "anc_acc": "4.160e-01", "epoch": 0.04847} {"step": 24240, "loss": 0.9579, "grad_norm": "1.958e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.352e-01", "anc_loss": "1.023e+00", "dlm_acc": "6.444e-01", "anc_acc": "6.201e-01", "epoch": 0.04848} {"step": 24245, "loss": 0.7246, "grad_norm": "3.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.309e-01", "anc_loss": "8.875e-01", "dlm_acc": "5.738e-01", "anc_acc": "5.541e-01", "epoch": 0.04849} {"step": 24250, "loss": 0.7332, "grad_norm": "2.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.126e+00", "dlm_acc": "6.073e-01", "anc_acc": "5.838e-01", "epoch": 0.0485} {"step": 24255, "loss": 0.9435, "grad_norm": "1.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.336e-01", "anc_loss": "7.383e-01", "dlm_acc": "5.579e-01", "anc_acc": "5.558e-01", "epoch": 0.04851} {"step": 24260, "loss": 0.8448, "grad_norm": "4.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.422e-01", "anc_loss": "7.469e-01", "dlm_acc": "5.515e-01", "anc_acc": "5.497e-01", "epoch": 0.04852} {"step": 24265, "loss": 1.0787, "grad_norm": "7.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.016e-01", "anc_loss": "7.039e-01", "dlm_acc": "5.873e-01", "anc_acc": "5.846e-01", "epoch": 0.04853} {"step": 24270, "loss": 1.0086, "grad_norm": "3.544e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.406e-01", "anc_loss": "7.891e-01", "dlm_acc": "6.030e-01", "anc_acc": "5.858e-01", "epoch": 0.04854} {"step": 24275, "loss": 1.1208, "grad_norm": "3.312e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.688e-01", "anc_loss": "8.203e-01", "dlm_acc": "5.755e-01", "anc_acc": "5.559e-01", "epoch": 0.04855} {"step": 24280, "loss": 0.851, "grad_norm": "2.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.555e-01", "anc_loss": "6.289e-01", "dlm_acc": "6.748e-01", "anc_acc": "6.351e-01", "epoch": 0.04856} {"step": 24285, "loss": 0.9533, "grad_norm": "5.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.047e-01", "anc_loss": "9.758e-01", "dlm_acc": "6.338e-01", "anc_acc": "6.156e-01", "epoch": 0.04857} {"step": 24290, "loss": 0.6278, "grad_norm": "4.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.133e-01", "anc_loss": "8.887e-01", "dlm_acc": "6.824e-01", "anc_acc": "6.660e-01", "epoch": 0.04858} {"step": 24295, "loss": 0.9514, "grad_norm": "5.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.533e-01", "anc_acc": "5.330e-01", "epoch": 0.04859} {"step": 24300, "loss": 0.9372, "grad_norm": "2.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.278e+00", "dlm_acc": "5.428e-01", "anc_acc": "5.253e-01", "epoch": 0.0486} {"step": 24305, "loss": 1.4267, "grad_norm": "3.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.641e+00", "anc_loss": "1.742e+00", "dlm_acc": "4.785e-01", "anc_acc": "4.571e-01", "epoch": 0.04861} {"step": 24310, "loss": 1.5011, "grad_norm": "4.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.688e+00", "anc_loss": "1.790e+00", "dlm_acc": "4.722e-01", "anc_acc": "4.517e-01", "epoch": 0.04862} {"step": 24315, "loss": 0.9643, "grad_norm": "3.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.260e-01", "anc_loss": "7.613e-01", "dlm_acc": "6.383e-01", "anc_acc": "6.228e-01", "epoch": 0.04863} {"step": 24320, "loss": 1.2023, "grad_norm": "4.804e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.984e-01", "anc_loss": "7.391e-01", "dlm_acc": "5.850e-01", "anc_acc": "5.720e-01", "epoch": 0.04864} {"step": 24325, "loss": 0.8693, "grad_norm": "3.182e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.398e-01", "anc_loss": "4.754e-01", "dlm_acc": "6.883e-01", "anc_acc": "6.689e-01", "epoch": 0.04865} {"step": 24330, "loss": 0.9608, "grad_norm": "1.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.371e-01", "anc_loss": "1.014e+00", "dlm_acc": "5.839e-01", "anc_acc": "5.572e-01", "epoch": 0.04866} {"step": 24335, "loss": 1.1223, "grad_norm": "5.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.367e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.184e-01", "anc_acc": "4.984e-01", "epoch": 0.04867} {"step": 24340, "loss": 1.2311, "grad_norm": "3.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.115e+00", "dlm_acc": "6.467e-01", "anc_acc": "6.306e-01", "epoch": 0.04868} {"step": 24345, "loss": 1.07, "grad_norm": "4.623e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.791e-01", "anc_loss": "9.694e-01", "dlm_acc": "7.435e-01", "anc_acc": "7.227e-01", "epoch": 0.04869} {"step": 24350, "loss": 0.5948, "grad_norm": "4.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.846e-01", "anc_loss": "3.033e-01", "dlm_acc": "8.219e-01", "anc_acc": "8.141e-01", "epoch": 0.0487} {"step": 24355, "loss": 1.2014, "grad_norm": "5.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.375e-01", "anc_loss": "8.066e-01", "dlm_acc": "7.087e-01", "anc_acc": "6.927e-01", "epoch": 0.04871} {"step": 24360, "loss": 1.0355, "grad_norm": "2.222e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.142e-01", "anc_loss": "5.572e-01", "dlm_acc": "7.553e-01", "anc_acc": "7.394e-01", "epoch": 0.04872} {"step": 24365, "loss": 1.0666, "grad_norm": "2.957e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.887e-01", "anc_loss": "6.238e-01", "dlm_acc": "6.892e-01", "anc_acc": "6.787e-01", "epoch": 0.04873} {"step": 24370, "loss": 1.084, "grad_norm": "3.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.883e-01", "anc_loss": "8.203e-01", "dlm_acc": "6.330e-01", "anc_acc": "6.245e-01", "epoch": 0.04874} {"step": 24375, "loss": 0.7816, "grad_norm": "2.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.646e-01", "anc_loss": "6.299e-01", "dlm_acc": "7.653e-01", "anc_acc": "7.413e-01", "epoch": 0.04875} {"step": 24380, "loss": 1.1349, "grad_norm": "1.912e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.376e+00", "anc_loss": "1.486e+00", "dlm_acc": "5.494e-01", "anc_acc": "5.245e-01", "epoch": 0.04876} {"step": 24385, "loss": 0.9349, "grad_norm": "3.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.282e+00", "anc_loss": "1.396e+00", "dlm_acc": "5.700e-01", "anc_acc": "5.436e-01", "epoch": 0.04877} {"step": 24390, "loss": 0.9093, "grad_norm": "1.698e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.273e+00", "dlm_acc": "6.137e-01", "anc_acc": "5.934e-01", "epoch": 0.04878} {"step": 24395, "loss": 0.9762, "grad_norm": "4.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.371e-01", "anc_loss": "6.998e-01", "dlm_acc": "7.532e-01", "anc_acc": "7.394e-01", "epoch": 0.04879} {"step": 24400, "loss": 0.6717, "grad_norm": "2.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.712e-01", "anc_loss": "8.405e-01", "dlm_acc": "6.787e-01", "anc_acc": "6.590e-01", "epoch": 0.0488} {"step": 24405, "loss": 1.0335, "grad_norm": "5.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.290e+00", "dlm_acc": "5.363e-01", "anc_acc": "5.142e-01", "epoch": 0.04881} {"step": 24410, "loss": 0.921, "grad_norm": "2.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.445e-01", "anc_loss": "1.032e+00", "dlm_acc": "6.371e-01", "anc_acc": "6.141e-01", "epoch": 0.04882} {"step": 24415, "loss": 0.8135, "grad_norm": "6.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.504e-01", "anc_loss": "4.041e-01", "dlm_acc": "8.302e-01", "anc_acc": "8.163e-01", "epoch": 0.04883} {"step": 24420, "loss": 1.1594, "grad_norm": "2.541e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.621e-01", "anc_loss": "5.199e-01", "dlm_acc": "7.729e-01", "anc_acc": "7.523e-01", "epoch": 0.04884} {"step": 24425, "loss": 1.4901, "grad_norm": "1.260e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.901e-01", "anc_acc": "5.680e-01", "epoch": 0.04885} {"step": 24430, "loss": 1.2993, "grad_norm": "3.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.430e-01", "anc_loss": "7.742e-01", "dlm_acc": "6.042e-01", "anc_acc": "5.964e-01", "epoch": 0.04886} {"step": 24435, "loss": 1.3635, "grad_norm": "2.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.209e+00", "dlm_acc": "6.676e-01", "anc_acc": "6.446e-01", "epoch": 0.04887} {"step": 24440, "loss": 1.141, "grad_norm": "4.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.090e-01", "anc_loss": "8.707e-01", "dlm_acc": "7.143e-01", "anc_acc": "7.007e-01", "epoch": 0.04888} {"step": 24445, "loss": 0.9982, "grad_norm": "3.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.777e-01", "anc_loss": "9.395e-01", "dlm_acc": "5.630e-01", "anc_acc": "5.448e-01", "epoch": 0.04889} {"step": 24450, "loss": 1.1023, "grad_norm": "4.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.242e-01", "anc_loss": "1.008e+00", "dlm_acc": "6.065e-01", "anc_acc": "5.843e-01", "epoch": 0.0489} {"step": 24455, "loss": 1.4452, "grad_norm": "3.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.283e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.369e-01", "anc_acc": "5.143e-01", "epoch": 0.04891} {"step": 24460, "loss": 1.2332, "grad_norm": "9.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.964e-01", "anc_loss": "9.733e-01", "dlm_acc": "6.794e-01", "anc_acc": "6.610e-01", "epoch": 0.04892} {"step": 24465, "loss": 1.6937, "grad_norm": "6.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.703e-01", "anc_loss": "7.342e-01", "dlm_acc": "7.369e-01", "anc_acc": "7.206e-01", "epoch": 0.04893} {"step": 24470, "loss": 1.5754, "grad_norm": "4.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.982e-01", "anc_loss": "9.719e-01", "dlm_acc": "6.808e-01", "anc_acc": "6.623e-01", "epoch": 0.04894} {"step": 24475, "loss": 1.8908, "grad_norm": "5.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.234e-01", "anc_loss": "7.803e-01", "dlm_acc": "7.014e-01", "anc_acc": "6.875e-01", "epoch": 0.04895} {"step": 24480, "loss": 1.3236, "grad_norm": "3.291e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e-01", "anc_loss": "1.372e-01", "dlm_acc": "9.408e-01", "anc_acc": "9.230e-01", "epoch": 0.04896} {"step": 24485, "loss": 1.415, "grad_norm": "6.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.132e+00", "dlm_acc": "5.648e-01", "anc_acc": "5.490e-01", "epoch": 0.04897} {"step": 24490, "loss": 1.1411, "grad_norm": "1.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.097e+00", "anc_loss": "1.186e+00", "dlm_acc": "5.524e-01", "anc_acc": "5.311e-01", "epoch": 0.04898} {"step": 24495, "loss": 1.1111, "grad_norm": "2.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.969e-01", "anc_loss": "5.699e-01", "dlm_acc": "8.217e-01", "anc_acc": "8.063e-01", "epoch": 0.04899} {"step": 24500, "loss": 1.2896, "grad_norm": "3.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.617e-01", "anc_loss": "9.525e-01", "dlm_acc": "6.869e-01", "anc_acc": "6.654e-01", "epoch": 0.049} {"step": 24505, "loss": 1.1423, "grad_norm": "4.782e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.613e-01", "anc_loss": "6.512e-01", "dlm_acc": "7.169e-01", "anc_acc": "6.736e-01", "epoch": 0.04901} {"step": 24510, "loss": 1.4926, "grad_norm": "6.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.180e-01", "anc_loss": "7.012e-01", "dlm_acc": "7.232e-01", "anc_acc": "6.963e-01", "epoch": 0.04902} {"step": 24515, "loss": 1.0427, "grad_norm": "3.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.828e-01", "anc_loss": "7.652e-01", "dlm_acc": "7.061e-01", "anc_acc": "6.805e-01", "epoch": 0.04903} {"step": 24520, "loss": 1.2005, "grad_norm": "2.761e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.305e-01", "anc_loss": "4.422e-01", "dlm_acc": "7.243e-01", "anc_acc": "7.213e-01", "epoch": 0.04904} {"step": 24525, "loss": 0.812, "grad_norm": "2.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.050e-01", "anc_loss": "2.133e-01", "dlm_acc": "8.709e-01", "anc_acc": "8.671e-01", "epoch": 0.04905} {"step": 24530, "loss": 0.822, "grad_norm": "3.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.599e-01", "anc_loss": "1.696e-01", "dlm_acc": "9.070e-01", "anc_acc": "9.015e-01", "epoch": 0.04906} {"step": 24535, "loss": 0.9873, "grad_norm": "7.406e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.426e-01", "anc_loss": "9.018e-01", "dlm_acc": "6.739e-01", "anc_acc": "6.602e-01", "epoch": 0.04907} {"step": 24540, "loss": 1.0888, "grad_norm": "3.244e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.170e+00", "dlm_acc": "6.116e-01", "anc_acc": "5.865e-01", "epoch": 0.04908} {"step": 24545, "loss": 1.4494, "grad_norm": "4.011e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.239e-01", "anc_acc": "5.014e-01", "epoch": 0.04909} {"step": 24550, "loss": 0.9077, "grad_norm": "3.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.157e+00", "dlm_acc": "5.562e-01", "anc_acc": "5.389e-01", "epoch": 0.0491} {"step": 24555, "loss": 0.8737, "grad_norm": "2.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.775e-01", "anc_loss": "7.638e-01", "dlm_acc": "7.129e-01", "anc_acc": "6.870e-01", "epoch": 0.04911} {"step": 24560, "loss": 0.9781, "grad_norm": "4.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.680e-01", "anc_loss": "1.077e+00", "dlm_acc": "5.880e-01", "anc_acc": "5.570e-01", "epoch": 0.04912} {"step": 24565, "loss": 1.0958, "grad_norm": "4.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.112e+00", "anc_loss": "1.207e+00", "dlm_acc": "5.933e-01", "anc_acc": "5.698e-01", "epoch": 0.04913} {"step": 24570, "loss": 1.2007, "grad_norm": "3.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.469e+00", "anc_loss": "1.575e+00", "dlm_acc": "5.103e-01", "anc_acc": "4.856e-01", "epoch": 0.04914} {"step": 24575, "loss": 1.4611, "grad_norm": "5.622e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.614e+00", "dlm_acc": "5.284e-01", "anc_acc": "5.014e-01", "epoch": 0.04915} {"step": 24580, "loss": 1.365, "grad_norm": "3.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.633e+00", "anc_loss": "1.750e+00", "dlm_acc": "4.743e-01", "anc_acc": "4.490e-01", "epoch": 0.04916} {"step": 24585, "loss": 1.7067, "grad_norm": "7.361e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.583e+00", "dlm_acc": "5.250e-01", "anc_acc": "4.952e-01", "epoch": 0.04917} {"step": 24590, "loss": 1.4987, "grad_norm": "5.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.629e-01", "anc_loss": "1.058e+00", "dlm_acc": "6.671e-01", "anc_acc": "6.444e-01", "epoch": 0.04918} {"step": 24595, "loss": 1.0191, "grad_norm": "3.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.279e-01", "anc_acc": "5.060e-01", "epoch": 0.04919} {"step": 24600, "loss": 0.9939, "grad_norm": "5.353e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.704e-01", "anc_acc": "5.417e-01", "epoch": 0.0492} {"step": 24605, "loss": 0.9825, "grad_norm": "2.774e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.706e-01", "anc_acc": "5.463e-01", "epoch": 0.04921} {"step": 24610, "loss": 1.1034, "grad_norm": "3.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.818e-01", "anc_loss": "1.044e+00", "dlm_acc": "6.359e-01", "anc_acc": "6.159e-01", "epoch": 0.04922} {"step": 24615, "loss": 0.9427, "grad_norm": "2.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.723e-01", "anc_loss": "8.461e-01", "dlm_acc": "6.625e-01", "anc_acc": "6.330e-01", "epoch": 0.04923} {"step": 24620, "loss": 1.4228, "grad_norm": "2.154e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.748e+00", "dlm_acc": "5.116e-01", "anc_acc": "4.842e-01", "epoch": 0.04924} {"step": 24625, "loss": 1.0273, "grad_norm": "3.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.312e-01", "anc_loss": "7.227e-01", "dlm_acc": "7.023e-01", "anc_acc": "6.737e-01", "epoch": 0.04925} {"step": 24630, "loss": 0.9154, "grad_norm": "4.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.144e+00", "dlm_acc": "5.739e-01", "anc_acc": "5.427e-01", "epoch": 0.04926} {"step": 24635, "loss": 1.1834, "grad_norm": "3.728e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.479e+00", "dlm_acc": "5.031e-01", "anc_acc": "4.850e-01", "epoch": 0.04927} {"step": 24640, "loss": 1.2768, "grad_norm": "3.382e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.446e+00", "dlm_acc": "5.030e-01", "anc_acc": "4.863e-01", "epoch": 0.04928} {"step": 24645, "loss": 0.9517, "grad_norm": "1.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.180e+00", "dlm_acc": "5.943e-01", "anc_acc": "5.722e-01", "epoch": 0.04929} {"step": 24650, "loss": 1.4047, "grad_norm": "5.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.559e+00", "anc_loss": "1.658e+00", "dlm_acc": "5.314e-01", "anc_acc": "5.065e-01", "epoch": 0.0493} {"step": 24655, "loss": 1.2506, "grad_norm": "2.437e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.959e-01", "anc_loss": "9.643e-01", "dlm_acc": "6.418e-01", "anc_acc": "6.250e-01", "epoch": 0.04931} {"step": 24660, "loss": 1.2174, "grad_norm": "2.263e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.845e+00", "anc_loss": "1.911e+00", "dlm_acc": "3.758e-01", "anc_acc": "3.610e-01", "epoch": 0.04932} {"step": 24665, "loss": 1.1191, "grad_norm": "3.395e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.133e+00", "anc_loss": "1.265e+00", "dlm_acc": "6.055e-01", "anc_acc": "5.696e-01", "epoch": 0.04933} {"step": 24670, "loss": 1.2349, "grad_norm": "4.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.426e+00", "anc_loss": "1.520e+00", "dlm_acc": "4.913e-01", "anc_acc": "4.730e-01", "epoch": 0.04934} {"step": 24675, "loss": 0.9326, "grad_norm": "3.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.094e+00", "dlm_acc": "5.587e-01", "anc_acc": "5.307e-01", "epoch": 0.04935} {"step": 24680, "loss": 1.0622, "grad_norm": "5.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.035e+00", "anc_loss": "1.125e+00", "dlm_acc": "6.002e-01", "anc_acc": "5.776e-01", "epoch": 0.04936} {"step": 24685, "loss": 1.1273, "grad_norm": "4.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.451e-01", "anc_acc": "5.259e-01", "epoch": 0.04937} {"step": 24690, "loss": 1.1533, "grad_norm": "3.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.305e-01", "anc_loss": "1.002e+00", "dlm_acc": "5.831e-01", "anc_acc": "5.647e-01", "epoch": 0.04938} {"step": 24695, "loss": 1.3735, "grad_norm": "4.709e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.583e+00", "dlm_acc": "4.835e-01", "anc_acc": "4.554e-01", "epoch": 0.04939} {"step": 24700, "loss": 1.026, "grad_norm": "2.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.120e+00", "dlm_acc": "6.023e-01", "anc_acc": "5.724e-01", "epoch": 0.0494} {"step": 24705, "loss": 1.0871, "grad_norm": "1.961e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.311e-01", "anc_loss": "7.941e-01", "dlm_acc": "7.101e-01", "anc_acc": "6.921e-01", "epoch": 0.04941} {"step": 24710, "loss": 1.0595, "grad_norm": "3.179e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.912e-01", "anc_loss": "6.502e-01", "dlm_acc": "7.406e-01", "anc_acc": "7.257e-01", "epoch": 0.04942} {"step": 24715, "loss": 1.0873, "grad_norm": "2.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.186e+00", "dlm_acc": "5.687e-01", "anc_acc": "5.430e-01", "epoch": 0.04943} {"step": 24720, "loss": 1.2608, "grad_norm": "3.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.286e+00", "dlm_acc": "5.449e-01", "anc_acc": "5.283e-01", "epoch": 0.04944} {"step": 24725, "loss": 0.9236, "grad_norm": "4.452e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.422e-01", "anc_loss": "8.047e-01", "dlm_acc": "6.108e-01", "anc_acc": "5.850e-01", "epoch": 0.04945} {"step": 24730, "loss": 1.1075, "grad_norm": "3.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.270e+00", "dlm_acc": "6.029e-01", "anc_acc": "5.462e-01", "epoch": 0.04946} {"step": 24735, "loss": 1.1229, "grad_norm": "7.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.019e+00", "anc_loss": "1.125e+00", "dlm_acc": "6.431e-01", "anc_acc": "6.151e-01", "epoch": 0.04947} {"step": 24740, "loss": 1.1344, "grad_norm": "1.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.865e-01", "anc_acc": "5.578e-01", "epoch": 0.04948} {"step": 24745, "loss": 1.1797, "grad_norm": "3.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.539e+00", "dlm_acc": "5.335e-01", "anc_acc": "5.097e-01", "epoch": 0.04949} {"step": 24750, "loss": 1.7476, "grad_norm": "6.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.750e+00", "anc_loss": "1.869e+00", "dlm_acc": "5.030e-01", "anc_acc": "4.817e-01", "epoch": 0.0495} {"step": 24755, "loss": 1.1495, "grad_norm": "3.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.209e-01", "anc_loss": "1.008e+00", "dlm_acc": "6.598e-01", "anc_acc": "6.405e-01", "epoch": 0.04951} {"step": 24760, "loss": 1.3176, "grad_norm": "3.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.608e+00", "anc_loss": "1.716e+00", "dlm_acc": "4.759e-01", "anc_acc": "4.571e-01", "epoch": 0.04952} {"step": 24765, "loss": 1.0455, "grad_norm": "1.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.187e-01", "anc_loss": "1.044e+00", "dlm_acc": "6.216e-01", "anc_acc": "5.806e-01", "epoch": 0.04953} {"step": 24770, "loss": 1.4018, "grad_norm": "2.491e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.219e-01", "anc_loss": "3.614e-01", "dlm_acc": "8.485e-01", "anc_acc": "8.342e-01", "epoch": 0.04954} {"step": 24775, "loss": 1.3827, "grad_norm": "2.390e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.277e-01", "anc_loss": "9.977e-01", "dlm_acc": "6.283e-01", "anc_acc": "6.104e-01", "epoch": 0.04955} {"step": 24780, "loss": 1.8514, "grad_norm": "2.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.664e-01", "anc_acc": "5.444e-01", "epoch": 0.04956} {"step": 24785, "loss": 1.3509, "grad_norm": "5.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.400e-01", "anc_loss": "3.676e-01", "dlm_acc": "8.062e-01", "anc_acc": "7.863e-01", "epoch": 0.04957} {"step": 24790, "loss": 1.4267, "grad_norm": "4.358e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.033e-01", "anc_loss": "3.435e-01", "dlm_acc": "8.123e-01", "anc_acc": "7.914e-01", "epoch": 0.04958} {"step": 24795, "loss": 1.2121, "grad_norm": "3.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.445e-01", "anc_loss": "6.273e-01", "dlm_acc": "7.375e-01", "anc_acc": "7.028e-01", "epoch": 0.04959} {"step": 24800, "loss": 1.3143, "grad_norm": "4.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.434e-01", "anc_loss": "1.047e+00", "dlm_acc": "6.623e-01", "anc_acc": "6.274e-01", "epoch": 0.0496} {"step": 24805, "loss": 1.4553, "grad_norm": "3.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.373e+00", "dlm_acc": "4.790e-01", "anc_acc": "4.609e-01", "epoch": 0.04961} {"step": 24810, "loss": 1.4127, "grad_norm": "3.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.322e+00", "dlm_acc": "6.002e-01", "anc_acc": "5.674e-01", "epoch": 0.04962} {"step": 24815, "loss": 1.5305, "grad_norm": "5.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.536e+00", "dlm_acc": "5.122e-01", "anc_acc": "4.902e-01", "epoch": 0.04963} {"step": 24820, "loss": 1.236, "grad_norm": "2.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.325e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.185e-01", "anc_acc": "4.873e-01", "epoch": 0.04964} {"step": 24825, "loss": 1.2513, "grad_norm": "3.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.351e-01", "anc_acc": "5.066e-01", "epoch": 0.04965} {"step": 24830, "loss": 1.0717, "grad_norm": "3.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.271e-01", "anc_loss": "8.086e-01", "dlm_acc": "7.185e-01", "anc_acc": "6.951e-01", "epoch": 0.04966} {"step": 24835, "loss": 1.4689, "grad_norm": "7.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.560e+00", "dlm_acc": "5.006e-01", "anc_acc": "4.717e-01", "epoch": 0.04967} {"step": 24840, "loss": 1.4317, "grad_norm": "3.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.146e+00", "anc_loss": "1.262e+00", "dlm_acc": "6.375e-01", "anc_acc": "6.158e-01", "epoch": 0.04968} {"step": 24845, "loss": 1.2278, "grad_norm": "5.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.430e+00", "dlm_acc": "4.920e-01", "anc_acc": "4.739e-01", "epoch": 0.04969} {"step": 24850, "loss": 0.9696, "grad_norm": "3.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.507e+00", "anc_loss": "1.623e+00", "dlm_acc": "4.914e-01", "anc_acc": "4.626e-01", "epoch": 0.0497} {"step": 24855, "loss": 1.1575, "grad_norm": "2.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.613e+00", "dlm_acc": "5.422e-01", "anc_acc": "5.255e-01", "epoch": 0.04971} {"step": 24860, "loss": 1.0315, "grad_norm": "1.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.789e-01", "anc_acc": "5.548e-01", "epoch": 0.04972} {"step": 24865, "loss": 1.1051, "grad_norm": "2.945e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.619e-01", "anc_acc": "5.263e-01", "epoch": 0.04973} {"step": 24870, "loss": 0.9081, "grad_norm": "2.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.383e-01", "anc_loss": "1.073e+00", "dlm_acc": "5.965e-01", "anc_acc": "5.580e-01", "epoch": 0.04974} {"step": 24875, "loss": 1.5397, "grad_norm": "3.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.712e+00", "dlm_acc": "4.614e-01", "anc_acc": "4.424e-01", "epoch": 0.04975} {"step": 24880, "loss": 1.1717, "grad_norm": "4.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.472e+00", "dlm_acc": "5.304e-01", "anc_acc": "5.099e-01", "epoch": 0.04976} {"step": 24885, "loss": 1.2665, "grad_norm": "2.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.884e-01", "anc_acc": "5.536e-01", "epoch": 0.04977} {"step": 24890, "loss": 1.4018, "grad_norm": "3.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.672e-01", "anc_acc": "5.321e-01", "epoch": 0.04978} {"step": 24895, "loss": 1.6046, "grad_norm": "4.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.754e-01", "anc_acc": "5.525e-01", "epoch": 0.04979} {"step": 24900, "loss": 1.2044, "grad_norm": "2.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.791e+00", "anc_loss": "1.844e+00", "dlm_acc": "2.689e-01", "anc_acc": "2.564e-01", "epoch": 0.0498} {"step": 24905, "loss": 1.2888, "grad_norm": "2.581e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.625e+00", "anc_loss": "1.674e+00", "dlm_acc": "3.873e-01", "anc_acc": "3.736e-01", "epoch": 0.04981} {"step": 24910, "loss": 1.361, "grad_norm": "4.896e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.255e+00", "dlm_acc": "5.008e-01", "anc_acc": "4.783e-01", "epoch": 0.04982} {"step": 24915, "loss": 1.0555, "grad_norm": "3.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.551e-01", "anc_loss": "6.262e-01", "dlm_acc": "6.520e-01", "anc_acc": "6.294e-01", "epoch": 0.04983} {"step": 24920, "loss": 1.2317, "grad_norm": "4.313e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.531e-01", "anc_loss": "9.266e-01", "dlm_acc": "5.650e-01", "anc_acc": "5.460e-01", "epoch": 0.04984} {"step": 24925, "loss": 1.6736, "grad_norm": "3.095e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.634e+00", "anc_loss": "1.761e+00", "dlm_acc": "5.097e-01", "anc_acc": "4.779e-01", "epoch": 0.04985} {"step": 24930, "loss": 1.1578, "grad_norm": "2.134e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.324e+00", "dlm_acc": "4.553e-01", "anc_acc": "4.377e-01", "epoch": 0.04986} {"step": 24935, "loss": 1.2534, "grad_norm": "3.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.633e-01", "anc_loss": "1.050e+00", "dlm_acc": "5.913e-01", "anc_acc": "5.616e-01", "epoch": 0.04987} {"step": 24940, "loss": 1.2844, "grad_norm": "3.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.190e+00", "dlm_acc": "5.910e-01", "anc_acc": "5.586e-01", "epoch": 0.04988} {"step": 24945, "loss": 1.8349, "grad_norm": "2.362e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.481e-01", "anc_acc": "5.117e-01", "epoch": 0.04989} {"step": 24950, "loss": 1.286, "grad_norm": "3.228e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.273e-01", "anc_loss": "1.004e+00", "dlm_acc": "6.567e-01", "anc_acc": "6.359e-01", "epoch": 0.0499} {"step": 24955, "loss": 1.5535, "grad_norm": "4.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.436e+00", "dlm_acc": "4.673e-01", "anc_acc": "4.481e-01", "epoch": 0.04991} {"step": 24960, "loss": 1.5832, "grad_norm": "6.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.233e+00", "anc_loss": "1.351e+00", "dlm_acc": "5.778e-01", "anc_acc": "5.503e-01", "epoch": 0.04992} {"step": 24965, "loss": 1.45, "grad_norm": "3.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.589e-01", "anc_acc": "5.269e-01", "epoch": 0.04993} {"step": 24970, "loss": 1.4761, "grad_norm": "1.487e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.725e+00", "anc_loss": "1.831e+00", "dlm_acc": "4.561e-01", "anc_acc": "4.229e-01", "epoch": 0.04994} {"step": 24975, "loss": 1.4422, "grad_norm": "2.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.248e+00", "dlm_acc": "6.066e-01", "anc_acc": "5.820e-01", "epoch": 0.04995} {"step": 24980, "loss": 1.2287, "grad_norm": "2.717e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.395e+00", "dlm_acc": "4.977e-01", "anc_acc": "4.795e-01", "epoch": 0.04996} {"step": 24985, "loss": 1.5566, "grad_norm": "2.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.355e+00", "anc_loss": "2.384e+00", "dlm_acc": "1.632e-01", "anc_acc": "1.589e-01", "epoch": 0.04997} {"step": 24990, "loss": 1.9173, "grad_norm": "4.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.037e+00", "anc_loss": "2.112e+00", "dlm_acc": "3.960e-01", "anc_acc": "3.835e-01", "epoch": 0.04998} {"step": 24995, "loss": 1.4908, "grad_norm": "5.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.111e-01", "anc_acc": "4.851e-01", "epoch": 0.04999} {"step": 25000, "loss": 1.0745, "grad_norm": "2.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.229e+00", "dlm_acc": "6.120e-01", "anc_acc": "5.924e-01", "epoch": 0.05} {"step": 25005, "loss": 0.8316, "grad_norm": "2.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.944e-02", "anc_loss": "7.852e-02", "dlm_acc": "9.256e-01", "anc_acc": "9.256e-01", "epoch": 0.05001} {"step": 25010, "loss": 1.2636, "grad_norm": "3.158e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.324e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.438e-01", "anc_acc": "5.218e-01", "epoch": 0.05002} {"step": 25015, "loss": 1.4834, "grad_norm": "3.537e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.529e+00", "anc_loss": "1.677e+00", "dlm_acc": "5.019e-01", "anc_acc": "4.709e-01", "epoch": 0.05003} {"step": 25020, "loss": 1.7447, "grad_norm": "1.846e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.812e+00", "anc_loss": "1.877e+00", "dlm_acc": "3.510e-01", "anc_acc": "3.352e-01", "epoch": 0.05004} {"step": 25025, "loss": 1.1127, "grad_norm": "3.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.184e-01", "anc_acc": "5.024e-01", "epoch": 0.05005} {"step": 25030, "loss": 1.127, "grad_norm": "3.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.456e+00", "anc_loss": "1.564e+00", "dlm_acc": "5.263e-01", "anc_acc": "5.020e-01", "epoch": 0.05006} {"step": 25035, "loss": 1.3656, "grad_norm": "3.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.165e-01", "anc_acc": "4.953e-01", "epoch": 0.05007} {"step": 25040, "loss": 1.4494, "grad_norm": "6.236e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.170e-01", "anc_acc": "4.947e-01", "epoch": 0.05008} {"step": 25045, "loss": 1.2217, "grad_norm": "3.518e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.496e+00", "dlm_acc": "5.598e-01", "anc_acc": "5.388e-01", "epoch": 0.05009} {"step": 25050, "loss": 0.9857, "grad_norm": "4.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.161e-01", "anc_acc": "5.891e-01", "epoch": 0.0501} {"step": 25055, "loss": 1.2246, "grad_norm": "6.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.646e-01", "anc_acc": "5.365e-01", "epoch": 0.05011} {"step": 25060, "loss": 1.4483, "grad_norm": "3.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.628e+00", "anc_loss": "1.747e+00", "dlm_acc": "4.741e-01", "anc_acc": "4.507e-01", "epoch": 0.05012} {"step": 25065, "loss": 1.6207, "grad_norm": "3.846e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.551e+00", "anc_loss": "1.664e+00", "dlm_acc": "5.304e-01", "anc_acc": "5.062e-01", "epoch": 0.05013} {"step": 25070, "loss": 1.5724, "grad_norm": "4.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.682e+00", "anc_loss": "1.798e+00", "dlm_acc": "4.737e-01", "anc_acc": "4.506e-01", "epoch": 0.05014} {"step": 25075, "loss": 1.7636, "grad_norm": "4.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.729e+00", "dlm_acc": "5.042e-01", "anc_acc": "4.803e-01", "epoch": 0.05015} {"step": 25080, "loss": 1.4557, "grad_norm": "4.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.633e+00", "anc_loss": "1.745e+00", "dlm_acc": "4.971e-01", "anc_acc": "4.740e-01", "epoch": 0.05016} {"step": 25085, "loss": 1.4729, "grad_norm": "3.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.754e-01", "anc_acc": "5.511e-01", "epoch": 0.05017} {"step": 25090, "loss": 1.0712, "grad_norm": "3.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.222e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.551e-01", "anc_acc": "5.274e-01", "epoch": 0.05018} {"step": 25095, "loss": 1.1177, "grad_norm": "4.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.258e-01", "anc_loss": "9.102e-01", "dlm_acc": "6.492e-01", "anc_acc": "6.261e-01", "epoch": 0.05019} {"step": 25100, "loss": 1.1631, "grad_norm": "2.912e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.221e+00", "dlm_acc": "5.971e-01", "anc_acc": "5.712e-01", "epoch": 0.0502} {"step": 25105, "loss": 0.9881, "grad_norm": "1.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.719e-01", "anc_loss": "1.083e+00", "dlm_acc": "6.247e-01", "anc_acc": "5.914e-01", "epoch": 0.05021} {"step": 25110, "loss": 1.3708, "grad_norm": "2.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.212e+00", "dlm_acc": "6.189e-01", "anc_acc": "5.705e-01", "epoch": 0.05022} {"step": 25115, "loss": 1.7487, "grad_norm": "5.358e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.678e+00", "anc_loss": "1.809e+00", "dlm_acc": "4.852e-01", "anc_acc": "4.616e-01", "epoch": 0.05023} {"step": 25120, "loss": 1.3923, "grad_norm": "4.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.600e+00", "anc_loss": "1.697e+00", "dlm_acc": "4.277e-01", "anc_acc": "4.073e-01", "epoch": 0.05024} {"step": 25125, "loss": 1.2994, "grad_norm": "4.915e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.501e+00", "anc_loss": "1.534e+00", "dlm_acc": "3.733e-01", "anc_acc": "3.629e-01", "epoch": 0.05025} {"step": 25130, "loss": 1.3488, "grad_norm": "3.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.232e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.441e-01", "anc_acc": "5.230e-01", "epoch": 0.05026} {"step": 25135, "loss": 1.6342, "grad_norm": "4.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.452e+00", "dlm_acc": "5.779e-01", "anc_acc": "5.538e-01", "epoch": 0.05027} {"step": 25140, "loss": 1.5435, "grad_norm": "4.899e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.256e+00", "anc_loss": "1.354e+00", "dlm_acc": "5.964e-01", "anc_acc": "5.780e-01", "epoch": 0.05028} {"step": 25145, "loss": 1.38, "grad_norm": "3.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.266e-01", "anc_loss": "1.003e+00", "dlm_acc": "6.281e-01", "anc_acc": "6.084e-01", "epoch": 0.05029} {"step": 25150, "loss": 1.2163, "grad_norm": "2.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.172e+00", "dlm_acc": "5.570e-01", "anc_acc": "5.374e-01", "epoch": 0.0503} {"step": 25155, "loss": 0.9997, "grad_norm": "4.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.625e-01", "anc_loss": "1.031e+00", "dlm_acc": "5.516e-01", "anc_acc": "5.265e-01", "epoch": 0.05031} {"step": 25160, "loss": 0.9603, "grad_norm": "7.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.191e-01", "anc_loss": "9.941e-01", "dlm_acc": "5.724e-01", "anc_acc": "5.454e-01", "epoch": 0.05032} {"step": 25165, "loss": 0.7223, "grad_norm": "2.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.445e-01", "anc_loss": "4.964e-01", "dlm_acc": "7.676e-01", "anc_acc": "7.493e-01", "epoch": 0.05033} {"step": 25170, "loss": 1.1754, "grad_norm": "3.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.194e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.551e-01", "anc_acc": "5.256e-01", "epoch": 0.05034} {"step": 25175, "loss": 1.405, "grad_norm": "4.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.220e+00", "dlm_acc": "5.659e-01", "anc_acc": "5.440e-01", "epoch": 0.05035} {"step": 25180, "loss": 1.2378, "grad_norm": "2.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.186e+00", "dlm_acc": "6.189e-01", "anc_acc": "5.969e-01", "epoch": 0.05036} {"step": 25185, "loss": 1.3226, "grad_norm": "4.104e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.822e-01", "anc_acc": "5.573e-01", "epoch": 0.05037} {"step": 25190, "loss": 1.172, "grad_norm": "1.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.284e+00", "dlm_acc": "5.838e-01", "anc_acc": "5.638e-01", "epoch": 0.05038} {"step": 25195, "loss": 0.897, "grad_norm": "2.370e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.500e-01", "anc_loss": "8.137e-01", "dlm_acc": "5.934e-01", "anc_acc": "5.677e-01", "epoch": 0.05039} {"step": 25200, "loss": 0.949, "grad_norm": "3.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.344e-01", "anc_loss": "9.352e-01", "dlm_acc": "5.435e-01", "anc_acc": "5.068e-01", "epoch": 0.0504} {"step": 25205, "loss": 1.492, "grad_norm": "3.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.553e+00", "dlm_acc": "4.453e-01", "anc_acc": "4.236e-01", "epoch": 0.05041} {"step": 25210, "loss": 1.491, "grad_norm": "3.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.530e+00", "dlm_acc": "4.400e-01", "anc_acc": "4.023e-01", "epoch": 0.05042} {"step": 25215, "loss": 1.4825, "grad_norm": "2.986e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.589e+00", "anc_loss": "1.671e+00", "dlm_acc": "4.756e-01", "anc_acc": "4.512e-01", "epoch": 0.05043} {"step": 25220, "loss": 1.295, "grad_norm": "7.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.433e+00", "dlm_acc": "5.765e-01", "anc_acc": "5.506e-01", "epoch": 0.05044} {"step": 25225, "loss": 1.0356, "grad_norm": "4.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.715e-01", "anc_loss": "7.211e-01", "dlm_acc": "6.403e-01", "anc_acc": "6.265e-01", "epoch": 0.05045} {"step": 25230, "loss": 1.6539, "grad_norm": "3.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.422e-01", "anc_acc": "5.207e-01", "epoch": 0.05046} {"step": 25235, "loss": 1.4074, "grad_norm": "3.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.694e-01", "anc_acc": "5.428e-01", "epoch": 0.05047} {"step": 25240, "loss": 1.0617, "grad_norm": "4.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.169e+00", "dlm_acc": "5.945e-01", "anc_acc": "5.656e-01", "epoch": 0.05048} {"step": 25245, "loss": 1.046, "grad_norm": "2.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.984e-01", "anc_loss": "1.039e+00", "dlm_acc": "6.557e-01", "anc_acc": "6.149e-01", "epoch": 0.05049} {"step": 25250, "loss": 1.4988, "grad_norm": "2.341e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.580e+00", "anc_loss": "1.667e+00", "dlm_acc": "5.059e-01", "anc_acc": "4.885e-01", "epoch": 0.0505} {"step": 25255, "loss": 1.2086, "grad_norm": "2.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.228e-01", "anc_acc": "4.982e-01", "epoch": 0.05051} {"step": 25260, "loss": 1.7931, "grad_norm": "6.649e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.381e+00", "anc_loss": "1.474e+00", "dlm_acc": "5.131e-01", "anc_acc": "4.926e-01", "epoch": 0.05052} {"step": 25265, "loss": 1.1308, "grad_norm": "5.352e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.226e+00", "anc_loss": "1.323e+00", "dlm_acc": "5.815e-01", "anc_acc": "5.556e-01", "epoch": 0.05053} {"step": 25270, "loss": 1.0845, "grad_norm": "2.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.258e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.655e-01", "anc_acc": "5.403e-01", "epoch": 0.05054} {"step": 25275, "loss": 0.7359, "grad_norm": "2.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.465e-01", "anc_loss": "4.953e-01", "dlm_acc": "8.154e-01", "anc_acc": "8.011e-01", "epoch": 0.05055} {"step": 25280, "loss": 1.2608, "grad_norm": "4.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.664e-01", "anc_loss": "9.383e-01", "dlm_acc": "6.959e-01", "anc_acc": "6.771e-01", "epoch": 0.05056} {"step": 25285, "loss": 1.5573, "grad_norm": "3.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.367e+00", "anc_loss": "1.469e+00", "dlm_acc": "5.530e-01", "anc_acc": "5.260e-01", "epoch": 0.05057} {"step": 25290, "loss": 1.499, "grad_norm": "5.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.365e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.385e-01", "epoch": 0.05058} {"step": 25295, "loss": 1.0975, "grad_norm": "7.758e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.082e-01", "anc_loss": "1.025e+00", "dlm_acc": "6.751e-01", "anc_acc": "6.417e-01", "epoch": 0.05059} {"step": 25300, "loss": 1.5705, "grad_norm": "5.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.489e+00", "anc_loss": "1.592e+00", "dlm_acc": "5.449e-01", "anc_acc": "5.234e-01", "epoch": 0.0506} {"step": 25305, "loss": 1.3642, "grad_norm": "6.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.321e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.817e-01", "anc_acc": "5.580e-01", "epoch": 0.05061} {"step": 25310, "loss": 1.2105, "grad_norm": "3.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.206e+00", "anc_loss": "1.307e+00", "dlm_acc": "5.581e-01", "anc_acc": "5.321e-01", "epoch": 0.05062} {"step": 25315, "loss": 1.1684, "grad_norm": "3.523e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.215e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.817e-01", "anc_acc": "5.557e-01", "epoch": 0.05063} {"step": 25320, "loss": 1.191, "grad_norm": "2.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.506e+00", "anc_loss": "1.619e+00", "dlm_acc": "5.233e-01", "anc_acc": "4.998e-01", "epoch": 0.05064} {"step": 25325, "loss": 1.0872, "grad_norm": "3.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.408e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.165e-01", "epoch": 0.05065} {"step": 25330, "loss": 0.9783, "grad_norm": "5.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.255e+00", "dlm_acc": "5.386e-01", "anc_acc": "5.117e-01", "epoch": 0.05066} {"step": 25335, "loss": 1.0059, "grad_norm": "2.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.757e-01", "anc_acc": "5.451e-01", "epoch": 0.05067} {"step": 25340, "loss": 1.0801, "grad_norm": "7.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.722e+00", "dlm_acc": "4.694e-01", "anc_acc": "4.451e-01", "epoch": 0.05068} {"step": 25345, "loss": 0.9283, "grad_norm": "4.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.904e-01", "anc_loss": "5.492e-01", "dlm_acc": "7.422e-01", "anc_acc": "7.196e-01", "epoch": 0.05069} {"step": 25350, "loss": 1.3864, "grad_norm": "5.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.419e-01", "anc_acc": "5.183e-01", "epoch": 0.0507} {"step": 25355, "loss": 1.2845, "grad_norm": "3.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.446e+00", "dlm_acc": "4.754e-01", "anc_acc": "4.505e-01", "epoch": 0.05071} {"step": 25360, "loss": 1.5099, "grad_norm": "2.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.542e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.123e-01", "anc_acc": "4.883e-01", "epoch": 0.05072} {"step": 25365, "loss": 1.3156, "grad_norm": "4.524e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.090e+00", "dlm_acc": "6.011e-01", "anc_acc": "5.794e-01", "epoch": 0.05073} {"step": 25370, "loss": 1.4241, "grad_norm": "3.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.342e-01", "epoch": 0.05074} {"step": 25375, "loss": 1.2279, "grad_norm": "2.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.031e+00", "anc_loss": "1.144e+00", "dlm_acc": "5.959e-01", "anc_acc": "5.645e-01", "epoch": 0.05075} {"step": 25380, "loss": 1.2188, "grad_norm": "3.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.357e-01", "anc_acc": "5.083e-01", "epoch": 0.05076} {"step": 25385, "loss": 1.5259, "grad_norm": "8.048e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.924e-01", "anc_acc": "5.646e-01", "epoch": 0.05077} {"step": 25390, "loss": 1.6357, "grad_norm": "3.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.495e+00", "dlm_acc": "4.285e-01", "anc_acc": "4.151e-01", "epoch": 0.05078} {"step": 25395, "loss": 1.1533, "grad_norm": "2.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.758e-01", "anc_loss": "1.096e+00", "dlm_acc": "6.033e-01", "anc_acc": "5.635e-01", "epoch": 0.05079} {"step": 25400, "loss": 1.1361, "grad_norm": "2.983e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.008e-01", "anc_loss": "1.020e+00", "dlm_acc": "6.213e-01", "anc_acc": "5.762e-01", "epoch": 0.0508} {"step": 25405, "loss": 1.1123, "grad_norm": "2.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.980e-01", "anc_loss": "7.770e-01", "dlm_acc": "6.588e-01", "anc_acc": "6.249e-01", "epoch": 0.05081} {"step": 25410, "loss": 1.3629, "grad_norm": "2.196e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.263e+00", "dlm_acc": "4.896e-01", "anc_acc": "4.712e-01", "epoch": 0.05082} {"step": 25415, "loss": 1.3415, "grad_norm": "3.418e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.442e+00", "dlm_acc": "4.897e-01", "anc_acc": "4.614e-01", "epoch": 0.05083} {"step": 25420, "loss": 1.5235, "grad_norm": "3.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.179e+00", "anc_loss": "1.286e+00", "dlm_acc": "5.967e-01", "anc_acc": "5.712e-01", "epoch": 0.05084} {"step": 25425, "loss": 1.159, "grad_norm": "3.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.122e+00", "anc_loss": "1.213e+00", "dlm_acc": "5.884e-01", "anc_acc": "5.644e-01", "epoch": 0.05085} {"step": 25430, "loss": 1.6815, "grad_norm": "3.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.603e+00", "anc_loss": "1.712e+00", "dlm_acc": "5.202e-01", "anc_acc": "4.993e-01", "epoch": 0.05086} {"step": 25435, "loss": 1.2667, "grad_norm": "2.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.773e-01", "anc_loss": "1.045e+00", "dlm_acc": "5.660e-01", "anc_acc": "5.463e-01", "epoch": 0.05087} {"step": 25440, "loss": 1.4293, "grad_norm": "3.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.199e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.900e-01", "anc_acc": "5.567e-01", "epoch": 0.05088} {"step": 25445, "loss": 1.1395, "grad_norm": "3.749e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.574e-01", "anc_loss": "8.293e-01", "dlm_acc": "6.822e-01", "anc_acc": "6.628e-01", "epoch": 0.05089} {"step": 25450, "loss": 1.4651, "grad_norm": "2.516e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.085e+00", "dlm_acc": "6.280e-01", "anc_acc": "6.119e-01", "epoch": 0.0509} {"step": 25455, "loss": 1.127, "grad_norm": "3.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.406e-01", "anc_loss": "9.094e-01", "dlm_acc": "6.198e-01", "anc_acc": "5.988e-01", "epoch": 0.05091} {"step": 25460, "loss": 1.4382, "grad_norm": "6.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.362e+00", "dlm_acc": "5.690e-01", "anc_acc": "5.386e-01", "epoch": 0.05092} {"step": 25465, "loss": 0.9869, "grad_norm": "3.185e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.598e-01", "anc_loss": "8.434e-01", "dlm_acc": "6.255e-01", "anc_acc": "6.013e-01", "epoch": 0.05093} {"step": 25470, "loss": 1.5782, "grad_norm": "5.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.400e+00", "anc_loss": "1.510e+00", "dlm_acc": "5.133e-01", "anc_acc": "4.843e-01", "epoch": 0.05094} {"step": 25475, "loss": 1.4533, "grad_norm": "7.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.270e+00", "dlm_acc": "5.516e-01", "anc_acc": "5.276e-01", "epoch": 0.05095} {"step": 25480, "loss": 1.6835, "grad_norm": "6.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.222e-01", "epoch": 0.05096} {"step": 25485, "loss": 1.1077, "grad_norm": "2.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.437e-01", "anc_loss": "1.028e+00", "dlm_acc": "6.493e-01", "anc_acc": "6.278e-01", "epoch": 0.05097} {"step": 25490, "loss": 0.8524, "grad_norm": "5.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.683e-01", "anc_loss": "7.179e-01", "dlm_acc": "7.656e-01", "anc_acc": "7.519e-01", "epoch": 0.05098} {"step": 25495, "loss": 1.0542, "grad_norm": "2.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.209e+00", "dlm_acc": "6.139e-01", "anc_acc": "5.862e-01", "epoch": 0.05099} {"step": 25500, "loss": 1.3588, "grad_norm": "3.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.483e+00", "dlm_acc": "5.512e-01", "anc_acc": "5.265e-01", "epoch": 0.051} {"step": 25505, "loss": 1.5155, "grad_norm": "3.733e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.555e-01", "anc_acc": "5.296e-01", "epoch": 0.05101} {"step": 25510, "loss": 1.8244, "grad_norm": "4.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.653e+00", "anc_loss": "1.762e+00", "dlm_acc": "5.068e-01", "anc_acc": "4.852e-01", "epoch": 0.05102} {"step": 25515, "loss": 1.0293, "grad_norm": "2.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.547e-01", "anc_loss": "1.055e+00", "dlm_acc": "6.231e-01", "anc_acc": "5.952e-01", "epoch": 0.05103} {"step": 25520, "loss": 1.0289, "grad_norm": "2.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.832e-01", "anc_loss": "7.637e-01", "dlm_acc": "7.543e-01", "anc_acc": "7.326e-01", "epoch": 0.05104} {"step": 25525, "loss": 1.0815, "grad_norm": "2.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.453e-01", "anc_loss": "1.052e+00", "dlm_acc": "6.365e-01", "anc_acc": "6.094e-01", "epoch": 0.05105} {"step": 25530, "loss": 1.1963, "grad_norm": "5.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.029e+00", "anc_loss": "1.129e+00", "dlm_acc": "6.133e-01", "anc_acc": "5.867e-01", "epoch": 0.05106} {"step": 25535, "loss": 1.3612, "grad_norm": "3.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.613e+00", "anc_loss": "1.731e+00", "dlm_acc": "4.843e-01", "anc_acc": "4.596e-01", "epoch": 0.05107} {"step": 25540, "loss": 1.7171, "grad_norm": "8.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.483e+00", "anc_loss": "1.586e+00", "dlm_acc": "5.328e-01", "anc_acc": "5.111e-01", "epoch": 0.05108} {"step": 25545, "loss": 1.3889, "grad_norm": "9.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.293e+00", "dlm_acc": "6.178e-01", "anc_acc": "5.993e-01", "epoch": 0.05109} {"step": 25550, "loss": 1.5853, "grad_norm": "4.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.533e-01", "anc_acc": "5.299e-01", "epoch": 0.0511} {"step": 25555, "loss": 1.4224, "grad_norm": "4.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.404e+00", "anc_loss": "1.506e+00", "dlm_acc": "5.711e-01", "anc_acc": "5.464e-01", "epoch": 0.05111} {"step": 25560, "loss": 1.3956, "grad_norm": "3.322e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.523e+00", "dlm_acc": "5.294e-01", "anc_acc": "5.083e-01", "epoch": 0.05112} {"step": 25565, "loss": 1.6884, "grad_norm": "7.261e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.600e+00", "dlm_acc": "5.205e-01", "anc_acc": "5.018e-01", "epoch": 0.05113} {"step": 25570, "loss": 1.8547, "grad_norm": "3.685e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.261e-01", "epoch": 0.05114} {"step": 25575, "loss": 1.1967, "grad_norm": "4.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.589e-01", "anc_acc": "5.324e-01", "epoch": 0.05115} {"step": 25580, "loss": 1.3997, "grad_norm": "4.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.353e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.386e-01", "epoch": 0.05116} {"step": 25585, "loss": 1.1757, "grad_norm": "6.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.276e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.658e-01", "anc_acc": "5.428e-01", "epoch": 0.05117} {"step": 25590, "loss": 1.2168, "grad_norm": "2.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.220e+00", "dlm_acc": "6.116e-01", "anc_acc": "5.887e-01", "epoch": 0.05118} {"step": 25595, "loss": 1.5743, "grad_norm": "4.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.335e+00", "dlm_acc": "5.889e-01", "anc_acc": "5.604e-01", "epoch": 0.05119} {"step": 25600, "loss": 1.2533, "grad_norm": "2.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.262e+00", "dlm_acc": "6.254e-01", "anc_acc": "6.009e-01", "epoch": 0.0512} {"step": 25605, "loss": 1.336, "grad_norm": "3.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.417e+00", "anc_loss": "1.522e+00", "dlm_acc": "5.133e-01", "anc_acc": "4.887e-01", "epoch": 0.05121} {"step": 25610, "loss": 1.1086, "grad_norm": "2.092e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.560e-01", "anc_acc": "5.301e-01", "epoch": 0.05122} {"step": 25615, "loss": 1.352, "grad_norm": "2.326e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.362e+00", "anc_loss": "1.472e+00", "dlm_acc": "5.374e-01", "anc_acc": "5.097e-01", "epoch": 0.05123} {"step": 25620, "loss": 0.8899, "grad_norm": "4.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.056e+00", "anc_loss": "1.145e+00", "dlm_acc": "6.233e-01", "anc_acc": "6.020e-01", "epoch": 0.05124} {"step": 25625, "loss": 1.1319, "grad_norm": "2.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.143e-01", "anc_acc": "4.772e-01", "epoch": 0.05125} {"step": 25630, "loss": 1.0597, "grad_norm": "3.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.823e-01", "anc_loss": "1.082e+00", "dlm_acc": "6.297e-01", "anc_acc": "6.044e-01", "epoch": 0.05126} {"step": 25635, "loss": 1.1791, "grad_norm": "4.220e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.260e+00", "dlm_acc": "5.805e-01", "anc_acc": "5.518e-01", "epoch": 0.05127} {"step": 25640, "loss": 0.9718, "grad_norm": "3.818e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.109e-01", "anc_loss": "8.195e-01", "dlm_acc": "6.910e-01", "anc_acc": "6.594e-01", "epoch": 0.05128} {"step": 25645, "loss": 1.8271, "grad_norm": "3.430e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.994e+00", "anc_loss": "2.062e+00", "dlm_acc": "3.038e-01", "anc_acc": "2.833e-01", "epoch": 0.05129} {"step": 25650, "loss": 2.1689, "grad_norm": "5.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.428e+00", "anc_loss": "2.498e+00", "dlm_acc": "2.966e-01", "anc_acc": "2.827e-01", "epoch": 0.0513} {"step": 25655, "loss": 1.7205, "grad_norm": "6.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.770e+00", "anc_loss": "1.847e+00", "dlm_acc": "4.275e-01", "anc_acc": "4.104e-01", "epoch": 0.05131} {"step": 25660, "loss": 1.5732, "grad_norm": "3.741e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.226e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.363e-01", "epoch": 0.05132} {"step": 25665, "loss": 1.2125, "grad_norm": "1.969e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.153e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.827e-01", "anc_acc": "5.575e-01", "epoch": 0.05133} {"step": 25670, "loss": 1.284, "grad_norm": "5.422e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.583e+00", "anc_loss": "1.695e+00", "dlm_acc": "4.836e-01", "anc_acc": "4.588e-01", "epoch": 0.05134} {"step": 25675, "loss": 0.8743, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.211e-01", "anc_loss": "1.006e+00", "dlm_acc": "5.832e-01", "anc_acc": "5.612e-01", "epoch": 0.05135} {"step": 25680, "loss": 0.9668, "grad_norm": "4.753e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.922e-01", "anc_loss": "1.065e+00", "dlm_acc": "6.337e-01", "anc_acc": "6.169e-01", "epoch": 0.05136} {"step": 25685, "loss": 0.8277, "grad_norm": "2.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.242e-01", "anc_loss": "8.902e-01", "dlm_acc": "6.271e-01", "anc_acc": "6.086e-01", "epoch": 0.05137} {"step": 25690, "loss": 1.0838, "grad_norm": "2.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.629e-01", "anc_acc": "5.391e-01", "epoch": 0.05138} {"step": 25695, "loss": 1.0144, "grad_norm": "3.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.751e-01", "anc_acc": "5.491e-01", "epoch": 0.05139} {"step": 25700, "loss": 1.3741, "grad_norm": "4.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.042e-01", "anc_acc": "4.687e-01", "epoch": 0.0514} {"step": 25705, "loss": 1.4648, "grad_norm": "8.361e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.109e+00", "dlm_acc": "5.155e-01", "anc_acc": "4.956e-01", "epoch": 0.05141} {"step": 25710, "loss": 1.3413, "grad_norm": "3.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.078e-01", "anc_loss": "7.508e-01", "dlm_acc": "5.304e-01", "anc_acc": "5.162e-01", "epoch": 0.05142} {"step": 25715, "loss": 1.2147, "grad_norm": "3.379e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.484e-01", "anc_loss": "6.789e-01", "dlm_acc": "5.476e-01", "anc_acc": "5.359e-01", "epoch": 0.05143} {"step": 25720, "loss": 1.5005, "grad_norm": "4.132e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.257e+00", "dlm_acc": "5.984e-01", "anc_acc": "5.684e-01", "epoch": 0.05144} {"step": 25725, "loss": 1.214, "grad_norm": "2.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.472e+00", "dlm_acc": "5.550e-01", "anc_acc": "5.308e-01", "epoch": 0.05145} {"step": 25730, "loss": 1.2385, "grad_norm": "3.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.883e-01", "anc_loss": "8.445e-01", "dlm_acc": "6.170e-01", "anc_acc": "6.010e-01", "epoch": 0.05146} {"step": 25735, "loss": 1.0722, "grad_norm": "6.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.898e-01", "anc_loss": "7.602e-01", "dlm_acc": "5.989e-01", "anc_acc": "5.678e-01", "epoch": 0.05147} {"step": 25740, "loss": 1.4171, "grad_norm": "4.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.546e-01", "anc_loss": "1.045e+00", "dlm_acc": "6.427e-01", "anc_acc": "6.198e-01", "epoch": 0.05148} {"step": 25745, "loss": 1.7391, "grad_norm": "3.898e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.548e+00", "anc_loss": "1.660e+00", "dlm_acc": "4.968e-01", "anc_acc": "4.762e-01", "epoch": 0.05149} {"step": 25750, "loss": 1.5411, "grad_norm": "6.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.727e+00", "anc_loss": "1.837e+00", "dlm_acc": "4.556e-01", "anc_acc": "4.324e-01", "epoch": 0.0515} {"step": 25755, "loss": 0.9536, "grad_norm": "4.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.719e-01", "anc_loss": "1.057e+00", "dlm_acc": "5.399e-01", "anc_acc": "5.224e-01", "epoch": 0.05151} {"step": 25760, "loss": 1.688, "grad_norm": "4.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.483e+00", "anc_loss": "1.587e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.800e-01", "epoch": 0.05152} {"step": 25765, "loss": 1.47, "grad_norm": "6.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.101e-01", "epoch": 0.05153} {"step": 25770, "loss": 1.0612, "grad_norm": "4.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.133e+00", "dlm_acc": "6.365e-01", "anc_acc": "6.132e-01", "epoch": 0.05154} {"step": 25775, "loss": 1.1707, "grad_norm": "1.322e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.220e+00", "dlm_acc": "6.141e-01", "anc_acc": "5.939e-01", "epoch": 0.05155} {"step": 25780, "loss": 1.4122, "grad_norm": "3.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.539e+00", "anc_loss": "1.650e+00", "dlm_acc": "4.336e-01", "anc_acc": "4.077e-01", "epoch": 0.05156} {"step": 25785, "loss": 1.4879, "grad_norm": "3.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.194e+00", "anc_loss": "1.393e+00", "dlm_acc": "5.269e-01", "anc_acc": "4.656e-01", "epoch": 0.05157} {"step": 25790, "loss": 1.3244, "grad_norm": "1.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.836e-01", "anc_acc": "5.350e-01", "epoch": 0.05158} {"step": 25795, "loss": 1.1444, "grad_norm": "2.905e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.539e-01", "anc_loss": "8.477e-01", "dlm_acc": "6.905e-01", "anc_acc": "6.644e-01", "epoch": 0.05159} {"step": 25800, "loss": 1.4204, "grad_norm": "2.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.195e-01", "anc_acc": "4.834e-01", "epoch": 0.0516} {"step": 25805, "loss": 1.4763, "grad_norm": "3.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.326e+00", "anc_loss": "1.431e+00", "dlm_acc": "5.602e-01", "anc_acc": "5.345e-01", "epoch": 0.05161} {"step": 25810, "loss": 1.1827, "grad_norm": "4.049e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.241e-01", "anc_acc": "5.042e-01", "epoch": 0.05162} {"step": 25815, "loss": 1.2216, "grad_norm": "3.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.377e-01", "anc_acc": "5.157e-01", "epoch": 0.05163} {"step": 25820, "loss": 1.377, "grad_norm": "2.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.488e-01", "anc_acc": "5.235e-01", "epoch": 0.05164} {"step": 25825, "loss": 1.3704, "grad_norm": "2.291e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.781e-01", "anc_acc": "5.509e-01", "epoch": 0.05165} {"step": 25830, "loss": 1.7131, "grad_norm": "3.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.269e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.352e-01", "anc_acc": "5.018e-01", "epoch": 0.05166} {"step": 25835, "loss": 1.6847, "grad_norm": "3.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.552e-01", "anc_acc": "5.325e-01", "epoch": 0.05167} {"step": 25840, "loss": 1.0979, "grad_norm": "2.560e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.242e-01", "anc_loss": "7.922e-01", "dlm_acc": "7.321e-01", "anc_acc": "7.153e-01", "epoch": 0.05168} {"step": 25845, "loss": 1.3766, "grad_norm": "3.333e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.269e+00", "anc_loss": "1.358e+00", "dlm_acc": "4.501e-01", "anc_acc": "4.185e-01", "epoch": 0.05169} {"step": 25850, "loss": 1.6494, "grad_norm": "3.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.714e+00", "anc_loss": "1.746e+00", "dlm_acc": "3.047e-01", "anc_acc": "2.862e-01", "epoch": 0.0517} {"step": 25855, "loss": 1.4719, "grad_norm": "2.136e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.173e+00", "dlm_acc": "6.056e-01", "anc_acc": "5.777e-01", "epoch": 0.05171} {"step": 25860, "loss": 1.3021, "grad_norm": "3.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.883e-01", "anc_loss": "7.871e-01", "dlm_acc": "7.110e-01", "anc_acc": "6.778e-01", "epoch": 0.05172} {"step": 25865, "loss": 1.5456, "grad_norm": "6.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.374e-01", "anc_acc": "5.112e-01", "epoch": 0.05173} {"step": 25870, "loss": 1.6538, "grad_norm": "4.138e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.356e+00", "dlm_acc": "5.431e-01", "anc_acc": "5.208e-01", "epoch": 0.05174} {"step": 25875, "loss": 1.0613, "grad_norm": "1.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.125e-01", "anc_loss": "9.902e-01", "dlm_acc": "6.156e-01", "anc_acc": "5.939e-01", "epoch": 0.05175} {"step": 25880, "loss": 1.4065, "grad_norm": "4.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.079e+00", "dlm_acc": "5.267e-01", "anc_acc": "5.105e-01", "epoch": 0.05176} {"step": 25885, "loss": 1.0598, "grad_norm": "3.770e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.484e-01", "anc_loss": "6.562e-01", "dlm_acc": "5.004e-01", "anc_acc": "4.955e-01", "epoch": 0.05177} {"step": 25890, "loss": 0.72, "grad_norm": "2.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.723e-01", "anc_loss": "5.766e-01", "dlm_acc": "5.083e-01", "anc_acc": "5.057e-01", "epoch": 0.05178} {"step": 25895, "loss": 1.0577, "grad_norm": "2.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.117e-01", "anc_loss": "6.180e-01", "dlm_acc": "4.993e-01", "anc_acc": "4.964e-01", "epoch": 0.05179} {"step": 25900, "loss": 1.3434, "grad_norm": "3.583e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.203e-01", "anc_loss": "7.336e-01", "dlm_acc": "4.834e-01", "anc_acc": "4.762e-01", "epoch": 0.0518} {"step": 25905, "loss": 1.0851, "grad_norm": "4.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.024e+00", "anc_loss": "1.084e+00", "dlm_acc": "6.280e-01", "anc_acc": "6.141e-01", "epoch": 0.05181} {"step": 25910, "loss": 1.2241, "grad_norm": "4.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.637e+00", "dlm_acc": "5.148e-01", "anc_acc": "4.786e-01", "epoch": 0.05182} {"step": 25915, "loss": 1.0015, "grad_norm": "3.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.600e-01", "anc_loss": "5.230e-01", "dlm_acc": "8.121e-01", "anc_acc": "7.968e-01", "epoch": 0.05183} {"step": 25920, "loss": 1.2121, "grad_norm": "4.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.648e+00", "anc_loss": "1.745e+00", "dlm_acc": "5.079e-01", "anc_acc": "4.896e-01", "epoch": 0.05184} {"step": 25925, "loss": 0.9456, "grad_norm": "4.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.346e-01", "anc_loss": "9.092e-01", "dlm_acc": "6.906e-01", "anc_acc": "6.717e-01", "epoch": 0.05185} {"step": 25930, "loss": 0.868, "grad_norm": "3.201e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.165e+00", "dlm_acc": "5.549e-01", "anc_acc": "5.341e-01", "epoch": 0.05186} {"step": 25935, "loss": 0.9749, "grad_norm": "2.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.418e+00", "dlm_acc": "4.933e-01", "anc_acc": "4.659e-01", "epoch": 0.05187} {"step": 25940, "loss": 1.2197, "grad_norm": "1.647e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.255e+00", "dlm_acc": "5.746e-01", "anc_acc": "5.473e-01", "epoch": 0.05188} {"step": 25945, "loss": 1.165, "grad_norm": "2.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.073e+00", "dlm_acc": "6.080e-01", "anc_acc": "5.888e-01", "epoch": 0.05189} {"step": 25950, "loss": 1.2283, "grad_norm": "4.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.097e+00", "anc_loss": "1.179e+00", "dlm_acc": "5.827e-01", "anc_acc": "5.605e-01", "epoch": 0.0519} {"step": 25955, "loss": 0.8725, "grad_norm": "2.774e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.445e-01", "anc_loss": "1.043e+00", "dlm_acc": "6.265e-01", "anc_acc": "6.002e-01", "epoch": 0.05191} {"step": 25960, "loss": 0.8543, "grad_norm": "3.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.078e-01", "anc_loss": "1.013e+00", "dlm_acc": "6.697e-01", "anc_acc": "6.368e-01", "epoch": 0.05192} {"step": 25965, "loss": 0.9489, "grad_norm": "3.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.246e-01", "anc_loss": "5.625e-01", "dlm_acc": "6.498e-01", "anc_acc": "6.285e-01", "epoch": 0.05193} {"step": 25970, "loss": 0.9176, "grad_norm": "2.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.364e+00", "anc_loss": "1.483e+00", "dlm_acc": "5.411e-01", "anc_acc": "5.170e-01", "epoch": 0.05194} {"step": 25975, "loss": 1.4985, "grad_norm": "4.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.588e+00", "anc_loss": "1.687e+00", "dlm_acc": "5.014e-01", "anc_acc": "4.799e-01", "epoch": 0.05195} {"step": 25980, "loss": 1.2075, "grad_norm": "3.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.627e-01", "anc_acc": "5.412e-01", "epoch": 0.05196} {"step": 25985, "loss": 1.383, "grad_norm": "5.137e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.592e+00", "anc_loss": "1.703e+00", "dlm_acc": "5.168e-01", "anc_acc": "4.929e-01", "epoch": 0.05197} {"step": 25990, "loss": 0.8886, "grad_norm": "3.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.174e-01", "anc_loss": "9.996e-01", "dlm_acc": "6.547e-01", "anc_acc": "6.338e-01", "epoch": 0.05198} {"step": 25995, "loss": 1.2281, "grad_norm": "2.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.444e+00", "anc_loss": "1.553e+00", "dlm_acc": "5.095e-01", "anc_acc": "4.843e-01", "epoch": 0.05199} {"step": 26000, "loss": 1.9544, "grad_norm": "6.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.671e+00", "dlm_acc": "5.052e-01", "anc_acc": "4.852e-01", "epoch": 0.052} {"step": 26005, "loss": 1.7476, "grad_norm": "3.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.730e+00", "anc_loss": "1.834e+00", "dlm_acc": "4.659e-01", "anc_acc": "4.451e-01", "epoch": 0.05201} {"step": 26010, "loss": 1.4722, "grad_norm": "2.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.513e+00", "anc_loss": "1.608e+00", "dlm_acc": "4.892e-01", "anc_acc": "4.659e-01", "epoch": 0.05202} {"step": 26015, "loss": 1.1026, "grad_norm": "4.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.269e+00", "dlm_acc": "5.920e-01", "anc_acc": "5.681e-01", "epoch": 0.05203} {"step": 26020, "loss": 1.2199, "grad_norm": "5.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.131e-01", "anc_acc": "4.943e-01", "epoch": 0.05204} {"step": 26025, "loss": 1.2235, "grad_norm": "3.557e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.162e+00", "dlm_acc": "6.210e-01", "anc_acc": "5.940e-01", "epoch": 0.05205} {"step": 26030, "loss": 1.9481, "grad_norm": "3.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.564e+00", "anc_loss": "1.666e+00", "dlm_acc": "4.938e-01", "anc_acc": "4.734e-01", "epoch": 0.05206} {"step": 26035, "loss": 1.5223, "grad_norm": "3.771e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.487e+00", "anc_loss": "1.592e+00", "dlm_acc": "5.098e-01", "anc_acc": "4.877e-01", "epoch": 0.05207} {"step": 26040, "loss": 1.3352, "grad_norm": "5.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.326e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.518e-01", "anc_acc": "5.236e-01", "epoch": 0.05208} {"step": 26045, "loss": 1.3945, "grad_norm": "5.210e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.381e-01", "anc_acc": "5.160e-01", "epoch": 0.05209} {"step": 26050, "loss": 0.9184, "grad_norm": "5.951e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.141e+00", "dlm_acc": "6.349e-01", "anc_acc": "6.066e-01", "epoch": 0.0521} {"step": 26055, "loss": 0.6626, "grad_norm": "2.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.016e-01", "anc_loss": "8.775e-01", "dlm_acc": "6.617e-01", "anc_acc": "6.401e-01", "epoch": 0.05211} {"step": 26060, "loss": 1.1651, "grad_norm": "3.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.402e+00", "dlm_acc": "4.953e-01", "anc_acc": "4.745e-01", "epoch": 0.05212} {"step": 26065, "loss": 0.6678, "grad_norm": "3.244e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.121e-01", "anc_loss": "6.621e-01", "dlm_acc": "6.098e-01", "anc_acc": "5.834e-01", "epoch": 0.05213} {"step": 26070, "loss": 0.7962, "grad_norm": "4.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.527e-01", "anc_loss": "6.059e-01", "dlm_acc": "6.563e-01", "anc_acc": "6.337e-01", "epoch": 0.05214} {"step": 26075, "loss": 1.0522, "grad_norm": "1.032e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.105e+00", "dlm_acc": "5.984e-01", "anc_acc": "5.690e-01", "epoch": 0.05215} {"step": 26080, "loss": 0.7306, "grad_norm": "2.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.340e-01", "anc_loss": "9.141e-01", "dlm_acc": "6.234e-01", "anc_acc": "5.962e-01", "epoch": 0.05216} {"step": 26085, "loss": 0.8629, "grad_norm": "3.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.891e-01", "anc_loss": "1.091e+00", "dlm_acc": "6.256e-01", "anc_acc": "5.992e-01", "epoch": 0.05217} {"step": 26090, "loss": 0.9275, "grad_norm": "5.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.117e-01", "anc_loss": "9.195e-01", "dlm_acc": "3.080e-01", "anc_acc": "3.034e-01", "epoch": 0.05218} {"step": 26095, "loss": 0.8877, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.922e-01", "anc_loss": "9.617e-01", "dlm_acc": "5.407e-01", "anc_acc": "5.169e-01", "epoch": 0.05219} {"step": 26100, "loss": 1.2403, "grad_norm": "3.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.198e-01", "anc_loss": "6.422e-01", "dlm_acc": "6.527e-01", "anc_acc": "6.444e-01", "epoch": 0.0522} {"step": 26105, "loss": 1.1253, "grad_norm": "3.256e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.016e-01", "anc_loss": "7.117e-01", "dlm_acc": "5.577e-01", "anc_acc": "5.561e-01", "epoch": 0.05221} {"step": 26110, "loss": 1.1795, "grad_norm": "4.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.115e+00", "anc_loss": "1.193e+00", "dlm_acc": "6.072e-01", "anc_acc": "5.918e-01", "epoch": 0.05222} {"step": 26115, "loss": 0.8009, "grad_norm": "1.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.719e-01", "anc_loss": "7.016e-01", "dlm_acc": "5.483e-01", "anc_acc": "5.409e-01", "epoch": 0.05223} {"step": 26120, "loss": 0.9926, "grad_norm": "5.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.070e-01", "anc_loss": "8.906e-01", "dlm_acc": "6.400e-01", "anc_acc": "6.158e-01", "epoch": 0.05224} {"step": 26125, "loss": 1.0777, "grad_norm": "3.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.953e-01", "anc_acc": "5.787e-01", "epoch": 0.05225} {"step": 26130, "loss": 0.8684, "grad_norm": "1.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.086e+00", "dlm_acc": "5.201e-01", "anc_acc": "5.029e-01", "epoch": 0.05226} {"step": 26135, "loss": 0.9715, "grad_norm": "2.787e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.430e-01", "anc_loss": "7.453e-01", "dlm_acc": "4.219e-01", "anc_acc": "4.200e-01", "epoch": 0.05227} {"step": 26140, "loss": 0.9997, "grad_norm": "2.568e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.078e-01", "anc_loss": "8.164e-01", "dlm_acc": "3.861e-01", "anc_acc": "3.827e-01", "epoch": 0.05228} {"step": 26145, "loss": 1.36, "grad_norm": "4.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.164e-01", "anc_loss": "9.719e-01", "dlm_acc": "5.432e-01", "anc_acc": "5.288e-01", "epoch": 0.05229} {"step": 26150, "loss": 1.3429, "grad_norm": "3.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.461e-01", "anc_loss": "1.020e+00", "dlm_acc": "5.741e-01", "anc_acc": "5.534e-01", "epoch": 0.0523} {"step": 26155, "loss": 1.1564, "grad_norm": "2.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.287e-01", "anc_loss": "8.977e-01", "dlm_acc": "6.562e-01", "anc_acc": "6.323e-01", "epoch": 0.05231} {"step": 26160, "loss": 1.0295, "grad_norm": "4.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.477e-01", "anc_loss": "9.227e-01", "dlm_acc": "5.995e-01", "anc_acc": "5.739e-01", "epoch": 0.05232} {"step": 26165, "loss": 1.1958, "grad_norm": "2.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.187e-01", "anc_loss": "9.805e-01", "dlm_acc": "5.965e-01", "anc_acc": "5.780e-01", "epoch": 0.05233} {"step": 26170, "loss": 1.1118, "grad_norm": "3.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.473e-01", "anc_loss": "9.082e-01", "dlm_acc": "5.836e-01", "anc_acc": "5.629e-01", "epoch": 0.05234} {"step": 26175, "loss": 1.1343, "grad_norm": "2.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.348e-01", "anc_loss": "8.031e-01", "dlm_acc": "5.815e-01", "anc_acc": "5.562e-01", "epoch": 0.05235} {"step": 26180, "loss": 0.8786, "grad_norm": "3.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.194e-01", "anc_loss": "4.505e-01", "dlm_acc": "7.881e-01", "anc_acc": "7.769e-01", "epoch": 0.05236} {"step": 26185, "loss": 1.0229, "grad_norm": "3.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.302e-01", "anc_loss": "6.776e-01", "dlm_acc": "7.195e-01", "anc_acc": "7.051e-01", "epoch": 0.05237} {"step": 26190, "loss": 1.2298, "grad_norm": "2.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.299e+00", "anc_loss": "1.355e+00", "dlm_acc": "4.246e-01", "anc_acc": "4.125e-01", "epoch": 0.05238} {"step": 26195, "loss": 0.9466, "grad_norm": "2.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.795e-01", "anc_loss": "8.244e-01", "dlm_acc": "6.881e-01", "anc_acc": "6.801e-01", "epoch": 0.05239} {"step": 26200, "loss": 1.0664, "grad_norm": "1.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.850e-01", "anc_loss": "1.063e+00", "dlm_acc": "6.205e-01", "anc_acc": "5.949e-01", "epoch": 0.0524} {"step": 26205, "loss": 1.1952, "grad_norm": "3.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.273e-01", "anc_loss": "8.629e-01", "dlm_acc": "6.000e-01", "anc_acc": "5.882e-01", "epoch": 0.05241} {"step": 26210, "loss": 1.1695, "grad_norm": "3.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.125e-01", "anc_loss": "6.500e-01", "dlm_acc": "5.745e-01", "anc_acc": "5.532e-01", "epoch": 0.05242} {"step": 26215, "loss": 1.448, "grad_norm": "2.211e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.153e+00", "anc_loss": "1.249e+00", "dlm_acc": "5.989e-01", "anc_acc": "5.733e-01", "epoch": 0.05243} {"step": 26220, "loss": 1.2878, "grad_norm": "3.688e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.197e+00", "anc_loss": "1.289e+00", "dlm_acc": "5.600e-01", "anc_acc": "5.342e-01", "epoch": 0.05244} {"step": 26225, "loss": 1.4259, "grad_norm": "6.010e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.508e-01", "anc_loss": "7.688e-01", "dlm_acc": "7.279e-01", "anc_acc": "6.927e-01", "epoch": 0.05245} {"step": 26230, "loss": 1.2714, "grad_norm": "4.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.818e-01", "anc_loss": "1.034e+00", "dlm_acc": "5.981e-01", "anc_acc": "5.850e-01", "epoch": 0.05246} {"step": 26235, "loss": 1.1339, "grad_norm": "3.347e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.844e-01", "anc_loss": "1.052e+00", "dlm_acc": "5.414e-01", "anc_acc": "5.182e-01", "epoch": 0.05247} {"step": 26240, "loss": 1.158, "grad_norm": "2.313e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.215e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.881e-01", "anc_acc": "5.666e-01", "epoch": 0.05248} {"step": 26245, "loss": 0.8451, "grad_norm": "3.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.057e-01", "anc_loss": "6.297e-01", "dlm_acc": "6.902e-01", "anc_acc": "6.822e-01", "epoch": 0.05249} {"step": 26250, "loss": 1.5515, "grad_norm": "9.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.185e+00", "dlm_acc": "6.061e-01", "anc_acc": "5.863e-01", "epoch": 0.0525} {"step": 26255, "loss": 1.2788, "grad_norm": "4.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.227e+00", "dlm_acc": "6.438e-01", "anc_acc": "6.142e-01", "epoch": 0.05251} {"step": 26260, "loss": 1.3667, "grad_norm": "4.280e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.407e-01", "anc_acc": "6.165e-01", "epoch": 0.05252} {"step": 26265, "loss": 1.4199, "grad_norm": "3.280e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.201e+00", "anc_loss": "1.297e+00", "dlm_acc": "6.018e-01", "anc_acc": "5.777e-01", "epoch": 0.05253} {"step": 26270, "loss": 1.0742, "grad_norm": "2.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.992e-01", "anc_loss": "1.100e+00", "dlm_acc": "5.949e-01", "anc_acc": "5.677e-01", "epoch": 0.05254} {"step": 26275, "loss": 1.546, "grad_norm": "6.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.516e+00", "anc_loss": "1.628e+00", "dlm_acc": "5.502e-01", "anc_acc": "5.289e-01", "epoch": 0.05255} {"step": 26280, "loss": 1.292, "grad_norm": "5.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.430e-01", "anc_loss": "1.043e+00", "dlm_acc": "6.602e-01", "anc_acc": "6.364e-01", "epoch": 0.05256} {"step": 26285, "loss": 1.7578, "grad_norm": "5.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.241e+00", "dlm_acc": "6.483e-01", "anc_acc": "6.259e-01", "epoch": 0.05257} {"step": 26290, "loss": 1.2433, "grad_norm": "3.563e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.231e+00", "anc_loss": "1.322e+00", "dlm_acc": "5.608e-01", "anc_acc": "5.387e-01", "epoch": 0.05258} {"step": 26295, "loss": 1.5298, "grad_norm": "1.053e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.313e+00", "dlm_acc": "5.819e-01", "anc_acc": "5.591e-01", "epoch": 0.05259} {"step": 26300, "loss": 1.8156, "grad_norm": "3.771e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.922e-01", "anc_acc": "5.587e-01", "epoch": 0.0526} {"step": 26305, "loss": 1.9688, "grad_norm": "4.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.806e+00", "anc_loss": "1.913e+00", "dlm_acc": "4.880e-01", "anc_acc": "4.669e-01", "epoch": 0.05261} {"step": 26310, "loss": 1.5317, "grad_norm": "5.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.276e+00", "dlm_acc": "6.348e-01", "anc_acc": "6.068e-01", "epoch": 0.05262} {"step": 26315, "loss": 1.1028, "grad_norm": "2.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.178e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.546e-01", "anc_acc": "5.275e-01", "epoch": 0.05263} {"step": 26320, "loss": 1.1838, "grad_norm": "2.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.174e+00", "dlm_acc": "6.310e-01", "anc_acc": "5.990e-01", "epoch": 0.05264} {"step": 26325, "loss": 1.2379, "grad_norm": "9.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.268e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.300e-01", "anc_acc": "5.063e-01", "epoch": 0.05265} {"step": 26330, "loss": 1.4636, "grad_norm": "3.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.494e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.339e-01", "epoch": 0.05266} {"step": 26335, "loss": 1.2143, "grad_norm": "2.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.241e+00", "dlm_acc": "5.846e-01", "anc_acc": "5.612e-01", "epoch": 0.05267} {"step": 26340, "loss": 1.1193, "grad_norm": "3.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.262e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.847e-01", "anc_acc": "5.593e-01", "epoch": 0.05268} {"step": 26345, "loss": 1.4502, "grad_norm": "3.541e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.469e+00", "dlm_acc": "5.369e-01", "anc_acc": "5.128e-01", "epoch": 0.05269} {"step": 26350, "loss": 1.1728, "grad_norm": "4.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.329e-01", "epoch": 0.0527} {"step": 26355, "loss": 1.4403, "grad_norm": "1.211e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.410e+00", "dlm_acc": "5.478e-01", "anc_acc": "5.232e-01", "epoch": 0.05271} {"step": 26360, "loss": 1.1399, "grad_norm": "3.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.056e-01", "anc_acc": "4.882e-01", "epoch": 0.05272} {"step": 26365, "loss": 1.5138, "grad_norm": "5.709e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.977e-01", "anc_loss": "8.219e-01", "dlm_acc": "5.181e-01", "anc_acc": "5.070e-01", "epoch": 0.05273} {"step": 26370, "loss": 1.3001, "grad_norm": "2.464e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.436e-01", "anc_acc": "5.235e-01", "epoch": 0.05274} {"step": 26375, "loss": 1.4348, "grad_norm": "3.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.475e+00", "dlm_acc": "5.257e-01", "anc_acc": "5.061e-01", "epoch": 0.05275} {"step": 26380, "loss": 0.9752, "grad_norm": "2.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.803e-01", "anc_loss": "4.129e-01", "dlm_acc": "7.432e-01", "anc_acc": "7.262e-01", "epoch": 0.05276} {"step": 26385, "loss": 1.05, "grad_norm": "3.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.818e-01", "anc_loss": "4.219e-01", "dlm_acc": "7.408e-01", "anc_acc": "7.179e-01", "epoch": 0.05277} {"step": 26390, "loss": 0.9207, "grad_norm": "2.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.900e-01", "anc_loss": "6.438e-01", "dlm_acc": "6.763e-01", "anc_acc": "6.513e-01", "epoch": 0.05278} {"step": 26395, "loss": 1.2046, "grad_norm": "2.110e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.809e+00", "anc_loss": "1.927e+00", "dlm_acc": "4.658e-01", "anc_acc": "4.432e-01", "epoch": 0.05279} {"step": 26400, "loss": 1.232, "grad_norm": "2.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.185e-01", "anc_acc": "4.969e-01", "epoch": 0.0528} {"step": 26405, "loss": 1.1516, "grad_norm": "3.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.748e+00", "anc_loss": "1.861e+00", "dlm_acc": "4.905e-01", "anc_acc": "4.671e-01", "epoch": 0.05281} {"step": 26410, "loss": 1.1032, "grad_norm": "2.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.550e+00", "dlm_acc": "5.095e-01", "anc_acc": "4.877e-01", "epoch": 0.05282} {"step": 26415, "loss": 0.8617, "grad_norm": "1.813e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.816e-01", "anc_acc": "5.566e-01", "epoch": 0.05283} {"step": 26420, "loss": 0.7481, "grad_norm": "3.207e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.289e-01", "anc_loss": "1.030e+00", "dlm_acc": "6.565e-01", "anc_acc": "6.290e-01", "epoch": 0.05284} {"step": 26425, "loss": 1.0461, "grad_norm": "2.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.018e+00", "anc_loss": "1.134e+00", "dlm_acc": "6.359e-01", "anc_acc": "6.101e-01", "epoch": 0.05285} {"step": 26430, "loss": 1.4773, "grad_norm": "3.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.570e+00", "anc_loss": "1.682e+00", "dlm_acc": "5.224e-01", "anc_acc": "5.005e-01", "epoch": 0.05286} {"step": 26435, "loss": 1.0904, "grad_norm": "4.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.707e-01", "anc_loss": "1.067e+00", "dlm_acc": "6.880e-01", "anc_acc": "6.664e-01", "epoch": 0.05287} {"step": 26440, "loss": 1.5441, "grad_norm": "4.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.610e+00", "dlm_acc": "5.510e-01", "anc_acc": "5.260e-01", "epoch": 0.05288} {"step": 26445, "loss": 1.2089, "grad_norm": "1.155e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.822e-01", "anc_acc": "5.552e-01", "epoch": 0.05289} {"step": 26450, "loss": 1.6083, "grad_norm": "3.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.273e-01", "anc_acc": "5.065e-01", "epoch": 0.0529} {"step": 26455, "loss": 0.9404, "grad_norm": "2.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.367e-01", "anc_loss": "1.027e+00", "dlm_acc": "6.291e-01", "anc_acc": "6.068e-01", "epoch": 0.05291} {"step": 26460, "loss": 1.3957, "grad_norm": "5.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.570e+00", "anc_loss": "1.698e+00", "dlm_acc": "5.041e-01", "anc_acc": "4.753e-01", "epoch": 0.05292} {"step": 26465, "loss": 1.7842, "grad_norm": "7.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.489e+00", "anc_loss": "1.606e+00", "dlm_acc": "5.282e-01", "anc_acc": "5.018e-01", "epoch": 0.05293} {"step": 26470, "loss": 1.2367, "grad_norm": "5.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.725e-01", "anc_acc": "5.468e-01", "epoch": 0.05294} {"step": 26475, "loss": 1.2675, "grad_norm": "4.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.417e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.357e-01", "anc_acc": "5.113e-01", "epoch": 0.05295} {"step": 26480, "loss": 0.8492, "grad_norm": "2.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.918e-01", "anc_loss": "9.758e-01", "dlm_acc": "6.468e-01", "anc_acc": "6.251e-01", "epoch": 0.05296} {"step": 26485, "loss": 1.2613, "grad_norm": "2.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.814e+00", "anc_loss": "1.923e+00", "dlm_acc": "4.440e-01", "anc_acc": "4.241e-01", "epoch": 0.05297} {"step": 26490, "loss": 1.3621, "grad_norm": "3.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.667e+00", "anc_loss": "1.784e+00", "dlm_acc": "4.860e-01", "anc_acc": "4.624e-01", "epoch": 0.05298} {"step": 26495, "loss": 1.0545, "grad_norm": "3.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.149e+00", "dlm_acc": "5.970e-01", "anc_acc": "5.674e-01", "epoch": 0.05299} {"step": 26500, "loss": 1.1434, "grad_norm": "2.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.086e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.454e-01", "anc_acc": "6.097e-01", "epoch": 0.053} {"step": 26505, "loss": 1.1465, "grad_norm": "1.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.583e+00", "anc_loss": "1.661e+00", "dlm_acc": "4.417e-01", "anc_acc": "4.212e-01", "epoch": 0.05301} {"step": 26510, "loss": 1.3974, "grad_norm": "3.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.977e+00", "anc_loss": "2.089e+00", "dlm_acc": "3.527e-01", "anc_acc": "3.239e-01", "epoch": 0.05302} {"step": 26515, "loss": 1.2661, "grad_norm": "4.245e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.644e+00", "dlm_acc": "5.050e-01", "anc_acc": "4.833e-01", "epoch": 0.05303} {"step": 26520, "loss": 1.1567, "grad_norm": "2.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.137e+00", "dlm_acc": "6.086e-01", "anc_acc": "5.846e-01", "epoch": 0.05304} {"step": 26525, "loss": 1.3469, "grad_norm": "2.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.728e+00", "dlm_acc": "5.053e-01", "anc_acc": "4.837e-01", "epoch": 0.05305} {"step": 26530, "loss": 1.0687, "grad_norm": "3.050e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.812e-01", "anc_loss": "1.087e+00", "dlm_acc": "5.925e-01", "anc_acc": "5.604e-01", "epoch": 0.05306} {"step": 26535, "loss": 1.0194, "grad_norm": "3.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.035e-01", "anc_loss": "8.871e-01", "dlm_acc": "6.564e-01", "anc_acc": "6.320e-01", "epoch": 0.05307} {"step": 26540, "loss": 0.8897, "grad_norm": "4.280e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.942e-01", "anc_acc": "5.640e-01", "epoch": 0.05308} {"step": 26545, "loss": 0.8852, "grad_norm": "2.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.253e+00", "dlm_acc": "5.543e-01", "anc_acc": "5.265e-01", "epoch": 0.05309} {"step": 26550, "loss": 0.9142, "grad_norm": "2.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.178e+00", "anc_loss": "1.232e+00", "dlm_acc": "5.030e-01", "anc_acc": "4.824e-01", "epoch": 0.0531} {"step": 26555, "loss": 1.4341, "grad_norm": "2.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.776e+00", "anc_loss": "1.897e+00", "dlm_acc": "3.583e-01", "anc_acc": "3.270e-01", "epoch": 0.05311} {"step": 26560, "loss": 1.3242, "grad_norm": "3.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.798e+00", "anc_loss": "1.961e+00", "dlm_acc": "3.710e-01", "anc_acc": "3.326e-01", "epoch": 0.05312} {"step": 26565, "loss": 1.0258, "grad_norm": "3.938e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.192e+00", "dlm_acc": "6.127e-01", "anc_acc": "5.896e-01", "epoch": 0.05313} {"step": 26570, "loss": 1.1654, "grad_norm": "4.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.323e+00", "dlm_acc": "5.751e-01", "anc_acc": "5.515e-01", "epoch": 0.05314} {"step": 26575, "loss": 1.0647, "grad_norm": "3.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.586e-01", "anc_loss": "9.563e-01", "dlm_acc": "6.397e-01", "anc_acc": "6.102e-01", "epoch": 0.05315} {"step": 26580, "loss": 1.0996, "grad_norm": "4.187e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.474e+00", "anc_loss": "1.523e+00", "dlm_acc": "3.333e-01", "anc_acc": "3.125e-01", "epoch": 0.05316} {"step": 26585, "loss": 1.2624, "grad_norm": "4.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.255e+00", "anc_loss": "1.335e+00", "dlm_acc": "5.684e-01", "anc_acc": "5.485e-01", "epoch": 0.05317} {"step": 26590, "loss": 1.0402, "grad_norm": "5.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.331e+00", "dlm_acc": "4.741e-01", "anc_acc": "4.559e-01", "epoch": 0.05318} {"step": 26595, "loss": 0.9772, "grad_norm": "6.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.625e-01", "anc_loss": "1.040e+00", "dlm_acc": "5.939e-01", "anc_acc": "5.753e-01", "epoch": 0.05319} {"step": 26600, "loss": 1.0235, "grad_norm": "5.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.197e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.718e-01", "anc_acc": "5.283e-01", "epoch": 0.0532} {"step": 26605, "loss": 1.0176, "grad_norm": "2.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.012e-01", "anc_loss": "6.730e-01", "dlm_acc": "7.276e-01", "anc_acc": "7.014e-01", "epoch": 0.05321} {"step": 26610, "loss": 0.8896, "grad_norm": "3.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.301e+00", "dlm_acc": "5.284e-01", "anc_acc": "5.090e-01", "epoch": 0.05322} {"step": 26615, "loss": 0.8317, "grad_norm": "2.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.084e-01", "anc_loss": "9.270e-01", "dlm_acc": "6.842e-01", "anc_acc": "6.423e-01", "epoch": 0.05323} {"step": 26620, "loss": 1.0324, "grad_norm": "5.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.424e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.348e-01", "anc_acc": "5.004e-01", "epoch": 0.05324} {"step": 26625, "loss": 1.1121, "grad_norm": "3.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.284e+00", "dlm_acc": "5.035e-01", "anc_acc": "4.886e-01", "epoch": 0.05325} {"step": 26630, "loss": 1.2864, "grad_norm": "3.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.272e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.423e-01", "epoch": 0.05326} {"step": 26635, "loss": 0.9966, "grad_norm": "3.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.359e-01", "anc_loss": "7.125e-01", "dlm_acc": "7.059e-01", "anc_acc": "6.800e-01", "epoch": 0.05327} {"step": 26640, "loss": 1.101, "grad_norm": "4.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.110e+00", "dlm_acc": "5.717e-01", "anc_acc": "5.510e-01", "epoch": 0.05328} {"step": 26645, "loss": 1.4263, "grad_norm": "3.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.965e+00", "anc_loss": "2.061e+00", "dlm_acc": "3.799e-01", "anc_acc": "3.648e-01", "epoch": 0.05329} {"step": 26650, "loss": 1.5548, "grad_norm": "3.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.586e+00", "anc_loss": "1.673e+00", "dlm_acc": "4.079e-01", "anc_acc": "3.872e-01", "epoch": 0.0533} {"step": 26655, "loss": 1.0475, "grad_norm": "1.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.216e+00", "dlm_acc": "5.898e-01", "anc_acc": "5.736e-01", "epoch": 0.05331} {"step": 26660, "loss": 1.1734, "grad_norm": "3.672e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.643e-01", "anc_loss": "1.072e+00", "dlm_acc": "6.617e-01", "anc_acc": "6.312e-01", "epoch": 0.05332} {"step": 26665, "loss": 1.2679, "grad_norm": "4.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.511e-01", "anc_acc": "5.240e-01", "epoch": 0.05333} {"step": 26670, "loss": 1.3389, "grad_norm": "3.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.483e+00", "anc_loss": "1.580e+00", "dlm_acc": "4.899e-01", "anc_acc": "4.692e-01", "epoch": 0.05334} {"step": 26675, "loss": 1.1682, "grad_norm": "2.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.594e+00", "anc_loss": "1.691e+00", "dlm_acc": "4.900e-01", "anc_acc": "4.674e-01", "epoch": 0.05335} {"step": 26680, "loss": 1.2689, "grad_norm": "3.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.542e+00", "anc_loss": "1.630e+00", "dlm_acc": "4.867e-01", "anc_acc": "4.679e-01", "epoch": 0.05336} {"step": 26685, "loss": 1.1944, "grad_norm": "2.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.509e+00", "anc_loss": "1.607e+00", "dlm_acc": "5.151e-01", "anc_acc": "4.935e-01", "epoch": 0.05337} {"step": 26690, "loss": 1.2838, "grad_norm": "6.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.534e-01", "anc_acc": "5.336e-01", "epoch": 0.05338} {"step": 26695, "loss": 1.3316, "grad_norm": "3.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.360e+00", "anc_loss": "1.476e+00", "dlm_acc": "5.470e-01", "anc_acc": "5.262e-01", "epoch": 0.05339} {"step": 26700, "loss": 0.8844, "grad_norm": "3.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.121e-01", "anc_loss": "8.826e-01", "dlm_acc": "6.409e-01", "anc_acc": "6.166e-01", "epoch": 0.0534} {"step": 26705, "loss": 1.0209, "grad_norm": "5.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.849e-01", "anc_loss": "9.504e-01", "dlm_acc": "6.770e-01", "anc_acc": "6.600e-01", "epoch": 0.05341} {"step": 26710, "loss": 1.0957, "grad_norm": "3.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.177e-01", "anc_loss": "5.300e-01", "dlm_acc": "6.348e-01", "anc_acc": "6.273e-01", "epoch": 0.05342} {"step": 26715, "loss": 1.3069, "grad_norm": "4.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.534e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.396e-01", "anc_acc": "5.150e-01", "epoch": 0.05343} {"step": 26720, "loss": 1.1994, "grad_norm": "3.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.325e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.262e-01", "anc_acc": "5.050e-01", "epoch": 0.05344} {"step": 26725, "loss": 1.2668, "grad_norm": "3.712e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.681e+00", "anc_loss": "1.803e+00", "dlm_acc": "4.842e-01", "anc_acc": "4.601e-01", "epoch": 0.05345} {"step": 26730, "loss": 1.2384, "grad_norm": "3.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.516e+00", "anc_loss": "1.619e+00", "dlm_acc": "4.982e-01", "anc_acc": "4.759e-01", "epoch": 0.05346} {"step": 26735, "loss": 1.1691, "grad_norm": "2.791e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.422e-01", "anc_acc": "5.172e-01", "epoch": 0.05347} {"step": 26740, "loss": 0.8705, "grad_norm": "2.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.232e+00", "dlm_acc": "5.714e-01", "anc_acc": "5.457e-01", "epoch": 0.05348} {"step": 26745, "loss": 1.1851, "grad_norm": "6.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.017e+00", "anc_loss": "1.098e+00", "dlm_acc": "6.382e-01", "anc_acc": "6.170e-01", "epoch": 0.05349} {"step": 26750, "loss": 1.5903, "grad_norm": "4.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.764e+00", "anc_loss": "1.880e+00", "dlm_acc": "4.650e-01", "anc_acc": "4.425e-01", "epoch": 0.0535} {"step": 26755, "loss": 1.019, "grad_norm": "2.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.024e+00", "anc_loss": "1.101e+00", "dlm_acc": "6.513e-01", "anc_acc": "6.312e-01", "epoch": 0.05351} {"step": 26760, "loss": 1.6856, "grad_norm": "8.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.850e-01", "anc_loss": "3.172e-01", "dlm_acc": "8.503e-01", "anc_acc": "8.381e-01", "epoch": 0.05352} {"step": 26765, "loss": 1.1078, "grad_norm": "8.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e-01", "anc_loss": "1.325e-01", "dlm_acc": "9.244e-01", "anc_acc": "9.174e-01", "epoch": 0.05353} {"step": 26770, "loss": 1.2163, "grad_norm": "4.648e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.354e-01", "anc_loss": "3.679e-01", "dlm_acc": "8.738e-01", "anc_acc": "8.640e-01", "epoch": 0.05354} {"step": 26775, "loss": 0.9832, "grad_norm": "5.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.764e-01", "anc_loss": "1.955e-01", "dlm_acc": "8.982e-01", "anc_acc": "8.898e-01", "epoch": 0.05355} {"step": 26780, "loss": 1.0237, "grad_norm": "1.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e-01", "anc_loss": "1.446e-01", "dlm_acc": "9.116e-01", "anc_acc": "9.058e-01", "epoch": 0.05356} {"step": 26785, "loss": 0.8297, "grad_norm": "2.785e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.241e-02", "anc_loss": "1.042e-01", "dlm_acc": "9.322e-01", "anc_acc": "9.264e-01", "epoch": 0.05357} {"step": 26790, "loss": 0.9059, "grad_norm": "3.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.267e-02", "anc_loss": "9.463e-02", "dlm_acc": "9.427e-01", "anc_acc": "9.369e-01", "epoch": 0.05358} {"step": 26795, "loss": 0.7556, "grad_norm": "2.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.760e-01", "anc_loss": "1.988e-01", "dlm_acc": "8.949e-01", "anc_acc": "8.842e-01", "epoch": 0.05359} {"step": 26800, "loss": 1.1051, "grad_norm": "2.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.375e-01", "anc_loss": "1.031e+00", "dlm_acc": "6.234e-01", "anc_acc": "5.984e-01", "epoch": 0.0536} {"step": 26805, "loss": 1.1298, "grad_norm": "3.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.393e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.424e-01", "anc_acc": "6.222e-01", "epoch": 0.05361} {"step": 26810, "loss": 1.6265, "grad_norm": "3.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.979e-01", "anc_loss": "8.539e-01", "dlm_acc": "6.575e-01", "anc_acc": "6.369e-01", "epoch": 0.05362} {"step": 26815, "loss": 1.036, "grad_norm": "3.158e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.745e-01", "anc_loss": "5.181e-01", "dlm_acc": "7.745e-01", "anc_acc": "7.555e-01", "epoch": 0.05363} {"step": 26820, "loss": 1.0407, "grad_norm": "1.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.784e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.184e-01", "anc_acc": "5.930e-01", "epoch": 0.05364} {"step": 26825, "loss": 1.6292, "grad_norm": "5.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.359e+00", "dlm_acc": "6.298e-01", "anc_acc": "6.026e-01", "epoch": 0.05365} {"step": 26830, "loss": 1.1257, "grad_norm": "6.461e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.480e-01", "anc_loss": "8.479e-01", "dlm_acc": "7.352e-01", "anc_acc": "7.117e-01", "epoch": 0.05366} {"step": 26835, "loss": 1.3133, "grad_norm": "3.408e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.770e-01", "anc_loss": "6.262e-01", "dlm_acc": "7.495e-01", "anc_acc": "7.339e-01", "epoch": 0.05367} {"step": 26840, "loss": 1.3515, "grad_norm": "3.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.949e-01", "anc_loss": "9.492e-01", "dlm_acc": "6.123e-01", "anc_acc": "5.986e-01", "epoch": 0.05368} {"step": 26845, "loss": 0.9402, "grad_norm": "3.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.523e-01", "anc_loss": "6.842e-01", "dlm_acc": "6.465e-01", "anc_acc": "6.366e-01", "epoch": 0.05369} {"step": 26850, "loss": 0.9407, "grad_norm": "5.050e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.961e-01", "anc_loss": "1.062e+00", "dlm_acc": "5.569e-01", "anc_acc": "5.393e-01", "epoch": 0.0537} {"step": 26855, "loss": 0.9181, "grad_norm": "3.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.891e-01", "anc_loss": "6.898e-01", "dlm_acc": "7.435e-01", "anc_acc": "7.128e-01", "epoch": 0.05371} {"step": 26860, "loss": 1.0017, "grad_norm": "2.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.929e-01", "anc_loss": "6.498e-01", "dlm_acc": "7.792e-01", "anc_acc": "7.623e-01", "epoch": 0.05372} {"step": 26865, "loss": 1.2109, "grad_norm": "2.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.656e-01", "anc_loss": "8.055e-01", "dlm_acc": "5.420e-01", "anc_acc": "5.248e-01", "epoch": 0.05373} {"step": 26870, "loss": 1.0473, "grad_norm": "3.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.180e-01", "anc_loss": "5.496e-01", "dlm_acc": "5.973e-01", "anc_acc": "5.726e-01", "epoch": 0.05374} {"step": 26875, "loss": 1.0171, "grad_norm": "4.856e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.797e-01", "anc_loss": "8.219e-01", "dlm_acc": "5.204e-01", "anc_acc": "5.071e-01", "epoch": 0.05375} {"step": 26880, "loss": 1.1247, "grad_norm": "3.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.289e+00", "dlm_acc": "5.895e-01", "anc_acc": "5.688e-01", "epoch": 0.05376} {"step": 26885, "loss": 1.1471, "grad_norm": "4.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.940e-01", "anc_loss": "3.105e-01", "dlm_acc": "8.391e-01", "anc_acc": "8.342e-01", "epoch": 0.05377} {"step": 26890, "loss": 1.5346, "grad_norm": "2.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.414e-01", "anc_loss": "9.166e-01", "dlm_acc": "6.945e-01", "anc_acc": "6.754e-01", "epoch": 0.05378} {"step": 26895, "loss": 1.3053, "grad_norm": "3.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.527e-01", "anc_loss": "8.230e-01", "dlm_acc": "7.101e-01", "anc_acc": "6.871e-01", "epoch": 0.05379} {"step": 26900, "loss": 1.2677, "grad_norm": "3.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.127e-01", "anc_loss": "7.740e-01", "dlm_acc": "7.305e-01", "anc_acc": "7.189e-01", "epoch": 0.0538} {"step": 26905, "loss": 1.238, "grad_norm": "3.210e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.180e+00", "dlm_acc": "6.125e-01", "anc_acc": "5.927e-01", "epoch": 0.05381} {"step": 26910, "loss": 0.7506, "grad_norm": "2.830e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.934e-01", "anc_loss": "5.336e-01", "dlm_acc": "6.858e-01", "anc_acc": "6.698e-01", "epoch": 0.05382} {"step": 26915, "loss": 1.258, "grad_norm": "4.351e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.395e-01", "anc_loss": "7.875e-01", "dlm_acc": "6.111e-01", "anc_acc": "5.931e-01", "epoch": 0.05383} {"step": 26920, "loss": 1.0758, "grad_norm": "3.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.096e-01", "anc_loss": "8.688e-01", "dlm_acc": "6.992e-01", "anc_acc": "6.865e-01", "epoch": 0.05384} {"step": 26925, "loss": 1.1484, "grad_norm": "2.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.114e+00", "dlm_acc": "5.934e-01", "anc_acc": "5.717e-01", "epoch": 0.05385} {"step": 26930, "loss": 1.3385, "grad_norm": "4.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.301e-01", "anc_loss": "5.778e-01", "dlm_acc": "7.887e-01", "anc_acc": "7.750e-01", "epoch": 0.05386} {"step": 26935, "loss": 1.2626, "grad_norm": "2.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.304e-01", "anc_loss": "7.860e-01", "dlm_acc": "6.724e-01", "anc_acc": "6.586e-01", "epoch": 0.05387} {"step": 26940, "loss": 1.0657, "grad_norm": "2.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.754e-01", "anc_loss": "5.133e-01", "dlm_acc": "7.504e-01", "anc_acc": "7.386e-01", "epoch": 0.05388} {"step": 26945, "loss": 1.0379, "grad_norm": "2.749e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.799e-01", "anc_loss": "6.441e-01", "dlm_acc": "7.686e-01", "anc_acc": "7.467e-01", "epoch": 0.05389} {"step": 26950, "loss": 1.3983, "grad_norm": "9.418e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.186e+00", "anc_loss": "1.310e+00", "dlm_acc": "6.248e-01", "anc_acc": "5.946e-01", "epoch": 0.0539} {"step": 26955, "loss": 0.9611, "grad_norm": "3.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.041e+00", "anc_loss": "1.121e+00", "dlm_acc": "5.670e-01", "anc_acc": "5.488e-01", "epoch": 0.05391} {"step": 26960, "loss": 0.8523, "grad_norm": "1.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.790e-01", "anc_loss": "5.066e-01", "dlm_acc": "8.368e-01", "anc_acc": "8.308e-01", "epoch": 0.05392} {"step": 26965, "loss": 0.9151, "grad_norm": "5.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e-01", "anc_loss": "1.792e-01", "dlm_acc": "8.839e-01", "anc_acc": "8.768e-01", "epoch": 0.05393} {"step": 26970, "loss": 0.8573, "grad_norm": "5.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.030e-01", "anc_loss": "7.753e-01", "dlm_acc": "7.524e-01", "anc_acc": "7.339e-01", "epoch": 0.05394} {"step": 26975, "loss": 0.6659, "grad_norm": "3.085e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.828e-01", "anc_loss": "6.203e-01", "dlm_acc": "6.509e-01", "anc_acc": "6.434e-01", "epoch": 0.05395} {"step": 26980, "loss": 1.096, "grad_norm": "5.088e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.090e-01", "anc_loss": "9.840e-01", "dlm_acc": "6.638e-01", "anc_acc": "6.452e-01", "epoch": 0.05396} {"step": 26985, "loss": 0.9499, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.254e-01", "anc_loss": "9.109e-01", "dlm_acc": "7.008e-01", "anc_acc": "6.810e-01", "epoch": 0.05397} {"step": 26990, "loss": 1.4143, "grad_norm": "2.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.154e-01", "anc_acc": "4.941e-01", "epoch": 0.05398} {"step": 26995, "loss": 0.9733, "grad_norm": "2.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.091e-01", "anc_acc": "5.878e-01", "epoch": 0.05399} {"step": 27000, "loss": 1.0632, "grad_norm": "2.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.369e+00", "dlm_acc": "6.137e-01", "anc_acc": "5.925e-01", "epoch": 0.054} {"step": 27005, "loss": 0.6444, "grad_norm": "1.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.978e-01", "anc_loss": "5.518e-01", "dlm_acc": "7.560e-01", "anc_acc": "7.381e-01", "epoch": 0.05401} {"step": 27010, "loss": 1.2979, "grad_norm": "8.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e-01", "anc_loss": "1.277e-01", "dlm_acc": "9.336e-01", "anc_acc": "9.310e-01", "epoch": 0.05402} {"step": 27015, "loss": 1.084, "grad_norm": "3.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.496e-01", "anc_loss": "4.919e-01", "dlm_acc": "8.344e-01", "anc_acc": "8.229e-01", "epoch": 0.05403} {"step": 27020, "loss": 1.2074, "grad_norm": "4.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.844e-01", "anc_loss": "9.375e-01", "dlm_acc": "6.073e-01", "anc_acc": "5.914e-01", "epoch": 0.05404} {"step": 27025, "loss": 1.0736, "grad_norm": "3.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.099e+00", "dlm_acc": "5.922e-01", "anc_acc": "5.730e-01", "epoch": 0.05405} {"step": 27030, "loss": 1.5595, "grad_norm": "4.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.104e+00", "anc_loss": "1.170e+00", "dlm_acc": "4.764e-01", "anc_acc": "4.598e-01", "epoch": 0.05406} {"step": 27035, "loss": 0.9312, "grad_norm": "4.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.469e-01", "anc_loss": "5.773e-01", "dlm_acc": "6.331e-01", "anc_acc": "6.205e-01", "epoch": 0.05407} {"step": 27040, "loss": 1.0356, "grad_norm": "3.222e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.457e-01", "anc_loss": "9.277e-01", "dlm_acc": "6.592e-01", "anc_acc": "6.355e-01", "epoch": 0.05408} {"step": 27045, "loss": 0.9472, "grad_norm": "3.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.844e-01", "anc_loss": "9.488e-01", "dlm_acc": "5.833e-01", "anc_acc": "5.579e-01", "epoch": 0.05409} {"step": 27050, "loss": 0.9441, "grad_norm": "2.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.193e+00", "dlm_acc": "5.832e-01", "anc_acc": "5.600e-01", "epoch": 0.0541} {"step": 27055, "loss": 1.364, "grad_norm": "4.003e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.602e+00", "dlm_acc": "4.920e-01", "anc_acc": "4.717e-01", "epoch": 0.05411} {"step": 27060, "loss": 1.4647, "grad_norm": "2.648e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.398e+00", "dlm_acc": "6.200e-01", "anc_acc": "6.016e-01", "epoch": 0.05412} {"step": 27065, "loss": 1.1985, "grad_norm": "2.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.198e+00", "dlm_acc": "6.334e-01", "anc_acc": "6.115e-01", "epoch": 0.05413} {"step": 27070, "loss": 1.0384, "grad_norm": "2.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.434e-01", "anc_loss": "6.883e-01", "dlm_acc": "6.456e-01", "anc_acc": "6.343e-01", "epoch": 0.05414} {"step": 27075, "loss": 1.4154, "grad_norm": "3.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.175e+00", "dlm_acc": "6.426e-01", "anc_acc": "6.254e-01", "epoch": 0.05415} {"step": 27080, "loss": 1.1562, "grad_norm": "5.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.098e-01", "anc_loss": "9.750e-01", "dlm_acc": "6.076e-01", "anc_acc": "5.855e-01", "epoch": 0.05416} {"step": 27085, "loss": 1.3247, "grad_norm": "9.271e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.332e-01", "anc_loss": "6.516e-01", "dlm_acc": "5.566e-01", "anc_acc": "5.434e-01", "epoch": 0.05417} {"step": 27090, "loss": 1.3382, "grad_norm": "5.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.082e+00", "dlm_acc": "5.641e-01", "anc_acc": "5.399e-01", "epoch": 0.05418} {"step": 27095, "loss": 0.8305, "grad_norm": "1.189e+00", "learning_rate": "1.000e-04", "dlm_loss": "5.046e-01", "anc_loss": "5.701e-01", "dlm_acc": "7.233e-01", "anc_acc": "7.032e-01", "epoch": 0.05419} {"step": 27100, "loss": 0.9254, "grad_norm": "4.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.082e-01", "anc_loss": "3.566e-01", "dlm_acc": "8.374e-01", "anc_acc": "8.166e-01", "epoch": 0.0542} {"step": 27105, "loss": 0.8876, "grad_norm": "2.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.836e-01", "anc_loss": "8.676e-01", "dlm_acc": "6.540e-01", "anc_acc": "6.270e-01", "epoch": 0.05421} {"step": 27110, "loss": 1.2251, "grad_norm": "2.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.414e+00", "dlm_acc": "5.459e-01", "anc_acc": "5.236e-01", "epoch": 0.05422} {"step": 27115, "loss": 1.5469, "grad_norm": "3.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.608e-01", "anc_acc": "5.411e-01", "epoch": 0.05423} {"step": 27120, "loss": 1.0109, "grad_norm": "1.836e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.273e-01", "anc_loss": "8.865e-01", "dlm_acc": "6.345e-01", "anc_acc": "6.174e-01", "epoch": 0.05424} {"step": 27125, "loss": 0.8745, "grad_norm": "3.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.322e-01", "anc_loss": "8.203e-01", "dlm_acc": "6.649e-01", "anc_acc": "6.399e-01", "epoch": 0.05425} {"step": 27130, "loss": 1.4828, "grad_norm": "2.485e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.750e-01", "anc_loss": "8.336e-01", "dlm_acc": "6.276e-01", "anc_acc": "6.092e-01", "epoch": 0.05426} {"step": 27135, "loss": 1.4247, "grad_norm": "8.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.468e+00", "dlm_acc": "5.022e-01", "anc_acc": "4.712e-01", "epoch": 0.05427} {"step": 27140, "loss": 0.9024, "grad_norm": "2.685e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.725e-01", "anc_loss": "4.087e-01", "dlm_acc": "7.463e-01", "anc_acc": "7.286e-01", "epoch": 0.05428} {"step": 27145, "loss": 1.0701, "grad_norm": "3.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.652e-01", "anc_loss": "1.021e+00", "dlm_acc": "5.575e-01", "anc_acc": "5.373e-01", "epoch": 0.05429} {"step": 27150, "loss": 1.6843, "grad_norm": "4.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.496e+00", "anc_loss": "1.591e+00", "dlm_acc": "5.387e-01", "anc_acc": "5.176e-01", "epoch": 0.0543} {"step": 27155, "loss": 1.2714, "grad_norm": "2.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.261e+00", "dlm_acc": "4.947e-01", "anc_acc": "4.721e-01", "epoch": 0.05431} {"step": 27160, "loss": 1.0505, "grad_norm": "2.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.703e-01", "anc_loss": "8.117e-01", "dlm_acc": "4.087e-01", "anc_acc": "3.809e-01", "epoch": 0.05432} {"step": 27165, "loss": 1.3453, "grad_norm": "3.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.305e-01", "anc_loss": "8.820e-01", "dlm_acc": "4.226e-01", "anc_acc": "3.897e-01", "epoch": 0.05433} {"step": 27170, "loss": 1.2509, "grad_norm": "2.782e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.094e-01", "anc_loss": "8.609e-01", "dlm_acc": "4.426e-01", "anc_acc": "4.093e-01", "epoch": 0.05434} {"step": 27175, "loss": 1.2121, "grad_norm": "8.183e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.156e-01", "anc_loss": "7.633e-01", "dlm_acc": "4.392e-01", "anc_acc": "4.062e-01", "epoch": 0.05435} {"step": 27180, "loss": 1.3658, "grad_norm": "4.273e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.194e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.800e-01", "epoch": 0.05436} {"step": 27185, "loss": 1.3807, "grad_norm": "3.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.216e+00", "dlm_acc": "6.350e-01", "anc_acc": "6.161e-01", "epoch": 0.05437} {"step": 27190, "loss": 1.1316, "grad_norm": "2.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.821e-01", "anc_loss": "3.125e-01", "dlm_acc": "8.128e-01", "anc_acc": "7.958e-01", "epoch": 0.05438} {"step": 27195, "loss": 0.8855, "grad_norm": "1.649e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.501e-01", "anc_loss": "2.793e-01", "dlm_acc": "8.337e-01", "anc_acc": "8.156e-01", "epoch": 0.05439} {"step": 27200, "loss": 1.3598, "grad_norm": "3.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.752e-01", "anc_loss": "4.015e-01", "dlm_acc": "7.982e-01", "anc_acc": "7.863e-01", "epoch": 0.0544} {"step": 27205, "loss": 1.0681, "grad_norm": "2.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.566e-01", "anc_loss": "6.594e-01", "dlm_acc": "5.691e-01", "anc_acc": "5.666e-01", "epoch": 0.05441} {"step": 27210, "loss": 1.4491, "grad_norm": "3.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.023e-01", "anc_loss": "8.094e-01", "dlm_acc": "5.424e-01", "anc_acc": "5.394e-01", "epoch": 0.05442} {"step": 27215, "loss": 1.3605, "grad_norm": "4.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.266e-01", "anc_loss": "7.336e-01", "dlm_acc": "5.621e-01", "anc_acc": "5.596e-01", "epoch": 0.05443} {"step": 27220, "loss": 1.3009, "grad_norm": "3.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.633e-01", "anc_loss": "9.008e-01", "dlm_acc": "5.982e-01", "anc_acc": "5.903e-01", "epoch": 0.05444} {"step": 27225, "loss": 1.33, "grad_norm": "2.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.132e+00", "dlm_acc": "6.556e-01", "anc_acc": "6.342e-01", "epoch": 0.05445} {"step": 27230, "loss": 1.1434, "grad_norm": "4.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.279e-01", "anc_loss": "6.777e-01", "dlm_acc": "6.745e-01", "anc_acc": "6.518e-01", "epoch": 0.05446} {"step": 27235, "loss": 1.4977, "grad_norm": "3.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e+00", "anc_loss": "1.198e+00", "dlm_acc": "4.288e-01", "anc_acc": "4.123e-01", "epoch": 0.05447} {"step": 27240, "loss": 1.2543, "grad_norm": "2.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.179e+00", "dlm_acc": "4.962e-01", "anc_acc": "4.759e-01", "epoch": 0.05448} {"step": 27245, "loss": 1.123, "grad_norm": "7.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.427e-01", "anc_acc": "5.174e-01", "epoch": 0.05449} {"step": 27250, "loss": 1.2433, "grad_norm": "2.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.716e+00", "dlm_acc": "5.028e-01", "anc_acc": "4.781e-01", "epoch": 0.0545} {"step": 27255, "loss": 1.2687, "grad_norm": "2.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.216e-01", "anc_acc": "4.996e-01", "epoch": 0.05451} {"step": 27260, "loss": 1.1464, "grad_norm": "4.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.214e+00", "dlm_acc": "6.115e-01", "anc_acc": "5.828e-01", "epoch": 0.05452} {"step": 27265, "loss": 1.5284, "grad_norm": "2.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.561e+00", "dlm_acc": "5.428e-01", "anc_acc": "5.167e-01", "epoch": 0.05453} {"step": 27270, "loss": 1.4928, "grad_norm": "2.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.356e+00", "dlm_acc": "5.821e-01", "anc_acc": "5.573e-01", "epoch": 0.05454} {"step": 27275, "loss": 1.7601, "grad_norm": "2.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.684e+00", "anc_loss": "1.795e+00", "dlm_acc": "4.851e-01", "anc_acc": "4.606e-01", "epoch": 0.05455} {"step": 27280, "loss": 1.1997, "grad_norm": "2.834e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.793e-01", "anc_loss": "1.091e+00", "dlm_acc": "6.430e-01", "anc_acc": "6.132e-01", "epoch": 0.05456} {"step": 27285, "loss": 1.3369, "grad_norm": "3.191e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.812e-01", "anc_loss": "1.087e+00", "dlm_acc": "6.527e-01", "anc_acc": "6.286e-01", "epoch": 0.05457} {"step": 27290, "loss": 1.4713, "grad_norm": "3.276e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.472e+00", "dlm_acc": "5.553e-01", "anc_acc": "5.297e-01", "epoch": 0.05458} {"step": 27295, "loss": 1.0291, "grad_norm": "2.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.437e-01", "anc_loss": "1.040e+00", "dlm_acc": "6.532e-01", "anc_acc": "6.289e-01", "epoch": 0.05459} {"step": 27300, "loss": 1.7195, "grad_norm": "3.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.523e+00", "dlm_acc": "5.563e-01", "anc_acc": "5.340e-01", "epoch": 0.0546} {"step": 27305, "loss": 1.5414, "grad_norm": "3.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.408e-01", "anc_acc": "5.149e-01", "epoch": 0.05461} {"step": 27310, "loss": 1.7095, "grad_norm": "3.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.644e-01", "anc_acc": "5.382e-01", "epoch": 0.05462} {"step": 27315, "loss": 1.251, "grad_norm": "3.179e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.617e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.210e-01", "anc_acc": "5.929e-01", "epoch": 0.05463} {"step": 27320, "loss": 1.7324, "grad_norm": "2.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.541e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.099e-01", "anc_acc": "4.877e-01", "epoch": 0.05464} {"step": 27325, "loss": 1.3552, "grad_norm": "3.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.245e+00", "dlm_acc": "5.830e-01", "anc_acc": "5.591e-01", "epoch": 0.05465} {"step": 27330, "loss": 1.5682, "grad_norm": "4.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.336e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.726e-01", "anc_acc": "5.441e-01", "epoch": 0.05466} {"step": 27335, "loss": 1.7131, "grad_norm": "4.328e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.663e+00", "anc_loss": "1.795e+00", "dlm_acc": "4.989e-01", "anc_acc": "4.734e-01", "epoch": 0.05467} {"step": 27340, "loss": 1.6036, "grad_norm": "4.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.672e+00", "dlm_acc": "5.109e-01", "anc_acc": "4.868e-01", "epoch": 0.05468} {"step": 27345, "loss": 1.1492, "grad_norm": "3.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.171e+00", "dlm_acc": "6.036e-01", "anc_acc": "5.798e-01", "epoch": 0.05469} {"step": 27350, "loss": 1.0442, "grad_norm": "3.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.297e-01", "anc_acc": "5.065e-01", "epoch": 0.0547} {"step": 27355, "loss": 1.4066, "grad_norm": "4.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.531e+00", "anc_loss": "1.659e+00", "dlm_acc": "5.444e-01", "anc_acc": "5.178e-01", "epoch": 0.05471} {"step": 27360, "loss": 1.1292, "grad_norm": "2.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.531e+00", "anc_loss": "1.653e+00", "dlm_acc": "5.284e-01", "anc_acc": "5.046e-01", "epoch": 0.05472} {"step": 27365, "loss": 1.0896, "grad_norm": "2.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.420e-01", "anc_acc": "5.159e-01", "epoch": 0.05473} {"step": 27370, "loss": 1.1446, "grad_norm": "2.907e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.035e+00", "anc_loss": "1.148e+00", "dlm_acc": "6.405e-01", "anc_acc": "6.127e-01", "epoch": 0.05474} {"step": 27375, "loss": 1.5056, "grad_norm": "2.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.310e+00", "anc_loss": "1.412e+00", "dlm_acc": "5.644e-01", "anc_acc": "5.367e-01", "epoch": 0.05475} {"step": 27380, "loss": 1.2517, "grad_norm": "3.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.509e-01", "anc_acc": "5.234e-01", "epoch": 0.05476} {"step": 27385, "loss": 1.5065, "grad_norm": "3.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.658e+00", "anc_loss": "1.769e+00", "dlm_acc": "4.791e-01", "anc_acc": "4.559e-01", "epoch": 0.05477} {"step": 27390, "loss": 1.5006, "grad_norm": "3.236e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.522e+00", "anc_loss": "1.619e+00", "dlm_acc": "4.629e-01", "anc_acc": "4.394e-01", "epoch": 0.05478} {"step": 27395, "loss": 1.4024, "grad_norm": "4.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.756e-01", "anc_acc": "5.490e-01", "epoch": 0.05479} {"step": 27400, "loss": 1.3868, "grad_norm": "3.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.068e+00", "anc_loss": "1.198e+00", "dlm_acc": "6.402e-01", "anc_acc": "6.085e-01", "epoch": 0.0548} {"step": 27405, "loss": 1.1359, "grad_norm": "2.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.083e-01", "anc_acc": "5.805e-01", "epoch": 0.05481} {"step": 27410, "loss": 1.5694, "grad_norm": "6.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.490e+00", "anc_loss": "1.609e+00", "dlm_acc": "5.802e-01", "anc_acc": "5.516e-01", "epoch": 0.05482} {"step": 27415, "loss": 1.356, "grad_norm": "4.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.813e-01", "anc_acc": "5.550e-01", "epoch": 0.05483} {"step": 27420, "loss": 1.4795, "grad_norm": "5.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.560e+00", "anc_loss": "1.653e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.324e-01", "epoch": 0.05484} {"step": 27425, "loss": 1.4956, "grad_norm": "3.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.653e+00", "dlm_acc": "5.005e-01", "anc_acc": "4.782e-01", "epoch": 0.05485} {"step": 27430, "loss": 1.3609, "grad_norm": "4.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.732e-01", "anc_acc": "5.465e-01", "epoch": 0.05486} {"step": 27435, "loss": 1.4325, "grad_norm": "3.914e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.494e+00", "dlm_acc": "5.144e-01", "anc_acc": "4.919e-01", "epoch": 0.05487} {"step": 27440, "loss": 0.9931, "grad_norm": "4.316e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.107e+00", "dlm_acc": "6.152e-01", "anc_acc": "5.897e-01", "epoch": 0.05488} {"step": 27445, "loss": 0.9706, "grad_norm": "1.390e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.383e-01", "anc_loss": "8.043e-01", "dlm_acc": "6.350e-01", "anc_acc": "6.158e-01", "epoch": 0.05489} {"step": 27450, "loss": 1.1611, "grad_norm": "5.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.486e-01", "anc_acc": "5.229e-01", "epoch": 0.0549} {"step": 27455, "loss": 1.2989, "grad_norm": "5.632e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.306e+00", "dlm_acc": "5.282e-01", "anc_acc": "5.117e-01", "epoch": 0.05491} {"step": 27460, "loss": 1.5751, "grad_norm": "3.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.808e+00", "anc_loss": "1.934e+00", "dlm_acc": "4.726e-01", "anc_acc": "4.493e-01", "epoch": 0.05492} {"step": 27465, "loss": 1.2813, "grad_norm": "2.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.941e+00", "anc_loss": "2.014e+00", "dlm_acc": "3.303e-01", "anc_acc": "3.133e-01", "epoch": 0.05493} {"step": 27470, "loss": 1.5428, "grad_norm": "2.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.605e+00", "anc_loss": "1.689e+00", "dlm_acc": "4.215e-01", "anc_acc": "4.007e-01", "epoch": 0.05494} {"step": 27475, "loss": 1.0406, "grad_norm": "2.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.196e+00", "dlm_acc": "5.804e-01", "anc_acc": "5.448e-01", "epoch": 0.05495} {"step": 27480, "loss": 0.9126, "grad_norm": "4.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.340e-01", "anc_loss": "9.996e-01", "dlm_acc": "5.694e-01", "anc_acc": "5.509e-01", "epoch": 0.05496} {"step": 27485, "loss": 1.1866, "grad_norm": "7.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.508e-01", "anc_loss": "1.131e+00", "dlm_acc": "6.588e-01", "anc_acc": "6.005e-01", "epoch": 0.05497} {"step": 27490, "loss": 0.8493, "grad_norm": "2.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.114e+00", "dlm_acc": "5.976e-01", "anc_acc": "5.700e-01", "epoch": 0.05498} {"step": 27495, "loss": 0.9876, "grad_norm": "2.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.043e-01", "anc_loss": "7.715e-01", "dlm_acc": "6.334e-01", "anc_acc": "6.131e-01", "epoch": 0.05499} {"step": 27500, "loss": 1.2203, "grad_norm": "3.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.475e+00", "dlm_acc": "5.140e-01", "anc_acc": "4.912e-01", "epoch": 0.055} {"step": 27505, "loss": 1.228, "grad_norm": "7.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.918e-01", "anc_loss": "1.061e+00", "dlm_acc": "5.480e-01", "anc_acc": "5.289e-01", "epoch": 0.05501} {"step": 27510, "loss": 1.1605, "grad_norm": "5.236e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.344e-01", "anc_loss": "5.637e-01", "dlm_acc": "6.338e-01", "anc_acc": "6.181e-01", "epoch": 0.05502} {"step": 27515, "loss": 1.2781, "grad_norm": "3.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.875e-01", "anc_loss": "9.563e-01", "dlm_acc": "5.875e-01", "anc_acc": "5.661e-01", "epoch": 0.05503} {"step": 27520, "loss": 1.2026, "grad_norm": "3.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.716e+00", "anc_loss": "1.786e+00", "dlm_acc": "3.608e-01", "anc_acc": "3.418e-01", "epoch": 0.05504} {"step": 27525, "loss": 1.3222, "grad_norm": "3.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.670e+00", "anc_loss": "1.798e+00", "dlm_acc": "4.115e-01", "anc_acc": "3.904e-01", "epoch": 0.05505} {"step": 27530, "loss": 1.4227, "grad_norm": "4.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.451e+00", "dlm_acc": "5.547e-01", "anc_acc": "5.034e-01", "epoch": 0.05506} {"step": 27535, "loss": 1.2868, "grad_norm": "2.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.034e+00", "anc_loss": "2.081e+00", "dlm_acc": "2.689e-01", "anc_acc": "2.534e-01", "epoch": 0.05507} {"step": 27540, "loss": 1.4861, "grad_norm": "5.687e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.709e+00", "anc_loss": "1.765e+00", "dlm_acc": "4.212e-01", "anc_acc": "4.071e-01", "epoch": 0.05508} {"step": 27545, "loss": 1.1808, "grad_norm": "4.131e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.281e-01", "anc_loss": "1.021e+00", "dlm_acc": "6.108e-01", "anc_acc": "5.803e-01", "epoch": 0.05509} {"step": 27550, "loss": 1.7962, "grad_norm": "4.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.254e+00", "dlm_acc": "6.439e-01", "anc_acc": "6.195e-01", "epoch": 0.0551} {"step": 27555, "loss": 1.1923, "grad_norm": "3.125e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.024e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.249e-01", "anc_acc": "5.983e-01", "epoch": 0.05511} {"step": 27560, "loss": 1.3904, "grad_norm": "7.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.969e-01", "anc_loss": "1.107e+00", "dlm_acc": "6.179e-01", "anc_acc": "5.866e-01", "epoch": 0.05512} {"step": 27565, "loss": 1.203, "grad_norm": "4.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.208e+00", "dlm_acc": "5.958e-01", "anc_acc": "5.631e-01", "epoch": 0.05513} {"step": 27570, "loss": 1.3996, "grad_norm": "4.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.599e+00", "anc_loss": "1.713e+00", "dlm_acc": "4.806e-01", "anc_acc": "4.551e-01", "epoch": 0.05514} {"step": 27575, "loss": 1.2171, "grad_norm": "1.043e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.379e-01", "anc_loss": "9.527e-01", "dlm_acc": "6.522e-01", "anc_acc": "6.193e-01", "epoch": 0.05515} {"step": 27580, "loss": 1.9524, "grad_norm": "5.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.485e-01", "anc_acc": "5.156e-01", "epoch": 0.05516} {"step": 27585, "loss": 1.1707, "grad_norm": "4.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.211e-01", "anc_loss": "9.578e-01", "dlm_acc": "6.777e-01", "anc_acc": "6.339e-01", "epoch": 0.05517} {"step": 27590, "loss": 1.2008, "grad_norm": "4.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.336e-01", "anc_loss": "7.258e-01", "dlm_acc": "7.508e-01", "anc_acc": "7.228e-01", "epoch": 0.05518} {"step": 27595, "loss": 1.1561, "grad_norm": "2.331e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.977e-01", "anc_loss": "9.848e-01", "dlm_acc": "6.110e-01", "anc_acc": "5.850e-01", "epoch": 0.05519} {"step": 27600, "loss": 1.2955, "grad_norm": "6.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.556e-01", "anc_acc": "5.270e-01", "epoch": 0.0552} {"step": 27605, "loss": 1.4817, "grad_norm": "5.478e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.545e+00", "dlm_acc": "3.939e-01", "anc_acc": "3.835e-01", "epoch": 0.05521} {"step": 27610, "loss": 1.2829, "grad_norm": "2.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.238e+00", "dlm_acc": "5.824e-01", "anc_acc": "5.521e-01", "epoch": 0.05522} {"step": 27615, "loss": 1.3301, "grad_norm": "3.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.283e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.449e-01", "anc_acc": "5.128e-01", "epoch": 0.05523} {"step": 27620, "loss": 0.7738, "grad_norm": "2.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.992e-01", "anc_loss": "7.914e-01", "dlm_acc": "6.976e-01", "anc_acc": "6.658e-01", "epoch": 0.05524} {"step": 27625, "loss": 1.1298, "grad_norm": "2.353e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.261e-01", "epoch": 0.05525} {"step": 27630, "loss": 1.111, "grad_norm": "2.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.884e-01", "anc_acc": "5.636e-01", "epoch": 0.05526} {"step": 27635, "loss": 1.797, "grad_norm": "4.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.231e+00", "dlm_acc": "6.070e-01", "anc_acc": "5.844e-01", "epoch": 0.05527} {"step": 27640, "loss": 1.7252, "grad_norm": "6.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.637e-01", "anc_acc": "5.355e-01", "epoch": 0.05528} {"step": 27645, "loss": 1.8969, "grad_norm": "6.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.526e+00", "anc_loss": "1.641e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.834e-01", "epoch": 0.05529} {"step": 27650, "loss": 1.2019, "grad_norm": "1.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.111e+00", "anc_loss": "1.212e+00", "dlm_acc": "6.084e-01", "anc_acc": "5.800e-01", "epoch": 0.0553} {"step": 27655, "loss": 1.3137, "grad_norm": "3.273e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.181e+00", "dlm_acc": "6.188e-01", "anc_acc": "5.960e-01", "epoch": 0.05531} {"step": 27660, "loss": 1.6695, "grad_norm": "7.590e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.528e+00", "anc_loss": "1.623e+00", "dlm_acc": "5.177e-01", "anc_acc": "4.973e-01", "epoch": 0.05532} {"step": 27665, "loss": 1.3669, "grad_norm": "3.678e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.977e-01", "anc_loss": "1.082e+00", "dlm_acc": "6.130e-01", "anc_acc": "5.937e-01", "epoch": 0.05533} {"step": 27670, "loss": 1.3829, "grad_norm": "2.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.438e-01", "anc_acc": "5.178e-01", "epoch": 0.05534} {"step": 27675, "loss": 1.0241, "grad_norm": "2.210e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.181e-01", "anc_acc": "4.912e-01", "epoch": 0.05535} {"step": 27680, "loss": 0.8971, "grad_norm": "2.322e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.445e-01", "anc_loss": "1.035e+00", "dlm_acc": "6.078e-01", "anc_acc": "5.816e-01", "epoch": 0.05536} {"step": 27685, "loss": 2.1251, "grad_norm": "3.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.933e+00", "anc_loss": "2.061e+00", "dlm_acc": "4.709e-01", "anc_acc": "4.485e-01", "epoch": 0.05537} {"step": 27690, "loss": 1.1135, "grad_norm": "4.257e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.500e+00", "dlm_acc": "5.255e-01", "anc_acc": "5.045e-01", "epoch": 0.05538} {"step": 27695, "loss": 1.3872, "grad_norm": "3.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.745e-01", "anc_acc": "5.529e-01", "epoch": 0.05539} {"step": 27700, "loss": 1.7672, "grad_norm": "4.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.689e+00", "anc_loss": "1.783e+00", "dlm_acc": "4.847e-01", "anc_acc": "4.658e-01", "epoch": 0.0554} {"step": 27705, "loss": 1.2637, "grad_norm": "3.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.278e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.626e-01", "anc_acc": "5.364e-01", "epoch": 0.05541} {"step": 27710, "loss": 1.3889, "grad_norm": "3.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.349e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.456e-01", "anc_acc": "5.221e-01", "epoch": 0.05542} {"step": 27715, "loss": 1.2564, "grad_norm": "5.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.433e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.346e-01", "epoch": 0.05543} {"step": 27720, "loss": 0.834, "grad_norm": "3.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.748e-01", "anc_loss": "5.420e-01", "dlm_acc": "8.134e-01", "anc_acc": "7.938e-01", "epoch": 0.05544} {"step": 27725, "loss": 0.9042, "grad_norm": "4.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.241e-01", "anc_loss": "1.011e+00", "dlm_acc": "7.117e-01", "anc_acc": "6.916e-01", "epoch": 0.05545} {"step": 27730, "loss": 1.0384, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.591e+00", "dlm_acc": "5.396e-01", "anc_acc": "5.108e-01", "epoch": 0.05546} {"step": 27735, "loss": 1.2689, "grad_norm": "3.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.513e+00", "anc_loss": "1.595e+00", "dlm_acc": "4.731e-01", "anc_acc": "4.541e-01", "epoch": 0.05547} {"step": 27740, "loss": 1.2399, "grad_norm": "1.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.324e+00", "dlm_acc": "6.021e-01", "anc_acc": "5.774e-01", "epoch": 0.05548} {"step": 27745, "loss": 1.0643, "grad_norm": "3.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.320e-01", "anc_loss": "1.016e+00", "dlm_acc": "6.069e-01", "anc_acc": "5.838e-01", "epoch": 0.05549} {"step": 27750, "loss": 1.011, "grad_norm": "2.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.364e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.322e-01", "anc_acc": "5.084e-01", "epoch": 0.0555} {"step": 27755, "loss": 1.278, "grad_norm": "4.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.587e+00", "dlm_acc": "4.979e-01", "anc_acc": "4.812e-01", "epoch": 0.05551} {"step": 27760, "loss": 0.8927, "grad_norm": "3.347e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.203e-01", "anc_loss": "7.609e-01", "dlm_acc": "4.460e-01", "anc_acc": "4.181e-01", "epoch": 0.05552} {"step": 27765, "loss": 1.1214, "grad_norm": "4.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.422e-01", "anc_loss": "7.789e-01", "dlm_acc": "4.407e-01", "anc_acc": "4.194e-01", "epoch": 0.05553} {"step": 27770, "loss": 1.088, "grad_norm": "3.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.961e-01", "anc_loss": "8.305e-01", "dlm_acc": "4.128e-01", "anc_acc": "3.913e-01", "epoch": 0.05554} {"step": 27775, "loss": 1.1762, "grad_norm": "2.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.097e+00", "anc_loss": "1.182e+00", "dlm_acc": "5.177e-01", "anc_acc": "4.907e-01", "epoch": 0.05555} {"step": 27780, "loss": 0.9079, "grad_norm": "2.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.657e-01", "anc_acc": "5.339e-01", "epoch": 0.05556} {"step": 27785, "loss": 1.005, "grad_norm": "3.239e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.147e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.422e-01", "anc_acc": "5.085e-01", "epoch": 0.05557} {"step": 27790, "loss": 1.218, "grad_norm": "3.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.041e+00", "anc_loss": "1.057e+00", "dlm_acc": "3.368e-01", "anc_acc": "3.277e-01", "epoch": 0.05558} {"step": 27795, "loss": 1.0192, "grad_norm": "3.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.809e-01", "anc_loss": "9.961e-01", "dlm_acc": "4.225e-01", "anc_acc": "4.165e-01", "epoch": 0.05559} {"step": 27800, "loss": 1.1314, "grad_norm": "4.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.027e+00", "dlm_acc": "3.369e-01", "anc_acc": "3.366e-01", "epoch": 0.0556} {"step": 27805, "loss": 0.8871, "grad_norm": "2.470e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.133e+00", "dlm_acc": "4.812e-01", "anc_acc": "4.639e-01", "epoch": 0.05561} {"step": 27810, "loss": 1.2122, "grad_norm": "3.122e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.478e+00", "anc_loss": "1.600e+00", "dlm_acc": "5.270e-01", "anc_acc": "5.013e-01", "epoch": 0.05562} {"step": 27815, "loss": 1.2862, "grad_norm": "4.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.556e+00", "anc_loss": "1.623e+00", "dlm_acc": "4.001e-01", "anc_acc": "3.877e-01", "epoch": 0.05563} {"step": 27820, "loss": 1.2677, "grad_norm": "7.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.180e+00", "dlm_acc": "3.861e-01", "anc_acc": "3.838e-01", "epoch": 0.05564} {"step": 27825, "loss": 1.0213, "grad_norm": "3.868e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.984e-01", "anc_loss": "9.070e-01", "dlm_acc": "4.269e-01", "anc_acc": "4.228e-01", "epoch": 0.05565} {"step": 27830, "loss": 1.0636, "grad_norm": "3.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.812e-01", "anc_loss": "9.930e-01", "dlm_acc": "3.908e-01", "anc_acc": "3.877e-01", "epoch": 0.05566} {"step": 27835, "loss": 1.3501, "grad_norm": "9.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.417e+00", "anc_loss": "1.452e+00", "dlm_acc": "2.617e-01", "anc_acc": "2.561e-01", "epoch": 0.05567} {"step": 27840, "loss": 1.0435, "grad_norm": "4.237e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.300e+00", "anc_loss": "1.351e+00", "dlm_acc": "3.510e-01", "anc_acc": "3.393e-01", "epoch": 0.05568} {"step": 27845, "loss": 1.1708, "grad_norm": "3.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e+00", "anc_loss": "1.748e+00", "dlm_acc": "5.014e-01", "anc_acc": "4.806e-01", "epoch": 0.05569} {"step": 27850, "loss": 1.2141, "grad_norm": "3.939e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.493e+00", "anc_loss": "1.579e+00", "dlm_acc": "4.648e-01", "anc_acc": "4.424e-01", "epoch": 0.0557} {"step": 27855, "loss": 1.5096, "grad_norm": "3.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e+00", "anc_loss": "1.761e+00", "dlm_acc": "4.935e-01", "anc_acc": "4.696e-01", "epoch": 0.05571} {"step": 27860, "loss": 1.298, "grad_norm": "2.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.686e+00", "anc_loss": "1.803e+00", "dlm_acc": "4.629e-01", "anc_acc": "4.393e-01", "epoch": 0.05572} {"step": 27865, "loss": 1.3212, "grad_norm": "3.581e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.481e+00", "anc_loss": "1.606e+00", "dlm_acc": "5.251e-01", "anc_acc": "4.970e-01", "epoch": 0.05573} {"step": 27870, "loss": 1.2506, "grad_norm": "3.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.157e-01", "anc_acc": "4.935e-01", "epoch": 0.05574} {"step": 27875, "loss": 1.1647, "grad_norm": "2.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.637e+00", "anc_loss": "1.742e+00", "dlm_acc": "4.901e-01", "anc_acc": "4.664e-01", "epoch": 0.05575} {"step": 27880, "loss": 1.2092, "grad_norm": "3.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.694e+00", "anc_loss": "1.807e+00", "dlm_acc": "5.011e-01", "anc_acc": "4.786e-01", "epoch": 0.05576} {"step": 27885, "loss": 1.3316, "grad_norm": "3.422e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.723e+00", "dlm_acc": "4.760e-01", "anc_acc": "4.497e-01", "epoch": 0.05577} {"step": 27890, "loss": 0.8478, "grad_norm": "1.167e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.253e+00", "dlm_acc": "5.672e-01", "anc_acc": "5.391e-01", "epoch": 0.05578} {"step": 27895, "loss": 1.1059, "grad_norm": "6.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.207e+00", "anc_loss": "1.297e+00", "dlm_acc": "5.692e-01", "anc_acc": "5.466e-01", "epoch": 0.05579} {"step": 27900, "loss": 1.0204, "grad_norm": "3.071e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.128e+00", "dlm_acc": "5.596e-01", "anc_acc": "5.381e-01", "epoch": 0.0558} {"step": 27905, "loss": 0.9984, "grad_norm": "2.572e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.237e+00", "dlm_acc": "5.553e-01", "anc_acc": "5.330e-01", "epoch": 0.05581} {"step": 27910, "loss": 1.1635, "grad_norm": "4.379e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.385e+00", "dlm_acc": "5.560e-01", "anc_acc": "5.309e-01", "epoch": 0.05582} {"step": 27915, "loss": 1.2037, "grad_norm": "3.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.476e+00", "dlm_acc": "4.441e-01", "anc_acc": "4.297e-01", "epoch": 0.05583} {"step": 27920, "loss": 1.0882, "grad_norm": "2.472e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.611e+00", "dlm_acc": "5.217e-01", "anc_acc": "4.983e-01", "epoch": 0.05584} {"step": 27925, "loss": 1.1724, "grad_norm": "3.201e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.152e+00", "dlm_acc": "6.056e-01", "anc_acc": "5.813e-01", "epoch": 0.05585} {"step": 27930, "loss": 1.4087, "grad_norm": "5.170e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.669e+00", "anc_loss": "1.778e+00", "dlm_acc": "4.706e-01", "anc_acc": "4.468e-01", "epoch": 0.05586} {"step": 27935, "loss": 1.4411, "grad_norm": "5.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.788e+00", "anc_loss": "1.869e+00", "dlm_acc": "4.749e-01", "anc_acc": "4.585e-01", "epoch": 0.05587} {"step": 27940, "loss": 1.1634, "grad_norm": "5.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.270e-01", "anc_loss": "3.496e-01", "dlm_acc": "7.882e-01", "anc_acc": "7.800e-01", "epoch": 0.05588} {"step": 27945, "loss": 1.0097, "grad_norm": "2.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.286e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.463e-01", "anc_acc": "5.231e-01", "epoch": 0.05589} {"step": 27950, "loss": 1.3853, "grad_norm": "6.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.259e+00", "dlm_acc": "4.231e-01", "anc_acc": "4.149e-01", "epoch": 0.0559} {"step": 27955, "loss": 1.1687, "grad_norm": "5.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.121e+00", "dlm_acc": "3.438e-01", "anc_acc": "3.421e-01", "epoch": 0.05591} {"step": 27960, "loss": 1.3884, "grad_norm": "3.820e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.361e+00", "dlm_acc": "4.222e-01", "anc_acc": "4.101e-01", "epoch": 0.05592} {"step": 27965, "loss": 1.1318, "grad_norm": "2.547e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.299e-01", "anc_acc": "5.047e-01", "epoch": 0.05593} {"step": 27970, "loss": 1.1646, "grad_norm": "2.456e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.267e+00", "dlm_acc": "5.940e-01", "anc_acc": "5.746e-01", "epoch": 0.05594} {"step": 27975, "loss": 1.1849, "grad_norm": "2.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.644e+00", "dlm_acc": "5.111e-01", "anc_acc": "4.848e-01", "epoch": 0.05595} {"step": 27980, "loss": 1.4008, "grad_norm": "3.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.819e+00", "anc_loss": "1.902e+00", "dlm_acc": "4.139e-01", "anc_acc": "3.960e-01", "epoch": 0.05596} {"step": 27985, "loss": 0.9086, "grad_norm": "7.208e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.461e-01", "anc_loss": "1.027e+00", "dlm_acc": "6.732e-01", "anc_acc": "6.526e-01", "epoch": 0.05597} {"step": 27990, "loss": 1.4852, "grad_norm": "4.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.660e-01", "anc_acc": "5.409e-01", "epoch": 0.05598} {"step": 27995, "loss": 1.2136, "grad_norm": "2.732e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.232e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.451e-01", "anc_acc": "5.210e-01", "epoch": 0.05599} {"step": 28000, "loss": 0.9304, "grad_norm": "6.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.304e+00", "dlm_acc": "6.114e-01", "anc_acc": "5.809e-01", "epoch": 0.056} {"step": 28005, "loss": 0.991, "grad_norm": "3.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.398e-01", "epoch": 0.05601} {"step": 28010, "loss": 1.38, "grad_norm": "3.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.598e+00", "dlm_acc": "5.183e-01", "anc_acc": "4.940e-01", "epoch": 0.05602} {"step": 28015, "loss": 1.9285, "grad_norm": "2.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.260e+00", "dlm_acc": "6.333e-01", "anc_acc": "6.106e-01", "epoch": 0.05603} {"step": 28020, "loss": 1.9106, "grad_norm": "2.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.142e+00", "dlm_acc": "6.120e-01", "anc_acc": "5.895e-01", "epoch": 0.05604} {"step": 28025, "loss": 1.3432, "grad_norm": "2.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.336e-01", "anc_loss": "1.023e+00", "dlm_acc": "6.423e-01", "anc_acc": "6.155e-01", "epoch": 0.05605} {"step": 28030, "loss": 1.0806, "grad_norm": "3.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.911e-01", "anc_acc": "5.674e-01", "epoch": 0.05606} {"step": 28035, "loss": 1.5903, "grad_norm": "3.657e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.595e+00", "dlm_acc": "5.436e-01", "anc_acc": "5.180e-01", "epoch": 0.05607} {"step": 28040, "loss": 1.4628, "grad_norm": "2.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.486e+00", "dlm_acc": "5.355e-01", "anc_acc": "5.102e-01", "epoch": 0.05608} {"step": 28045, "loss": 1.1648, "grad_norm": "2.753e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.477e-01", "anc_loss": "7.469e-01", "dlm_acc": "7.154e-01", "anc_acc": "6.890e-01", "epoch": 0.05609} {"step": 28050, "loss": 1.6333, "grad_norm": "2.487e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.480e+00", "anc_loss": "1.594e+00", "dlm_acc": "5.453e-01", "anc_acc": "5.211e-01", "epoch": 0.0561} {"step": 28055, "loss": 1.224, "grad_norm": "3.125e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.181e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.744e-01", "anc_acc": "5.503e-01", "epoch": 0.05611} {"step": 28060, "loss": 1.1235, "grad_norm": "7.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.804e-01", "anc_acc": "5.564e-01", "epoch": 0.05612} {"step": 28065, "loss": 0.8473, "grad_norm": "1.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.272e-01", "anc_loss": "7.819e-01", "dlm_acc": "7.334e-01", "anc_acc": "7.162e-01", "epoch": 0.05613} {"step": 28070, "loss": 0.9963, "grad_norm": "5.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.982e-01", "anc_loss": "3.177e-01", "dlm_acc": "8.814e-01", "anc_acc": "8.712e-01", "epoch": 0.05614} {"step": 28075, "loss": 0.8497, "grad_norm": "3.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.491e-01", "anc_loss": "3.934e-01", "dlm_acc": "8.269e-01", "anc_acc": "8.064e-01", "epoch": 0.05615} {"step": 28080, "loss": 1.0489, "grad_norm": "4.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.268e+00", "dlm_acc": "5.949e-01", "anc_acc": "5.762e-01", "epoch": 0.05616} {"step": 28085, "loss": 0.9939, "grad_norm": "3.842e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.399e-01", "anc_loss": "5.946e-01", "dlm_acc": "7.655e-01", "anc_acc": "7.500e-01", "epoch": 0.05617} {"step": 28090, "loss": 0.9829, "grad_norm": "1.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.491e-01", "anc_loss": "4.321e-01", "dlm_acc": "8.800e-01", "anc_acc": "8.563e-01", "epoch": 0.05618} {"step": 28095, "loss": 1.0973, "grad_norm": "2.898e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.566e-01", "anc_loss": "7.727e-01", "dlm_acc": "7.372e-01", "anc_acc": "6.996e-01", "epoch": 0.05619} {"step": 28100, "loss": 1.3759, "grad_norm": "4.290e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.687e-01", "anc_loss": "7.255e-01", "dlm_acc": "7.159e-01", "anc_acc": "6.991e-01", "epoch": 0.0562} {"step": 28105, "loss": 0.7788, "grad_norm": "2.791e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.771e-01", "anc_loss": "2.858e-01", "dlm_acc": "8.598e-01", "anc_acc": "8.628e-01", "epoch": 0.05621} {"step": 28110, "loss": 1.0516, "grad_norm": "4.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.730e-01", "anc_loss": "9.418e-01", "dlm_acc": "6.641e-01", "anc_acc": "6.461e-01", "epoch": 0.05622} {"step": 28115, "loss": 0.8362, "grad_norm": "5.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.727e-01", "anc_loss": "6.041e-01", "dlm_acc": "5.694e-01", "anc_acc": "5.509e-01", "epoch": 0.05623} {"step": 28120, "loss": 1.2766, "grad_norm": "3.782e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.264e+00", "dlm_acc": "4.556e-01", "anc_acc": "4.353e-01", "epoch": 0.05624} {"step": 28125, "loss": 1.1737, "grad_norm": "2.716e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.281e-01", "anc_loss": "1.012e+00", "dlm_acc": "6.586e-01", "anc_acc": "6.363e-01", "epoch": 0.05625} {"step": 28130, "loss": 1.1467, "grad_norm": "3.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.754e-01", "anc_loss": "6.352e-01", "dlm_acc": "7.538e-01", "anc_acc": "7.367e-01", "epoch": 0.05626} {"step": 28135, "loss": 1.3207, "grad_norm": "3.315e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.738e-01", "anc_loss": "1.053e+00", "dlm_acc": "6.555e-01", "anc_acc": "6.369e-01", "epoch": 0.05627} {"step": 28140, "loss": 1.1931, "grad_norm": "1.508e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.855e-01", "anc_loss": "8.470e-01", "dlm_acc": "7.416e-01", "anc_acc": "7.243e-01", "epoch": 0.05628} {"step": 28145, "loss": 1.263, "grad_norm": "2.925e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.679e-01", "anc_loss": "4.096e-01", "dlm_acc": "8.001e-01", "anc_acc": "7.846e-01", "epoch": 0.05629} {"step": 28150, "loss": 0.9865, "grad_norm": "3.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.035e+00", "anc_loss": "1.105e+00", "dlm_acc": "6.152e-01", "anc_acc": "5.944e-01", "epoch": 0.0563} {"step": 28155, "loss": 1.4193, "grad_norm": "6.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.205e+00", "dlm_acc": "5.973e-01", "anc_acc": "5.763e-01", "epoch": 0.05631} {"step": 28160, "loss": 0.7422, "grad_norm": "1.279e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.351e-01", "anc_loss": "4.737e-01", "dlm_acc": "8.348e-01", "anc_acc": "8.215e-01", "epoch": 0.05632} {"step": 28165, "loss": 0.8758, "grad_norm": "3.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.617e-01", "anc_loss": "5.060e-01", "dlm_acc": "8.044e-01", "anc_acc": "7.891e-01", "epoch": 0.05633} {"step": 28170, "loss": 1.5256, "grad_norm": "6.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.438e-01", "anc_acc": "5.223e-01", "epoch": 0.05634} {"step": 28175, "loss": 1.2738, "grad_norm": "2.458e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.444e-01", "anc_loss": "7.938e-01", "dlm_acc": "6.521e-01", "anc_acc": "6.345e-01", "epoch": 0.05635} {"step": 28180, "loss": 1.1124, "grad_norm": "2.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.247e+00", "dlm_acc": "5.812e-01", "anc_acc": "5.608e-01", "epoch": 0.05636} {"step": 28185, "loss": 1.1169, "grad_norm": "3.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.295e-01", "anc_loss": "5.598e-01", "dlm_acc": "6.288e-01", "anc_acc": "6.094e-01", "epoch": 0.05637} {"step": 28190, "loss": 1.2212, "grad_norm": "3.061e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.289e+00", "dlm_acc": "5.586e-01", "anc_acc": "5.334e-01", "epoch": 0.05638} {"step": 28195, "loss": 1.0277, "grad_norm": "4.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.166e+00", "dlm_acc": "6.142e-01", "anc_acc": "5.966e-01", "epoch": 0.05639} {"step": 28200, "loss": 0.6951, "grad_norm": "3.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.691e-01", "anc_loss": "9.402e-01", "dlm_acc": "6.457e-01", "anc_acc": "6.276e-01", "epoch": 0.0564} {"step": 28205, "loss": 0.8826, "grad_norm": "3.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.351e-01", "anc_loss": "3.777e-01", "dlm_acc": "8.264e-01", "anc_acc": "8.071e-01", "epoch": 0.05641} {"step": 28210, "loss": 1.329, "grad_norm": "3.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.111e+00", "anc_loss": "1.189e+00", "dlm_acc": "6.099e-01", "anc_acc": "5.903e-01", "epoch": 0.05642} {"step": 28215, "loss": 1.1937, "grad_norm": "6.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.357e-01", "anc_loss": "7.013e-01", "dlm_acc": "7.622e-01", "anc_acc": "7.399e-01", "epoch": 0.05643} {"step": 28220, "loss": 1.3487, "grad_norm": "4.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.377e-01", "anc_loss": "5.808e-01", "dlm_acc": "7.760e-01", "anc_acc": "7.631e-01", "epoch": 0.05644} {"step": 28225, "loss": 1.1867, "grad_norm": "2.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.127e+00", "dlm_acc": "5.637e-01", "anc_acc": "5.442e-01", "epoch": 0.05645} {"step": 28230, "loss": 1.134, "grad_norm": "6.339e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.766e-01", "anc_loss": "5.008e-01", "dlm_acc": "6.799e-01", "anc_acc": "6.714e-01", "epoch": 0.05646} {"step": 28235, "loss": 0.9802, "grad_norm": "2.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.885e-01", "anc_loss": "2.248e-01", "dlm_acc": "8.519e-01", "anc_acc": "8.299e-01", "epoch": 0.05647} {"step": 28240, "loss": 1.46, "grad_norm": "5.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.604e-01", "anc_loss": "6.192e-01", "dlm_acc": "8.046e-01", "anc_acc": "7.907e-01", "epoch": 0.05648} {"step": 28245, "loss": 1.3521, "grad_norm": "3.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.727e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.446e-01", "anc_acc": "6.199e-01", "epoch": 0.05649} {"step": 28250, "loss": 0.7512, "grad_norm": "5.092e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.126e-01", "anc_loss": "3.331e-01", "dlm_acc": "7.998e-01", "anc_acc": "7.891e-01", "epoch": 0.0565} {"step": 28255, "loss": 0.8234, "grad_norm": "4.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.852e-01", "anc_loss": "3.002e-01", "dlm_acc": "7.971e-01", "anc_acc": "7.884e-01", "epoch": 0.05651} {"step": 28260, "loss": 0.9367, "grad_norm": "4.590e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.723e-01", "anc_loss": "9.271e-01", "dlm_acc": "6.745e-01", "anc_acc": "6.599e-01", "epoch": 0.05652} {"step": 28265, "loss": 1.0059, "grad_norm": "1.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.668e-01", "anc_loss": "8.277e-01", "dlm_acc": "6.190e-01", "anc_acc": "6.018e-01", "epoch": 0.05653} {"step": 28270, "loss": 0.9572, "grad_norm": "4.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.223e-01", "anc_loss": "5.531e-01", "dlm_acc": "6.699e-01", "anc_acc": "6.567e-01", "epoch": 0.05654} {"step": 28275, "loss": 0.6124, "grad_norm": "2.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.957e-01", "anc_loss": "4.309e-01", "dlm_acc": "7.102e-01", "anc_acc": "6.931e-01", "epoch": 0.05655} {"step": 28280, "loss": 0.5184, "grad_norm": "2.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.393e-01", "anc_loss": "2.645e-01", "dlm_acc": "8.380e-01", "anc_acc": "8.250e-01", "epoch": 0.05656} {"step": 28285, "loss": 0.8887, "grad_norm": "4.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.461e-01", "anc_loss": "2.714e-01", "dlm_acc": "8.466e-01", "anc_acc": "8.341e-01", "epoch": 0.05657} {"step": 28290, "loss": 0.8521, "grad_norm": "3.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.980e-01", "anc_loss": "6.449e-01", "dlm_acc": "6.947e-01", "anc_acc": "6.824e-01", "epoch": 0.05658} {"step": 28295, "loss": 1.1879, "grad_norm": "5.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.499e+00", "dlm_acc": "5.368e-01", "anc_acc": "5.146e-01", "epoch": 0.05659} {"step": 28300, "loss": 0.9988, "grad_norm": "4.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.406e+00", "dlm_acc": "4.917e-01", "anc_acc": "4.741e-01", "epoch": 0.0566} {"step": 28305, "loss": 1.1324, "grad_norm": "1.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.339e+00", "anc_loss": "1.446e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.183e-01", "epoch": 0.05661} {"step": 28310, "loss": 1.4058, "grad_norm": "5.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.635e+00", "anc_loss": "1.744e+00", "dlm_acc": "5.063e-01", "anc_acc": "4.824e-01", "epoch": 0.05662} {"step": 28315, "loss": 1.4163, "grad_norm": "3.154e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.611e+00", "anc_loss": "1.744e+00", "dlm_acc": "5.197e-01", "anc_acc": "4.944e-01", "epoch": 0.05663} {"step": 28320, "loss": 1.125, "grad_norm": "3.290e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.537e-01", "anc_acc": "5.281e-01", "epoch": 0.05664} {"step": 28325, "loss": 1.5164, "grad_norm": "8.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.831e+00", "anc_loss": "1.953e+00", "dlm_acc": "4.445e-01", "anc_acc": "4.250e-01", "epoch": 0.05665} {"step": 28330, "loss": 1.2421, "grad_norm": "2.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.602e+00", "dlm_acc": "5.167e-01", "anc_acc": "4.924e-01", "epoch": 0.05666} {"step": 28335, "loss": 1.1624, "grad_norm": "4.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.365e+00", "dlm_acc": "5.540e-01", "anc_acc": "5.312e-01", "epoch": 0.05667} {"step": 28340, "loss": 1.5641, "grad_norm": "4.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.752e+00", "dlm_acc": "5.335e-01", "anc_acc": "5.055e-01", "epoch": 0.05668} {"step": 28345, "loss": 1.4137, "grad_norm": "5.778e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.702e+00", "dlm_acc": "4.805e-01", "anc_acc": "4.574e-01", "epoch": 0.05669} {"step": 28350, "loss": 0.9101, "grad_norm": "1.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.711e-01", "anc_loss": "1.068e+00", "dlm_acc": "6.564e-01", "anc_acc": "6.318e-01", "epoch": 0.0567} {"step": 28355, "loss": 1.3881, "grad_norm": "4.108e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.560e+00", "anc_loss": "1.683e+00", "dlm_acc": "5.314e-01", "anc_acc": "5.045e-01", "epoch": 0.05671} {"step": 28360, "loss": 1.0822, "grad_norm": "2.244e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.232e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.802e-01", "anc_acc": "5.475e-01", "epoch": 0.05672} {"step": 28365, "loss": 0.7981, "grad_norm": "2.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.641e-01", "anc_loss": "1.052e+00", "dlm_acc": "5.697e-01", "anc_acc": "5.472e-01", "epoch": 0.05673} {"step": 28370, "loss": 1.3269, "grad_norm": "3.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.689e+00", "anc_loss": "1.795e+00", "dlm_acc": "4.622e-01", "anc_acc": "4.397e-01", "epoch": 0.05674} {"step": 28375, "loss": 0.9902, "grad_norm": "6.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.285e+00", "dlm_acc": "5.372e-01", "anc_acc": "5.122e-01", "epoch": 0.05675} {"step": 28380, "loss": 1.0703, "grad_norm": "2.075e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.578e+00", "dlm_acc": "4.697e-01", "anc_acc": "4.425e-01", "epoch": 0.05676} {"step": 28385, "loss": 1.0399, "grad_norm": "5.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.381e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.412e-01", "anc_acc": "5.115e-01", "epoch": 0.05677} {"step": 28390, "loss": 1.1796, "grad_norm": "2.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.385e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.310e-01", "anc_acc": "5.072e-01", "epoch": 0.05678} {"step": 28395, "loss": 0.7292, "grad_norm": "4.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.219e+00", "dlm_acc": "4.478e-01", "anc_acc": "4.297e-01", "epoch": 0.05679} {"step": 28400, "loss": 1.1683, "grad_norm": "5.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.000e-01", "anc_loss": "9.516e-01", "dlm_acc": "4.534e-01", "anc_acc": "4.310e-01", "epoch": 0.0568} {"step": 28405, "loss": 0.7641, "grad_norm": "2.874e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.781e-01", "anc_loss": "6.359e-01", "dlm_acc": "5.447e-01", "anc_acc": "5.088e-01", "epoch": 0.05681} {"step": 28410, "loss": 1.3468, "grad_norm": "3.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.469e-01", "anc_loss": "8.102e-01", "dlm_acc": "4.840e-01", "anc_acc": "4.477e-01", "epoch": 0.05682} {"step": 28415, "loss": 0.8719, "grad_norm": "4.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.883e-01", "anc_loss": "6.555e-01", "dlm_acc": "5.570e-01", "anc_acc": "5.182e-01", "epoch": 0.05683} {"step": 28420, "loss": 1.1124, "grad_norm": "1.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.492e-01", "anc_loss": "7.164e-01", "dlm_acc": "5.410e-01", "anc_acc": "5.013e-01", "epoch": 0.05684} {"step": 28425, "loss": 1.3577, "grad_norm": "5.883e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.906e-01", "anc_loss": "6.586e-01", "dlm_acc": "5.628e-01", "anc_acc": "5.207e-01", "epoch": 0.05685} {"step": 28430, "loss": 1.5706, "grad_norm": "3.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.210e+00", "dlm_acc": "6.366e-01", "anc_acc": "6.171e-01", "epoch": 0.05686} {"step": 28435, "loss": 1.2348, "grad_norm": "3.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.186e+00", "dlm_acc": "6.074e-01", "anc_acc": "5.803e-01", "epoch": 0.05687} {"step": 28440, "loss": 1.3114, "grad_norm": "2.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.078e-01", "anc_loss": "1.021e+00", "dlm_acc": "6.586e-01", "anc_acc": "6.214e-01", "epoch": 0.05688} {"step": 28445, "loss": 1.3189, "grad_norm": "4.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.233e+00", "dlm_acc": "6.003e-01", "anc_acc": "5.767e-01", "epoch": 0.05689} {"step": 28450, "loss": 0.859, "grad_norm": "4.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.195e-01", "anc_loss": "1.021e+00", "dlm_acc": "6.125e-01", "anc_acc": "5.800e-01", "epoch": 0.0569} {"step": 28455, "loss": 1.4772, "grad_norm": "2.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.446e+00", "anc_loss": "2.516e+00", "dlm_acc": "2.367e-01", "anc_acc": "2.242e-01", "epoch": 0.05691} {"step": 28460, "loss": 1.6226, "grad_norm": "5.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.617e+00", "anc_loss": "2.653e+00", "dlm_acc": "9.330e-02", "anc_acc": "8.523e-02", "epoch": 0.05692} {"step": 28465, "loss": 1.5909, "grad_norm": "3.437e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.149e+00", "anc_loss": "1.240e+00", "dlm_acc": "5.978e-01", "anc_acc": "5.707e-01", "epoch": 0.05693} {"step": 28470, "loss": 1.4805, "grad_norm": "3.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.375e+00", "dlm_acc": "5.566e-01", "anc_acc": "5.374e-01", "epoch": 0.05694} {"step": 28475, "loss": 1.5464, "grad_norm": "3.798e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.981e+00", "anc_loss": "2.139e+00", "dlm_acc": "3.204e-01", "anc_acc": "2.820e-01", "epoch": 0.05695} {"step": 28480, "loss": 1.4123, "grad_norm": "4.114e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.702e+00", "dlm_acc": "4.186e-01", "anc_acc": "3.825e-01", "epoch": 0.05696} {"step": 28485, "loss": 1.1602, "grad_norm": "5.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.711e-01", "anc_loss": "1.057e+00", "dlm_acc": "6.024e-01", "anc_acc": "5.777e-01", "epoch": 0.05697} {"step": 28490, "loss": 1.1536, "grad_norm": "6.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.938e-01", "anc_loss": "9.617e-01", "dlm_acc": "5.636e-01", "anc_acc": "5.443e-01", "epoch": 0.05698} {"step": 28495, "loss": 1.7828, "grad_norm": "5.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.530e+00", "dlm_acc": "4.436e-01", "anc_acc": "4.260e-01", "epoch": 0.05699} {"step": 28500, "loss": 1.2984, "grad_norm": "7.749e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.658e-01", "anc_acc": "5.288e-01", "epoch": 0.057} {"step": 28505, "loss": 0.9849, "grad_norm": "1.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.688e+00", "anc_loss": "1.765e+00", "dlm_acc": "3.746e-01", "anc_acc": "3.542e-01", "epoch": 0.05701} {"step": 28510, "loss": 1.1001, "grad_norm": "2.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.723e-01", "anc_acc": "5.377e-01", "epoch": 0.05702} {"step": 28515, "loss": 0.8482, "grad_norm": "2.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.205e+00", "dlm_acc": "5.788e-01", "anc_acc": "5.440e-01", "epoch": 0.05703} {"step": 28520, "loss": 0.9706, "grad_norm": "8.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.445e-01", "anc_loss": "8.043e-01", "dlm_acc": "6.221e-01", "anc_acc": "5.971e-01", "epoch": 0.05704} {"step": 28525, "loss": 1.4917, "grad_norm": "6.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.226e+00", "anc_loss": "1.306e+00", "dlm_acc": "5.465e-01", "anc_acc": "5.237e-01", "epoch": 0.05705} {"step": 28530, "loss": 1.5357, "grad_norm": "1.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.407e+00", "anc_loss": "1.485e+00", "dlm_acc": "5.813e-01", "anc_acc": "5.627e-01", "epoch": 0.05706} {"step": 28535, "loss": 0.9575, "grad_norm": "3.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.854e-01", "anc_loss": "3.254e-01", "dlm_acc": "8.275e-01", "anc_acc": "8.145e-01", "epoch": 0.05707} {"step": 28540, "loss": 1.0948, "grad_norm": "3.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.102e-01", "anc_loss": "9.461e-01", "dlm_acc": "6.779e-01", "anc_acc": "6.630e-01", "epoch": 0.05708} {"step": 28545, "loss": 1.212, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.007e-01", "anc_acc": "4.725e-01", "epoch": 0.05709} {"step": 28550, "loss": 1.3684, "grad_norm": "3.110e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.301e+00", "dlm_acc": "6.229e-01", "anc_acc": "5.873e-01", "epoch": 0.0571} {"step": 28555, "loss": 1.0534, "grad_norm": "3.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.848e-01", "anc_loss": "7.824e-01", "dlm_acc": "7.327e-01", "anc_acc": "7.030e-01", "epoch": 0.05711} {"step": 28560, "loss": 1.2005, "grad_norm": "2.252e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.141e-01", "anc_loss": "8.488e-01", "dlm_acc": "7.048e-01", "anc_acc": "6.613e-01", "epoch": 0.05712} {"step": 28565, "loss": 1.2981, "grad_norm": "2.791e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.773e-01", "anc_loss": "9.559e-01", "dlm_acc": "6.496e-01", "anc_acc": "6.264e-01", "epoch": 0.05713} {"step": 28570, "loss": 1.2995, "grad_norm": "3.968e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.256e+00", "anc_loss": "2.384e+00", "dlm_acc": "1.995e-01", "anc_acc": "1.631e-01", "epoch": 0.05714} {"step": 28575, "loss": 1.0417, "grad_norm": "2.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.115e-01", "anc_loss": "1.004e+00", "dlm_acc": "7.403e-01", "anc_acc": "7.159e-01", "epoch": 0.05715} {"step": 28580, "loss": 1.3519, "grad_norm": "4.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.153e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.376e-01", "anc_acc": "5.082e-01", "epoch": 0.05716} {"step": 28585, "loss": 1.4676, "grad_norm": "3.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.384e-01", "anc_acc": "5.105e-01", "epoch": 0.05717} {"step": 28590, "loss": 1.0315, "grad_norm": "3.290e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.508e-01", "anc_loss": "9.383e-01", "dlm_acc": "6.124e-01", "anc_acc": "5.867e-01", "epoch": 0.05718} {"step": 28595, "loss": 1.234, "grad_norm": "4.071e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.070e-01", "anc_loss": "7.836e-01", "dlm_acc": "5.341e-01", "anc_acc": "5.084e-01", "epoch": 0.05719} {"step": 28600, "loss": 1.2435, "grad_norm": "2.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.617e-01", "anc_loss": "9.672e-01", "dlm_acc": "5.946e-01", "anc_acc": "5.628e-01", "epoch": 0.0572} {"step": 28605, "loss": 1.1711, "grad_norm": "3.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.122e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.953e-01", "anc_acc": "5.784e-01", "epoch": 0.05721} {"step": 28610, "loss": 1.0457, "grad_norm": "2.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.136e-01", "anc_loss": "2.563e-01", "dlm_acc": "8.895e-01", "anc_acc": "8.672e-01", "epoch": 0.05722} {"step": 28615, "loss": 1.3281, "grad_norm": "2.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.191e-01", "anc_loss": "6.623e-01", "dlm_acc": "7.328e-01", "anc_acc": "7.209e-01", "epoch": 0.05723} {"step": 28620, "loss": 1.2673, "grad_norm": "2.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.619e-01", "anc_loss": "1.025e+00", "dlm_acc": "5.711e-01", "anc_acc": "5.553e-01", "epoch": 0.05724} {"step": 28625, "loss": 1.1572, "grad_norm": "3.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.083e+00", "anc_loss": "1.186e+00", "dlm_acc": "5.872e-01", "anc_acc": "5.602e-01", "epoch": 0.05725} {"step": 28630, "loss": 1.1514, "grad_norm": "3.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.879e-01", "anc_loss": "9.641e-01", "dlm_acc": "7.118e-01", "anc_acc": "6.913e-01", "epoch": 0.05726} {"step": 28635, "loss": 0.8861, "grad_norm": "7.487e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.529e-01", "anc_loss": "1.626e-01", "dlm_acc": "9.092e-01", "anc_acc": "9.043e-01", "epoch": 0.05727} {"step": 28640, "loss": 1.0674, "grad_norm": "5.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.938e-01", "anc_loss": "2.065e-01", "dlm_acc": "8.646e-01", "anc_acc": "8.603e-01", "epoch": 0.05728} {"step": 28645, "loss": 1.2235, "grad_norm": "2.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.561e-01", "anc_loss": "4.363e-01", "dlm_acc": "8.489e-01", "anc_acc": "8.208e-01", "epoch": 0.05729} {"step": 28650, "loss": 1.4497, "grad_norm": "6.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.945e-01", "anc_loss": "7.712e-01", "dlm_acc": "7.798e-01", "anc_acc": "7.542e-01", "epoch": 0.0573} {"step": 28655, "loss": 0.846, "grad_norm": "2.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.109e-01", "anc_loss": "9.297e-01", "dlm_acc": "6.610e-01", "anc_acc": "6.297e-01", "epoch": 0.05731} {"step": 28660, "loss": 0.9313, "grad_norm": "3.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.416e-01", "anc_loss": "8.035e-01", "dlm_acc": "7.001e-01", "anc_acc": "6.838e-01", "epoch": 0.05732} {"step": 28665, "loss": 0.9555, "grad_norm": "3.798e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.016e-01", "anc_loss": "7.703e-01", "dlm_acc": "6.805e-01", "anc_acc": "6.612e-01", "epoch": 0.05733} {"step": 28670, "loss": 1.1254, "grad_norm": "4.858e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.371e-01", "anc_loss": "4.541e-01", "dlm_acc": "7.552e-01", "anc_acc": "7.466e-01", "epoch": 0.05734} {"step": 28675, "loss": 1.0512, "grad_norm": "2.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.645e-01", "anc_loss": "3.836e-01", "dlm_acc": "7.787e-01", "anc_acc": "7.699e-01", "epoch": 0.05735} {"step": 28680, "loss": 1.0886, "grad_norm": "3.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.701e-01", "anc_loss": "3.910e-01", "dlm_acc": "7.721e-01", "anc_acc": "7.627e-01", "epoch": 0.05736} {"step": 28685, "loss": 1.0241, "grad_norm": "2.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.420e-01", "anc_loss": "5.938e-01", "dlm_acc": "7.615e-01", "anc_acc": "7.458e-01", "epoch": 0.05737} {"step": 28690, "loss": 1.3113, "grad_norm": "2.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.805e-01", "anc_loss": "9.639e-01", "dlm_acc": "6.927e-01", "anc_acc": "6.733e-01", "epoch": 0.05738} {"step": 28695, "loss": 1.1049, "grad_norm": "3.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.001e-01", "anc_loss": "5.462e-01", "dlm_acc": "7.801e-01", "anc_acc": "7.610e-01", "epoch": 0.05739} {"step": 28700, "loss": 1.1289, "grad_norm": "7.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.766e-01", "anc_loss": "9.508e-01", "dlm_acc": "6.715e-01", "anc_acc": "6.519e-01", "epoch": 0.0574} {"step": 28705, "loss": 1.2238, "grad_norm": "3.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.527e-01", "anc_loss": "1.030e+00", "dlm_acc": "6.500e-01", "anc_acc": "6.316e-01", "epoch": 0.05741} {"step": 28710, "loss": 1.1303, "grad_norm": "1.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.694e-01", "anc_loss": "4.164e-01", "dlm_acc": "8.279e-01", "anc_acc": "8.093e-01", "epoch": 0.05742} {"step": 28715, "loss": 1.2069, "grad_norm": "4.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.902e-01", "anc_loss": "9.586e-01", "dlm_acc": "6.511e-01", "anc_acc": "6.377e-01", "epoch": 0.05743} {"step": 28720, "loss": 1.3781, "grad_norm": "3.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.547e-01", "anc_loss": "8.063e-01", "dlm_acc": "6.599e-01", "anc_acc": "6.446e-01", "epoch": 0.05744} {"step": 28725, "loss": 1.41, "grad_norm": "6.494e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.754e-01", "anc_loss": "9.334e-01", "dlm_acc": "5.725e-01", "anc_acc": "5.568e-01", "epoch": 0.05745} {"step": 28730, "loss": 1.1124, "grad_norm": "2.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.097e+00", "dlm_acc": "5.829e-01", "anc_acc": "5.533e-01", "epoch": 0.05746} {"step": 28735, "loss": 1.2089, "grad_norm": "7.494e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.321e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.743e-01", "anc_acc": "5.517e-01", "epoch": 0.05747} {"step": 28740, "loss": 1.0152, "grad_norm": "2.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.547e-01", "anc_loss": "8.230e-01", "dlm_acc": "7.214e-01", "anc_acc": "7.026e-01", "epoch": 0.05748} {"step": 28745, "loss": 0.9695, "grad_norm": "2.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.768e-01", "anc_loss": "7.457e-01", "dlm_acc": "7.262e-01", "anc_acc": "7.077e-01", "epoch": 0.05749} {"step": 28750, "loss": 1.2315, "grad_norm": "4.482e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.172e-01", "anc_loss": "9.203e-01", "dlm_acc": "6.851e-01", "anc_acc": "6.571e-01", "epoch": 0.0575} {"step": 28755, "loss": 1.1635, "grad_norm": "5.330e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.820e-01", "anc_loss": "1.073e+00", "dlm_acc": "6.167e-01", "anc_acc": "5.925e-01", "epoch": 0.05751} {"step": 28760, "loss": 1.2572, "grad_norm": "2.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.157e-01", "anc_loss": "8.899e-01", "dlm_acc": "7.314e-01", "anc_acc": "7.153e-01", "epoch": 0.05752} {"step": 28765, "loss": 0.8943, "grad_norm": "3.337e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.680e-01", "anc_loss": "3.916e-01", "dlm_acc": "8.735e-01", "anc_acc": "8.689e-01", "epoch": 0.05753} {"step": 28770, "loss": 1.1507, "grad_norm": "2.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.254e+00", "dlm_acc": "5.614e-01", "anc_acc": "5.371e-01", "epoch": 0.05754} {"step": 28775, "loss": 0.9854, "grad_norm": "4.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.109e-01", "anc_loss": "9.020e-01", "dlm_acc": "6.960e-01", "anc_acc": "6.708e-01", "epoch": 0.05755} {"step": 28780, "loss": 1.0096, "grad_norm": "3.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.000e-01", "anc_loss": "6.676e-01", "dlm_acc": "7.343e-01", "anc_acc": "7.076e-01", "epoch": 0.05756} {"step": 28785, "loss": 0.9776, "grad_norm": "1.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.168e-01", "anc_loss": "4.623e-01", "dlm_acc": "8.074e-01", "anc_acc": "7.896e-01", "epoch": 0.05757} {"step": 28790, "loss": 1.3933, "grad_norm": "5.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.648e-01", "anc_loss": "1.052e+00", "dlm_acc": "6.328e-01", "anc_acc": "6.126e-01", "epoch": 0.05758} {"step": 28795, "loss": 0.996, "grad_norm": "3.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.602e-01", "anc_loss": "6.508e-01", "dlm_acc": "7.652e-01", "anc_acc": "7.436e-01", "epoch": 0.05759} {"step": 28800, "loss": 0.9489, "grad_norm": "3.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.831e-01", "anc_loss": "2.615e-01", "dlm_acc": "9.103e-01", "anc_acc": "8.824e-01", "epoch": 0.0576} {"step": 28805, "loss": 1.338, "grad_norm": "5.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.110e+00", "dlm_acc": "6.254e-01", "anc_acc": "6.034e-01", "epoch": 0.05761} {"step": 28810, "loss": 1.0851, "grad_norm": "2.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.388e-01", "anc_loss": "8.983e-01", "dlm_acc": "6.957e-01", "anc_acc": "6.809e-01", "epoch": 0.05762} {"step": 28815, "loss": 0.8646, "grad_norm": "3.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.712e-01", "anc_loss": "4.216e-01", "dlm_acc": "8.345e-01", "anc_acc": "8.147e-01", "epoch": 0.05763} {"step": 28820, "loss": 1.2819, "grad_norm": "2.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.505e-01", "anc_loss": "9.388e-01", "dlm_acc": "6.934e-01", "anc_acc": "6.668e-01", "epoch": 0.05764} {"step": 28825, "loss": 1.0141, "grad_norm": "6.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.241e+00", "dlm_acc": "5.511e-01", "anc_acc": "5.286e-01", "epoch": 0.05765} {"step": 28830, "loss": 1.3529, "grad_norm": "4.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.426e-01", "anc_loss": "9.285e-01", "dlm_acc": "6.638e-01", "anc_acc": "6.367e-01", "epoch": 0.05766} {"step": 28835, "loss": 1.3928, "grad_norm": "8.202e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.883e-01", "anc_loss": "9.742e-01", "dlm_acc": "6.387e-01", "anc_acc": "6.123e-01", "epoch": 0.05767} {"step": 28840, "loss": 1.2565, "grad_norm": "2.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.027e-01", "anc_loss": "7.957e-01", "dlm_acc": "7.019e-01", "anc_acc": "6.735e-01", "epoch": 0.05768} {"step": 28845, "loss": 1.5517, "grad_norm": "3.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.918e-01", "anc_loss": "7.914e-01", "dlm_acc": "7.738e-01", "anc_acc": "7.480e-01", "epoch": 0.05769} {"step": 28850, "loss": 1.3502, "grad_norm": "7.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.152e-01", "anc_loss": "9.988e-01", "dlm_acc": "7.054e-01", "anc_acc": "6.894e-01", "epoch": 0.0577} {"step": 28855, "loss": 1.0546, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.820e-01", "anc_loss": "7.195e-01", "dlm_acc": "5.500e-01", "anc_acc": "5.326e-01", "epoch": 0.05771} {"step": 28860, "loss": 1.1297, "grad_norm": "2.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.227e+00", "dlm_acc": "4.783e-01", "anc_acc": "4.578e-01", "epoch": 0.05772} {"step": 28865, "loss": 0.8355, "grad_norm": "2.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.809e-01", "anc_loss": "8.094e-01", "dlm_acc": "5.563e-01", "anc_acc": "5.484e-01", "epoch": 0.05773} {"step": 28870, "loss": 0.9625, "grad_norm": "3.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.648e-01", "anc_loss": "8.953e-01", "dlm_acc": "6.698e-01", "anc_acc": "6.246e-01", "epoch": 0.05774} {"step": 28875, "loss": 1.6017, "grad_norm": "1.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.904e-01", "anc_acc": "5.676e-01", "epoch": 0.05775} {"step": 28880, "loss": 1.3218, "grad_norm": "2.928e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.898e-01", "anc_loss": "1.089e+00", "dlm_acc": "6.504e-01", "anc_acc": "6.229e-01", "epoch": 0.05776} {"step": 28885, "loss": 1.6995, "grad_norm": "6.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.480e+00", "anc_loss": "1.583e+00", "dlm_acc": "4.744e-01", "anc_acc": "4.472e-01", "epoch": 0.05777} {"step": 28890, "loss": 1.2668, "grad_norm": "3.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.282e+00", "dlm_acc": "5.957e-01", "anc_acc": "5.594e-01", "epoch": 0.05778} {"step": 28895, "loss": 1.2182, "grad_norm": "2.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.222e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.522e-01", "anc_acc": "5.256e-01", "epoch": 0.05779} {"step": 28900, "loss": 1.1477, "grad_norm": "3.339e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.547e-01", "anc_loss": "7.961e-01", "dlm_acc": "5.590e-01", "anc_acc": "5.491e-01", "epoch": 0.0578} {"step": 28905, "loss": 1.27, "grad_norm": "2.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.141e-01", "anc_loss": "7.359e-01", "dlm_acc": "4.691e-01", "anc_acc": "4.571e-01", "epoch": 0.05781} {"step": 28910, "loss": 1.2085, "grad_norm": "3.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.188e-01", "anc_loss": "7.367e-01", "dlm_acc": "4.675e-01", "anc_acc": "4.574e-01", "epoch": 0.05782} {"step": 28915, "loss": 1.5677, "grad_norm": "5.325e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.424e+00", "anc_loss": "1.518e+00", "dlm_acc": "5.292e-01", "anc_acc": "5.111e-01", "epoch": 0.05783} {"step": 28920, "loss": 1.1604, "grad_norm": "3.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.146e+00", "dlm_acc": "6.016e-01", "anc_acc": "5.818e-01", "epoch": 0.05784} {"step": 28925, "loss": 1.2097, "grad_norm": "5.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.236e+00", "dlm_acc": "5.648e-01", "anc_acc": "5.357e-01", "epoch": 0.05785} {"step": 28930, "loss": 0.9525, "grad_norm": "3.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.566e-01", "anc_loss": "9.648e-01", "dlm_acc": "6.448e-01", "anc_acc": "6.152e-01", "epoch": 0.05786} {"step": 28935, "loss": 1.2355, "grad_norm": "4.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.910e-01", "anc_loss": "7.594e-01", "dlm_acc": "7.208e-01", "anc_acc": "6.990e-01", "epoch": 0.05787} {"step": 28940, "loss": 1.8965, "grad_norm": "3.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.089e+00", "anc_loss": "2.147e+00", "dlm_acc": "3.425e-01", "anc_acc": "3.309e-01", "epoch": 0.05788} {"step": 28945, "loss": 1.3978, "grad_norm": "3.771e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.653e+00", "anc_loss": "1.741e+00", "dlm_acc": "4.393e-01", "anc_acc": "4.223e-01", "epoch": 0.05789} {"step": 28950, "loss": 1.1428, "grad_norm": "4.222e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.859e-01", "anc_loss": "7.668e-01", "dlm_acc": "6.387e-01", "anc_acc": "6.059e-01", "epoch": 0.0579} {"step": 28955, "loss": 1.6718, "grad_norm": "2.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.663e+00", "anc_loss": "1.764e+00", "dlm_acc": "4.408e-01", "anc_acc": "4.202e-01", "epoch": 0.05791} {"step": 28960, "loss": 1.1937, "grad_norm": "3.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.668e-01", "anc_loss": "9.691e-01", "dlm_acc": "6.276e-01", "anc_acc": "5.886e-01", "epoch": 0.05792} {"step": 28965, "loss": 1.404, "grad_norm": "2.878e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.205e+00", "dlm_acc": "5.719e-01", "anc_acc": "5.393e-01", "epoch": 0.05793} {"step": 28970, "loss": 1.5297, "grad_norm": "3.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.562e+00", "dlm_acc": "5.092e-01", "anc_acc": "4.845e-01", "epoch": 0.05794} {"step": 28975, "loss": 1.3396, "grad_norm": "4.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.058e+00", "anc_loss": "2.136e+00", "dlm_acc": "3.237e-01", "anc_acc": "3.031e-01", "epoch": 0.05795} {"step": 28980, "loss": 1.2234, "grad_norm": "2.818e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.458e-01", "anc_acc": "5.229e-01", "epoch": 0.05796} {"step": 28985, "loss": 1.1742, "grad_norm": "5.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.640e-01", "anc_acc": "5.349e-01", "epoch": 0.05797} {"step": 28990, "loss": 0.883, "grad_norm": "3.694e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.624e-01", "anc_loss": "7.336e-01", "dlm_acc": "6.935e-01", "anc_acc": "6.662e-01", "epoch": 0.05798} {"step": 28995, "loss": 1.4878, "grad_norm": "6.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.449e+00", "dlm_acc": "5.184e-01", "anc_acc": "4.966e-01", "epoch": 0.05799} {"step": 29000, "loss": 1.3814, "grad_norm": "2.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.949e-01", "anc_loss": "1.070e+00", "dlm_acc": "6.007e-01", "anc_acc": "5.823e-01", "epoch": 0.058} {"step": 29005, "loss": 1.3505, "grad_norm": "4.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.949e-01", "anc_loss": "8.445e-01", "dlm_acc": "6.206e-01", "anc_acc": "6.062e-01", "epoch": 0.05801} {"step": 29010, "loss": 1.291, "grad_norm": "1.029e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.163e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.265e-01", "anc_acc": "4.896e-01", "epoch": 0.05802} {"step": 29015, "loss": 1.3239, "grad_norm": "8.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.930e-01", "anc_loss": "9.984e-01", "dlm_acc": "2.268e-01", "anc_acc": "2.281e-01", "epoch": 0.05803} {"step": 29020, "loss": 1.4596, "grad_norm": "4.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.030e+00", "dlm_acc": "2.303e-01", "anc_acc": "2.270e-01", "epoch": 0.05804} {"step": 29025, "loss": 1.1704, "grad_norm": "2.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.102e+00", "dlm_acc": "4.886e-01", "anc_acc": "4.717e-01", "epoch": 0.05805} {"step": 29030, "loss": 1.2286, "grad_norm": "3.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.383e+00", "anc_loss": "1.473e+00", "dlm_acc": "4.680e-01", "anc_acc": "4.422e-01", "epoch": 0.05806} {"step": 29035, "loss": 1.4722, "grad_norm": "8.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.170e+00", "dlm_acc": "5.306e-01", "anc_acc": "5.073e-01", "epoch": 0.05807} {"step": 29040, "loss": 1.4385, "grad_norm": "4.733e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.179e+00", "dlm_acc": "6.224e-01", "anc_acc": "5.950e-01", "epoch": 0.05808} {"step": 29045, "loss": 1.925, "grad_norm": "3.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.787e+00", "anc_loss": "1.887e+00", "dlm_acc": "4.340e-01", "anc_acc": "4.084e-01", "epoch": 0.05809} {"step": 29050, "loss": 1.1919, "grad_norm": "4.834e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.458e+00", "anc_loss": "1.664e+00", "dlm_acc": "5.154e-01", "anc_acc": "4.804e-01", "epoch": 0.0581} {"step": 29055, "loss": 1.4079, "grad_norm": "3.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.674e-01", "anc_acc": "5.242e-01", "epoch": 0.05811} {"step": 29060, "loss": 0.9516, "grad_norm": "3.523e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.773e-01", "anc_loss": "1.086e+00", "dlm_acc": "6.262e-01", "anc_acc": "5.954e-01", "epoch": 0.05812} {"step": 29065, "loss": 1.3296, "grad_norm": "3.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.117e+00", "dlm_acc": "5.869e-01", "anc_acc": "5.524e-01", "epoch": 0.05813} {"step": 29070, "loss": 1.1904, "grad_norm": "3.101e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.268e+00", "dlm_acc": "5.682e-01", "anc_acc": "5.436e-01", "epoch": 0.05814} {"step": 29075, "loss": 1.2711, "grad_norm": "3.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.437e+00", "dlm_acc": "4.760e-01", "anc_acc": "4.552e-01", "epoch": 0.05815} {"step": 29080, "loss": 1.2024, "grad_norm": "3.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.722e+00", "anc_loss": "1.793e+00", "dlm_acc": "3.774e-01", "anc_acc": "3.612e-01", "epoch": 0.05816} {"step": 29085, "loss": 1.0282, "grad_norm": "3.757e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e-01", "anc_loss": "1.739e-01", "dlm_acc": "9.248e-01", "anc_acc": "9.175e-01", "epoch": 0.05817} {"step": 29090, "loss": 1.1448, "grad_norm": "2.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.532e-01", "anc_acc": "5.245e-01", "epoch": 0.05818} {"step": 29095, "loss": 1.3825, "grad_norm": "3.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.358e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.554e-01", "anc_acc": "5.319e-01", "epoch": 0.05819} {"step": 29100, "loss": 1.1851, "grad_norm": "3.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.301e+00", "anc_loss": "1.363e+00", "dlm_acc": "3.989e-01", "anc_acc": "3.767e-01", "epoch": 0.0582} {"step": 29105, "loss": 0.9484, "grad_norm": "3.373e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.078e-01", "anc_loss": "1.040e+00", "dlm_acc": "6.443e-01", "anc_acc": "6.035e-01", "epoch": 0.05821} {"step": 29110, "loss": 0.8494, "grad_norm": "3.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.438e-01", "anc_loss": "9.574e-01", "dlm_acc": "6.381e-01", "anc_acc": "6.059e-01", "epoch": 0.05822} {"step": 29115, "loss": 0.8888, "grad_norm": "3.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.691e-01", "anc_loss": "9.719e-01", "dlm_acc": "6.312e-01", "anc_acc": "6.019e-01", "epoch": 0.05823} {"step": 29120, "loss": 1.311, "grad_norm": "3.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.336e+00", "dlm_acc": "6.114e-01", "anc_acc": "5.751e-01", "epoch": 0.05824} {"step": 29125, "loss": 0.6999, "grad_norm": "4.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.469e-01", "anc_loss": "2.957e-01", "dlm_acc": "8.360e-01", "anc_acc": "8.091e-01", "epoch": 0.05825} {"step": 29130, "loss": 0.8473, "grad_norm": "3.804e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.562e-01", "anc_loss": "9.422e-01", "dlm_acc": "6.321e-01", "anc_acc": "6.080e-01", "epoch": 0.05826} {"step": 29135, "loss": 1.2017, "grad_norm": "4.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.222e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.491e-01", "anc_acc": "5.243e-01", "epoch": 0.05827} {"step": 29140, "loss": 1.0696, "grad_norm": "5.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.221e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.837e-01", "anc_acc": "5.463e-01", "epoch": 0.05828} {"step": 29145, "loss": 0.7366, "grad_norm": "3.713e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.437e-01", "anc_loss": "5.824e-01", "dlm_acc": "6.279e-01", "anc_acc": "6.130e-01", "epoch": 0.05829} {"step": 29150, "loss": 0.8634, "grad_norm": "3.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.969e-01", "anc_loss": "5.301e-01", "dlm_acc": "6.474e-01", "anc_acc": "6.379e-01", "epoch": 0.0583} {"step": 29155, "loss": 0.8948, "grad_norm": "3.431e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.273e-01", "anc_loss": "4.496e-01", "dlm_acc": "6.967e-01", "anc_acc": "6.879e-01", "epoch": 0.05831} {"step": 29160, "loss": 1.0867, "grad_norm": "2.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.090e-01", "anc_loss": "7.711e-01", "dlm_acc": "6.245e-01", "anc_acc": "6.081e-01", "epoch": 0.05832} {"step": 29165, "loss": 1.2567, "grad_norm": "2.525e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.586e-01", "anc_loss": "1.085e+00", "dlm_acc": "6.568e-01", "anc_acc": "6.152e-01", "epoch": 0.05833} {"step": 29170, "loss": 0.945, "grad_norm": "6.694e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.437e+00", "dlm_acc": "5.423e-01", "anc_acc": "5.222e-01", "epoch": 0.05834} {"step": 29175, "loss": 0.8975, "grad_norm": "3.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.414e-01", "anc_loss": "8.641e-01", "dlm_acc": "4.812e-01", "anc_acc": "4.752e-01", "epoch": 0.05835} {"step": 29180, "loss": 1.0643, "grad_norm": "6.019e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.461e-01", "anc_loss": "8.523e-01", "dlm_acc": "4.766e-01", "anc_acc": "4.743e-01", "epoch": 0.05836} {"step": 29185, "loss": 0.8872, "grad_norm": "4.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.094e-01", "anc_loss": "7.109e-01", "dlm_acc": "4.760e-01", "anc_acc": "4.760e-01", "epoch": 0.05837} {"step": 29190, "loss": 1.1407, "grad_norm": "3.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.617e-01", "anc_loss": "7.641e-01", "dlm_acc": "4.722e-01", "anc_acc": "4.720e-01", "epoch": 0.05838} {"step": 29195, "loss": 1.1027, "grad_norm": "5.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.016e-01", "anc_loss": "8.047e-01", "dlm_acc": "4.754e-01", "anc_acc": "4.751e-01", "epoch": 0.05839} {"step": 29200, "loss": 1.039, "grad_norm": "3.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.119e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.152e-01", "epoch": 0.0584} {"step": 29205, "loss": 1.1979, "grad_norm": "4.274e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.161e+00", "dlm_acc": "4.971e-01", "anc_acc": "4.755e-01", "epoch": 0.05841} {"step": 29210, "loss": 1.1653, "grad_norm": "4.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.080e+00", "dlm_acc": "5.589e-01", "anc_acc": "5.370e-01", "epoch": 0.05842} {"step": 29215, "loss": 1.3842, "grad_norm": "3.626e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.221e+00", "anc_loss": "1.323e+00", "dlm_acc": "5.136e-01", "anc_acc": "4.929e-01", "epoch": 0.05843} {"step": 29220, "loss": 1.6126, "grad_norm": "2.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.619e+00", "anc_loss": "1.762e+00", "dlm_acc": "4.921e-01", "anc_acc": "4.655e-01", "epoch": 0.05844} {"step": 29225, "loss": 1.1728, "grad_norm": "2.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.674e-01", "anc_acc": "5.466e-01", "epoch": 0.05845} {"step": 29230, "loss": 1.3577, "grad_norm": "2.986e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.499e+00", "dlm_acc": "5.089e-01", "anc_acc": "4.846e-01", "epoch": 0.05846} {"step": 29235, "loss": 1.6125, "grad_norm": "8.958e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.659e+00", "anc_loss": "1.755e+00", "dlm_acc": "4.496e-01", "anc_acc": "4.242e-01", "epoch": 0.05847} {"step": 29240, "loss": 1.0551, "grad_norm": "3.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.217e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.372e-01", "anc_acc": "5.174e-01", "epoch": 0.05848} {"step": 29245, "loss": 1.341, "grad_norm": "3.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.415e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.446e-01", "epoch": 0.05849} {"step": 29250, "loss": 1.2584, "grad_norm": "3.667e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.995e+00", "anc_loss": "2.041e+00", "dlm_acc": "3.204e-01", "anc_acc": "3.089e-01", "epoch": 0.0585} {"step": 29255, "loss": 1.1181, "grad_norm": "3.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.621e-01", "anc_acc": "5.236e-01", "epoch": 0.05851} {"step": 29260, "loss": 1.2713, "grad_norm": "3.977e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.932e+00", "anc_loss": "1.998e+00", "dlm_acc": "3.387e-01", "anc_acc": "3.234e-01", "epoch": 0.05852} {"step": 29265, "loss": 1.2074, "grad_norm": "1.794e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.321e+00", "dlm_acc": "5.601e-01", "anc_acc": "5.193e-01", "epoch": 0.05853} {"step": 29270, "loss": 1.4566, "grad_norm": "3.709e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.388e+00", "dlm_acc": "5.400e-01", "anc_acc": "5.134e-01", "epoch": 0.05854} {"step": 29275, "loss": 1.3782, "grad_norm": "7.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.520e+00", "anc_loss": "1.628e+00", "dlm_acc": "4.719e-01", "anc_acc": "4.453e-01", "epoch": 0.05855} {"step": 29280, "loss": 0.9739, "grad_norm": "3.208e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.896e-01", "anc_acc": "5.516e-01", "epoch": 0.05856} {"step": 29285, "loss": 1.3261, "grad_norm": "4.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.947e-01", "anc_acc": "5.556e-01", "epoch": 0.05857} {"step": 29290, "loss": 0.9612, "grad_norm": "4.862e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.113e+00", "dlm_acc": "6.045e-01", "anc_acc": "5.743e-01", "epoch": 0.05858} {"step": 29295, "loss": 1.1563, "grad_norm": "2.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.856e-01", "anc_acc": "5.522e-01", "epoch": 0.05859} {"step": 29300, "loss": 1.2842, "grad_norm": "2.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.117e-01", "anc_loss": "8.109e-01", "dlm_acc": "6.855e-01", "anc_acc": "6.541e-01", "epoch": 0.0586} {"step": 29305, "loss": 1.3024, "grad_norm": "2.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.060e+00", "anc_loss": "1.184e+00", "dlm_acc": "6.236e-01", "anc_acc": "5.882e-01", "epoch": 0.05861} {"step": 29310, "loss": 1.5624, "grad_norm": "4.273e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.215e+00", "anc_loss": "1.351e+00", "dlm_acc": "5.864e-01", "anc_acc": "5.562e-01", "epoch": 0.05862} {"step": 29315, "loss": 1.7731, "grad_norm": "4.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.315e+00", "dlm_acc": "5.625e-01", "anc_acc": "5.254e-01", "epoch": 0.05863} {"step": 29320, "loss": 1.5002, "grad_norm": "4.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.502e+00", "dlm_acc": "4.746e-01", "anc_acc": "4.519e-01", "epoch": 0.05864} {"step": 29325, "loss": 1.323, "grad_norm": "2.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.318e+00", "dlm_acc": "4.720e-01", "anc_acc": "4.520e-01", "epoch": 0.05865} {"step": 29330, "loss": 0.7757, "grad_norm": "6.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.609e-01", "anc_loss": "7.418e-01", "dlm_acc": "6.699e-01", "anc_acc": "6.410e-01", "epoch": 0.05866} {"step": 29335, "loss": 0.9603, "grad_norm": "2.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.221e+00", "anc_loss": "1.328e+00", "dlm_acc": "5.823e-01", "anc_acc": "5.534e-01", "epoch": 0.05867} {"step": 29340, "loss": 0.7048, "grad_norm": "7.924e-02", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.147e+00", "dlm_acc": "5.573e-01", "anc_acc": "5.337e-01", "epoch": 0.05868} {"step": 29345, "loss": 1.1971, "grad_norm": "3.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.279e+00", "anc_loss": "1.369e+00", "dlm_acc": "5.729e-01", "anc_acc": "5.530e-01", "epoch": 0.05869} {"step": 29350, "loss": 0.99, "grad_norm": "3.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.926e-01", "anc_acc": "5.719e-01", "epoch": 0.0587} {"step": 29355, "loss": 1.1197, "grad_norm": "3.524e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.225e-01", "anc_acc": "4.979e-01", "epoch": 0.05871} {"step": 29360, "loss": 0.887, "grad_norm": "1.084e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.820e-01", "anc_loss": "7.195e-01", "dlm_acc": "5.656e-01", "anc_acc": "5.510e-01", "epoch": 0.05872} {"step": 29365, "loss": 1.3031, "grad_norm": "4.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.295e+00", "dlm_acc": "4.594e-01", "anc_acc": "4.375e-01", "epoch": 0.05873} {"step": 29370, "loss": 1.4362, "grad_norm": "6.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.494e+00", "anc_loss": "1.647e+00", "dlm_acc": "3.935e-01", "anc_acc": "3.569e-01", "epoch": 0.05874} {"step": 29375, "loss": 1.4004, "grad_norm": "3.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.664e+00", "anc_loss": "1.845e+00", "dlm_acc": "3.644e-01", "anc_acc": "3.199e-01", "epoch": 0.05875} {"step": 29380, "loss": 1.6078, "grad_norm": "2.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.977e+00", "anc_loss": "2.108e+00", "dlm_acc": "3.188e-01", "anc_acc": "2.857e-01", "epoch": 0.05876} {"step": 29385, "loss": 1.4468, "grad_norm": "3.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.761e+00", "dlm_acc": "4.838e-01", "anc_acc": "4.543e-01", "epoch": 0.05877} {"step": 29390, "loss": 1.238, "grad_norm": "4.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.695e-01", "anc_loss": "9.766e-01", "dlm_acc": "6.454e-01", "anc_acc": "6.167e-01", "epoch": 0.05878} {"step": 29395, "loss": 1.9064, "grad_norm": "3.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.021e-01", "anc_acc": "4.779e-01", "epoch": 0.05879} {"step": 29400, "loss": 2.0979, "grad_norm": "6.868e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.603e+00", "anc_loss": "1.703e+00", "dlm_acc": "4.648e-01", "anc_acc": "4.460e-01", "epoch": 0.0588} {"step": 29405, "loss": 1.6761, "grad_norm": "5.280e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.922e-01", "anc_loss": "9.797e-01", "dlm_acc": "5.343e-01", "anc_acc": "4.972e-01", "epoch": 0.05881} {"step": 29410, "loss": 1.074, "grad_norm": "6.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.367e-01", "anc_loss": "1.062e+00", "dlm_acc": "6.306e-01", "anc_acc": "5.956e-01", "epoch": 0.05882} {"step": 29415, "loss": 1.3555, "grad_norm": "2.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.514e-01", "anc_acc": "5.225e-01", "epoch": 0.05883} {"step": 29420, "loss": 1.0375, "grad_norm": "2.458e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.914e-01", "anc_loss": "8.516e-01", "dlm_acc": "5.455e-01", "anc_acc": "5.245e-01", "epoch": 0.05884} {"step": 29425, "loss": 1.4369, "grad_norm": "3.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.556e+00", "anc_loss": "1.689e+00", "dlm_acc": "5.094e-01", "anc_acc": "4.760e-01", "epoch": 0.05885} {"step": 29430, "loss": 1.0369, "grad_norm": "3.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.370e-01", "anc_acc": "4.978e-01", "epoch": 0.05886} {"step": 29435, "loss": 1.0704, "grad_norm": "2.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.631e-01", "anc_loss": "6.355e-01", "dlm_acc": "6.990e-01", "anc_acc": "6.700e-01", "epoch": 0.05887} {"step": 29440, "loss": 1.0463, "grad_norm": "3.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.316e-01", "anc_loss": "8.027e-01", "dlm_acc": "6.395e-01", "anc_acc": "6.151e-01", "epoch": 0.05888} {"step": 29445, "loss": 1.383, "grad_norm": "4.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.709e-01", "anc_acc": "5.433e-01", "epoch": 0.05889} {"step": 29450, "loss": 1.3085, "grad_norm": "4.741e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.625e-01", "anc_loss": "8.609e-01", "dlm_acc": "6.666e-01", "anc_acc": "6.356e-01", "epoch": 0.0589} {"step": 29455, "loss": 1.2205, "grad_norm": "7.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.098e+00", "dlm_acc": "6.144e-01", "anc_acc": "5.872e-01", "epoch": 0.05891} {"step": 29460, "loss": 1.5145, "grad_norm": "3.938e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.184e+00", "dlm_acc": "4.921e-01", "anc_acc": "4.699e-01", "epoch": 0.05892} {"step": 29465, "loss": 1.3063, "grad_norm": "2.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.797e-01", "anc_acc": "5.549e-01", "epoch": 0.05893} {"step": 29470, "loss": 1.8398, "grad_norm": "6.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.859e+00", "anc_loss": "1.940e+00", "dlm_acc": "4.284e-01", "anc_acc": "4.122e-01", "epoch": 0.05894} {"step": 29475, "loss": 1.5935, "grad_norm": "2.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.847e+00", "anc_loss": "2.891e+00", "dlm_acc": "4.662e-02", "anc_acc": "4.706e-02", "epoch": 0.05895} {"step": 29480, "loss": 0.9209, "grad_norm": "2.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.066e-01", "anc_loss": "6.910e-01", "dlm_acc": "7.302e-01", "anc_acc": "7.046e-01", "epoch": 0.05896} {"step": 29485, "loss": 1.0452, "grad_norm": "1.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.621e-01", "anc_loss": "7.633e-01", "dlm_acc": "7.323e-01", "anc_acc": "6.979e-01", "epoch": 0.05897} {"step": 29490, "loss": 1.2861, "grad_norm": "2.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.146e+00", "anc_loss": "1.279e+00", "dlm_acc": "6.121e-01", "anc_acc": "5.712e-01", "epoch": 0.05898} {"step": 29495, "loss": 1.3197, "grad_norm": "4.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.892e-01", "anc_acc": "5.499e-01", "epoch": 0.05899} {"step": 29500, "loss": 1.2113, "grad_norm": "2.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.646e-01", "anc_acc": "5.381e-01", "epoch": 0.059} {"step": 29505, "loss": 1.2637, "grad_norm": "3.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.286e-01", "anc_acc": "4.951e-01", "epoch": 0.05901} {"step": 29510, "loss": 1.4231, "grad_norm": "3.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.508e+00", "dlm_acc": "5.376e-01", "anc_acc": "5.075e-01", "epoch": 0.05902} {"step": 29515, "loss": 1.2416, "grad_norm": "2.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.451e+00", "dlm_acc": "5.223e-01", "anc_acc": "4.948e-01", "epoch": 0.05903} {"step": 29520, "loss": 1.4066, "grad_norm": "4.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.650e-01", "anc_acc": "5.425e-01", "epoch": 0.05904} {"step": 29525, "loss": 1.0923, "grad_norm": "2.643e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.197e+00", "dlm_acc": "6.012e-01", "anc_acc": "5.691e-01", "epoch": 0.05905} {"step": 29530, "loss": 1.0308, "grad_norm": "6.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.215e+00", "dlm_acc": "5.661e-01", "anc_acc": "5.401e-01", "epoch": 0.05906} {"step": 29535, "loss": 0.9349, "grad_norm": "6.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.023e-01", "anc_loss": "9.844e-01", "dlm_acc": "6.107e-01", "anc_acc": "5.858e-01", "epoch": 0.05907} {"step": 29540, "loss": 0.7834, "grad_norm": "3.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.609e-01", "anc_loss": "1.013e+00", "dlm_acc": "6.819e-01", "anc_acc": "6.414e-01", "epoch": 0.05908} {"step": 29545, "loss": 1.3159, "grad_norm": "3.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.239e+00", "anc_loss": "2.295e+00", "dlm_acc": "2.421e-01", "anc_acc": "2.320e-01", "epoch": 0.05909} {"step": 29550, "loss": 1.1094, "grad_norm": "3.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.094e+00", "anc_loss": "2.178e+00", "dlm_acc": "3.144e-01", "anc_acc": "2.970e-01", "epoch": 0.0591} {"step": 29555, "loss": 1.0573, "grad_norm": "4.022e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.845e-01", "anc_acc": "5.556e-01", "epoch": 0.05911} {"step": 29560, "loss": 1.0283, "grad_norm": "2.397e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.187e-01", "anc_loss": "9.910e-01", "dlm_acc": "6.235e-01", "anc_acc": "5.985e-01", "epoch": 0.05912} {"step": 29565, "loss": 1.6471, "grad_norm": "4.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.316e+00", "dlm_acc": "6.015e-01", "anc_acc": "5.786e-01", "epoch": 0.05913} {"step": 29570, "loss": 1.1198, "grad_norm": "3.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.429e+00", "dlm_acc": "5.419e-01", "anc_acc": "5.172e-01", "epoch": 0.05914} {"step": 29575, "loss": 1.4437, "grad_norm": "3.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.256e-01", "epoch": 0.05915} {"step": 29580, "loss": 1.2116, "grad_norm": "1.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.296e+00", "dlm_acc": "5.958e-01", "anc_acc": "5.682e-01", "epoch": 0.05916} {"step": 29585, "loss": 1.2478, "grad_norm": "8.156e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.369e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.964e-01", "anc_acc": "5.792e-01", "epoch": 0.05917} {"step": 29590, "loss": 1.1151, "grad_norm": "5.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.854e-01", "anc_acc": "5.648e-01", "epoch": 0.05918} {"step": 29595, "loss": 1.0399, "grad_norm": "8.773e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.360e-01", "epoch": 0.05919} {"step": 29600, "loss": 1.3918, "grad_norm": "3.095e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.400e+00", "dlm_acc": "5.959e-01", "anc_acc": "5.710e-01", "epoch": 0.0592} {"step": 29605, "loss": 1.1214, "grad_norm": "4.281e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.368e+00", "anc_loss": "1.439e+00", "dlm_acc": "4.654e-01", "anc_acc": "4.471e-01", "epoch": 0.05921} {"step": 29610, "loss": 1.3148, "grad_norm": "5.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.161e+00", "dlm_acc": "5.261e-01", "anc_acc": "5.020e-01", "epoch": 0.05922} {"step": 29615, "loss": 0.9236, "grad_norm": "3.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.566e-01", "anc_loss": "8.762e-01", "dlm_acc": "6.922e-01", "anc_acc": "6.511e-01", "epoch": 0.05923} {"step": 29620, "loss": 1.3882, "grad_norm": "2.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.015e+00", "anc_loss": "1.118e+00", "dlm_acc": "6.042e-01", "anc_acc": "5.748e-01", "epoch": 0.05924} {"step": 29625, "loss": 1.5559, "grad_norm": "3.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.227e+00", "dlm_acc": "6.137e-01", "anc_acc": "5.896e-01", "epoch": 0.05925} {"step": 29630, "loss": 1.0743, "grad_norm": "2.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.117e-01", "anc_loss": "1.025e+00", "dlm_acc": "6.018e-01", "anc_acc": "5.652e-01", "epoch": 0.05926} {"step": 29635, "loss": 1.5486, "grad_norm": "2.875e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.365e+00", "anc_loss": "1.481e+00", "dlm_acc": "5.135e-01", "anc_acc": "4.807e-01", "epoch": 0.05927} {"step": 29640, "loss": 1.3698, "grad_norm": "3.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.418e+00", "anc_loss": "1.558e+00", "dlm_acc": "5.586e-01", "anc_acc": "5.223e-01", "epoch": 0.05928} {"step": 29645, "loss": 1.1528, "grad_norm": "2.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.841e-01", "anc_loss": "6.432e-01", "dlm_acc": "7.831e-01", "anc_acc": "7.653e-01", "epoch": 0.05929} {"step": 29650, "loss": 1.4964, "grad_norm": "3.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.320e-01", "anc_loss": "7.859e-01", "dlm_acc": "7.101e-01", "anc_acc": "6.936e-01", "epoch": 0.0593} {"step": 29655, "loss": 1.2291, "grad_norm": "3.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.292e-01", "anc_acc": "4.964e-01", "epoch": 0.05931} {"step": 29660, "loss": 1.3003, "grad_norm": "3.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.385e+00", "dlm_acc": "4.837e-01", "anc_acc": "4.591e-01", "epoch": 0.05932} {"step": 29665, "loss": 1.221, "grad_norm": "3.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.225e+00", "dlm_acc": "6.105e-01", "anc_acc": "5.862e-01", "epoch": 0.05933} {"step": 29670, "loss": 1.5672, "grad_norm": "4.650e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.677e+00", "dlm_acc": "5.210e-01", "anc_acc": "4.953e-01", "epoch": 0.05934} {"step": 29675, "loss": 1.3598, "grad_norm": "3.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.376e+00", "dlm_acc": "5.415e-01", "anc_acc": "5.208e-01", "epoch": 0.05935} {"step": 29680, "loss": 1.1411, "grad_norm": "2.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.048e+00", "dlm_acc": "3.545e-01", "anc_acc": "3.526e-01", "epoch": 0.05936} {"step": 29685, "loss": 1.4173, "grad_norm": "4.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.364e+00", "anc_loss": "1.440e+00", "dlm_acc": "4.293e-01", "anc_acc": "4.134e-01", "epoch": 0.05937} {"step": 29690, "loss": 1.5172, "grad_norm": "4.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.453e+00", "anc_loss": "1.558e+00", "dlm_acc": "5.203e-01", "anc_acc": "4.984e-01", "epoch": 0.05938} {"step": 29695, "loss": 1.4507, "grad_norm": "2.313e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.550e+00", "dlm_acc": "5.140e-01", "anc_acc": "4.902e-01", "epoch": 0.05939} {"step": 29700, "loss": 1.2864, "grad_norm": "4.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.389e+00", "dlm_acc": "5.350e-01", "anc_acc": "5.098e-01", "epoch": 0.0594} {"step": 29705, "loss": 1.7558, "grad_norm": "7.119e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.194e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.701e-01", "anc_acc": "5.534e-01", "epoch": 0.05941} {"step": 29710, "loss": 1.6781, "grad_norm": "5.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.151e+00", "dlm_acc": "5.939e-01", "anc_acc": "5.745e-01", "epoch": 0.05942} {"step": 29715, "loss": 1.0468, "grad_norm": "3.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.859e-01", "anc_loss": "8.797e-01", "dlm_acc": "6.395e-01", "anc_acc": "6.191e-01", "epoch": 0.05943} {"step": 29720, "loss": 1.1422, "grad_norm": "4.877e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.080e+00", "dlm_acc": "5.713e-01", "anc_acc": "5.526e-01", "epoch": 0.05944} {"step": 29725, "loss": 1.3428, "grad_norm": "2.482e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.556e+00", "anc_loss": "1.675e+00", "dlm_acc": "4.889e-01", "anc_acc": "4.620e-01", "epoch": 0.05945} {"step": 29730, "loss": 1.1773, "grad_norm": "4.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.580e+00", "dlm_acc": "5.240e-01", "anc_acc": "4.991e-01", "epoch": 0.05946} {"step": 29735, "loss": 0.8241, "grad_norm": "1.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.387e-01", "anc_loss": "9.057e-01", "dlm_acc": "6.539e-01", "anc_acc": "6.320e-01", "epoch": 0.05947} {"step": 29740, "loss": 1.5669, "grad_norm": "3.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.713e-01", "anc_acc": "5.464e-01", "epoch": 0.05948} {"step": 29745, "loss": 1.3075, "grad_norm": "4.410e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.231e+00", "dlm_acc": "6.318e-01", "anc_acc": "6.091e-01", "epoch": 0.05949} {"step": 29750, "loss": 1.1272, "grad_norm": "3.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.393e+00", "dlm_acc": "5.096e-01", "anc_acc": "4.886e-01", "epoch": 0.0595} {"step": 29755, "loss": 1.5229, "grad_norm": "5.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.641e-01", "anc_acc": "5.388e-01", "epoch": 0.05951} {"step": 29760, "loss": 1.3131, "grad_norm": "3.547e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.196e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.323e-01", "anc_acc": "5.073e-01", "epoch": 0.05952} {"step": 29765, "loss": 1.5091, "grad_norm": "3.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.202e+00", "dlm_acc": "5.780e-01", "anc_acc": "5.558e-01", "epoch": 0.05953} {"step": 29770, "loss": 1.4974, "grad_norm": "3.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.378e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.253e-01", "anc_acc": "4.925e-01", "epoch": 0.05954} {"step": 29775, "loss": 1.2102, "grad_norm": "3.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.089e-01", "anc_loss": "9.588e-01", "dlm_acc": "5.736e-01", "anc_acc": "5.574e-01", "epoch": 0.05955} {"step": 29780, "loss": 1.1113, "grad_norm": "2.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.340e-01", "anc_loss": "7.676e-01", "dlm_acc": "6.096e-01", "anc_acc": "5.980e-01", "epoch": 0.05956} {"step": 29785, "loss": 0.7495, "grad_norm": "2.326e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.535e-01", "anc_loss": "7.980e-01", "dlm_acc": "5.734e-01", "anc_acc": "5.583e-01", "epoch": 0.05957} {"step": 29790, "loss": 0.9579, "grad_norm": "4.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.322e+00", "dlm_acc": "5.725e-01", "anc_acc": "5.363e-01", "epoch": 0.05958} {"step": 29795, "loss": 0.9114, "grad_norm": "2.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.875e-01", "anc_loss": "1.092e+00", "dlm_acc": "5.960e-01", "anc_acc": "5.613e-01", "epoch": 0.05959} {"step": 29800, "loss": 1.3704, "grad_norm": "2.925e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.211e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.854e-01", "anc_acc": "5.493e-01", "epoch": 0.0596} {"step": 29805, "loss": 0.7543, "grad_norm": "2.059e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.850e-01", "anc_loss": "5.430e-01", "dlm_acc": "7.549e-01", "anc_acc": "7.309e-01", "epoch": 0.05961} {"step": 29810, "loss": 1.0787, "grad_norm": "2.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.988e-01", "anc_loss": "5.375e-01", "dlm_acc": "6.602e-01", "anc_acc": "6.367e-01", "epoch": 0.05962} {"step": 29815, "loss": 1.1462, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.266e-01", "anc_loss": "4.605e-01", "dlm_acc": "7.103e-01", "anc_acc": "6.892e-01", "epoch": 0.05963} {"step": 29820, "loss": 1.1927, "grad_norm": "3.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.789e-01", "anc_loss": "4.129e-01", "dlm_acc": "7.752e-01", "anc_acc": "7.561e-01", "epoch": 0.05964} {"step": 29825, "loss": 0.9499, "grad_norm": "1.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.419e-01", "anc_loss": "3.664e-01", "dlm_acc": "7.628e-01", "anc_acc": "7.485e-01", "epoch": 0.05965} {"step": 29830, "loss": 1.2217, "grad_norm": "2.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.034e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.103e-01", "anc_acc": "5.766e-01", "epoch": 0.05966} {"step": 29835, "loss": 1.1938, "grad_norm": "2.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.455e-01", "anc_loss": "1.029e+00", "dlm_acc": "6.417e-01", "anc_acc": "6.113e-01", "epoch": 0.05967} {"step": 29840, "loss": 1.4991, "grad_norm": "4.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.727e-01", "anc_loss": "9.523e-01", "dlm_acc": "6.532e-01", "anc_acc": "6.336e-01", "epoch": 0.05968} {"step": 29845, "loss": 1.2422, "grad_norm": "2.088e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.236e+00", "dlm_acc": "5.675e-01", "anc_acc": "5.325e-01", "epoch": 0.05969} {"step": 29850, "loss": 1.0462, "grad_norm": "1.931e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.150e-01", "anc_loss": "9.148e-01", "dlm_acc": "6.498e-01", "anc_acc": "6.093e-01", "epoch": 0.0597} {"step": 29855, "loss": 1.0876, "grad_norm": "3.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.697e-01", "anc_loss": "9.301e-01", "dlm_acc": "5.729e-01", "anc_acc": "5.533e-01", "epoch": 0.05971} {"step": 29860, "loss": 1.5583, "grad_norm": "3.330e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.847e+00", "anc_loss": "1.925e+00", "dlm_acc": "3.337e-01", "anc_acc": "3.178e-01", "epoch": 0.05972} {"step": 29865, "loss": 1.8731, "grad_norm": "3.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.614e+00", "dlm_acc": "4.780e-01", "anc_acc": "4.489e-01", "epoch": 0.05973} {"step": 29870, "loss": 1.2643, "grad_norm": "3.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.257e+00", "dlm_acc": "6.148e-01", "anc_acc": "5.885e-01", "epoch": 0.05974} {"step": 29875, "loss": 1.4553, "grad_norm": "6.461e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.465e-01", "anc_acc": "5.140e-01", "epoch": 0.05975} {"step": 29880, "loss": 1.3649, "grad_norm": "4.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.578e+00", "dlm_acc": "4.919e-01", "anc_acc": "4.695e-01", "epoch": 0.05976} {"step": 29885, "loss": 1.0596, "grad_norm": "2.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.576e-01", "anc_acc": "5.353e-01", "epoch": 0.05977} {"step": 29890, "loss": 1.1527, "grad_norm": "3.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.414e+00", "dlm_acc": "5.555e-01", "anc_acc": "5.218e-01", "epoch": 0.05978} {"step": 29895, "loss": 1.385, "grad_norm": "3.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.359e+00", "dlm_acc": "5.227e-01", "anc_acc": "4.999e-01", "epoch": 0.05979} {"step": 29900, "loss": 1.3605, "grad_norm": "2.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.859e-01", "anc_loss": "6.367e-01", "dlm_acc": "6.333e-01", "anc_acc": "6.068e-01", "epoch": 0.0598} {"step": 29905, "loss": 1.5843, "grad_norm": "8.540e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.548e+00", "dlm_acc": "5.116e-01", "anc_acc": "4.781e-01", "epoch": 0.05981} {"step": 29910, "loss": 1.4398, "grad_norm": "2.928e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.421e+00", "anc_loss": "1.519e+00", "dlm_acc": "4.792e-01", "anc_acc": "4.582e-01", "epoch": 0.05982} {"step": 29915, "loss": 1.2853, "grad_norm": "2.070e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.936e+00", "anc_loss": "2.042e+00", "dlm_acc": "2.650e-01", "anc_acc": "2.423e-01", "epoch": 0.05983} {"step": 29920, "loss": 1.8721, "grad_norm": "6.617e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.234e+00", "anc_loss": "2.322e+00", "dlm_acc": "2.388e-01", "anc_acc": "2.228e-01", "epoch": 0.05984} {"step": 29925, "loss": 1.2842, "grad_norm": "3.328e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.452e+00", "dlm_acc": "4.978e-01", "anc_acc": "4.707e-01", "epoch": 0.05985} {"step": 29930, "loss": 1.6879, "grad_norm": "3.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.301e+00", "anc_loss": "1.407e+00", "dlm_acc": "5.487e-01", "anc_acc": "5.211e-01", "epoch": 0.05986} {"step": 29935, "loss": 1.0567, "grad_norm": "3.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.261e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.361e-01", "epoch": 0.05987} {"step": 29940, "loss": 1.3321, "grad_norm": "4.557e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.336e-01", "anc_acc": "5.059e-01", "epoch": 0.05988} {"step": 29945, "loss": 1.3036, "grad_norm": "2.952e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.178e+00", "dlm_acc": "5.926e-01", "anc_acc": "5.495e-01", "epoch": 0.05989} {"step": 29950, "loss": 1.2995, "grad_norm": "3.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.393e+00", "dlm_acc": "5.426e-01", "anc_acc": "5.127e-01", "epoch": 0.0599} {"step": 29955, "loss": 1.9739, "grad_norm": "3.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.819e+00", "dlm_acc": "4.957e-01", "anc_acc": "4.711e-01", "epoch": 0.05991} {"step": 29960, "loss": 1.3282, "grad_norm": "5.538e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.598e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.198e-01", "epoch": 0.05992} {"step": 29965, "loss": 1.6848, "grad_norm": "5.573e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.607e+00", "anc_loss": "1.727e+00", "dlm_acc": "5.236e-01", "anc_acc": "4.997e-01", "epoch": 0.05993} {"step": 29970, "loss": 1.1589, "grad_norm": "1.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.719e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.306e-01", "anc_acc": "6.080e-01", "epoch": 0.05994} {"step": 29975, "loss": 1.3591, "grad_norm": "5.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.408e+00", "dlm_acc": "4.517e-01", "anc_acc": "4.348e-01", "epoch": 0.05995} {"step": 29980, "loss": 1.6437, "grad_norm": "3.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.480e+00", "anc_loss": "1.541e+00", "dlm_acc": "4.034e-01", "anc_acc": "3.928e-01", "epoch": 0.05996} {"step": 29985, "loss": 1.5169, "grad_norm": "3.899e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e+00", "anc_loss": "1.773e+00", "dlm_acc": "4.716e-01", "anc_acc": "4.484e-01", "epoch": 0.05997} {"step": 29990, "loss": 1.4801, "grad_norm": "4.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.379e+00", "dlm_acc": "5.647e-01", "anc_acc": "5.433e-01", "epoch": 0.05998} {"step": 29995, "loss": 1.1806, "grad_norm": "4.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.300e-01", "anc_acc": "5.072e-01", "epoch": 0.05999} {"step": 30000, "loss": 1.4586, "grad_norm": "3.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.612e+00", "anc_loss": "1.724e+00", "dlm_acc": "5.230e-01", "anc_acc": "4.981e-01", "epoch": 0.06} {"step": 30005, "loss": 1.4879, "grad_norm": "6.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.508e+00", "dlm_acc": "5.346e-01", "anc_acc": "5.096e-01", "epoch": 0.06001} {"step": 30010, "loss": 1.9941, "grad_norm": "3.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.618e+00", "dlm_acc": "5.502e-01", "anc_acc": "5.262e-01", "epoch": 0.06002} {"step": 30015, "loss": 2.1601, "grad_norm": "4.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.268e+00", "anc_loss": "1.371e+00", "dlm_acc": "6.027e-01", "anc_acc": "5.789e-01", "epoch": 0.06003} {"step": 30020, "loss": 1.3626, "grad_norm": "5.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.055e-01", "anc_loss": "4.365e-01", "dlm_acc": "7.994e-01", "anc_acc": "7.914e-01", "epoch": 0.06004} {"step": 30025, "loss": 1.123, "grad_norm": "3.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.767e-01", "anc_acc": "5.507e-01", "epoch": 0.06005} {"step": 30030, "loss": 0.8524, "grad_norm": "2.182e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.221e-01", "anc_loss": "7.916e-01", "dlm_acc": "6.975e-01", "anc_acc": "6.755e-01", "epoch": 0.06006} {"step": 30035, "loss": 1.3817, "grad_norm": "3.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.766e-01", "anc_loss": "9.484e-01", "dlm_acc": "6.614e-01", "anc_acc": "6.409e-01", "epoch": 0.06007} {"step": 30040, "loss": 1.3873, "grad_norm": "2.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.367e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.071e-01", "anc_acc": "4.841e-01", "epoch": 0.06008} {"step": 30045, "loss": 1.2025, "grad_norm": "4.048e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.107e+00", "dlm_acc": "5.751e-01", "anc_acc": "5.627e-01", "epoch": 0.06009} {"step": 30050, "loss": 1.12, "grad_norm": "3.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.629e-01", "anc_loss": "9.719e-01", "dlm_acc": "6.683e-01", "anc_acc": "6.350e-01", "epoch": 0.0601} {"step": 30055, "loss": 1.3806, "grad_norm": "2.348e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.247e+00", "dlm_acc": "6.598e-01", "anc_acc": "6.326e-01", "epoch": 0.06011} {"step": 30060, "loss": 1.0372, "grad_norm": "4.580e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.533e-01", "anc_loss": "9.805e-01", "dlm_acc": "7.205e-01", "anc_acc": "6.854e-01", "epoch": 0.06012} {"step": 30065, "loss": 1.772, "grad_norm": "2.688e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e+00", "anc_loss": "1.748e+00", "dlm_acc": "4.662e-01", "anc_acc": "4.438e-01", "epoch": 0.06013} {"step": 30070, "loss": 1.3727, "grad_norm": "2.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.725e-01", "anc_acc": "5.466e-01", "epoch": 0.06014} {"step": 30075, "loss": 0.9961, "grad_norm": "2.313e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.148e+00", "dlm_acc": "5.873e-01", "anc_acc": "5.597e-01", "epoch": 0.06015} {"step": 30080, "loss": 1.3674, "grad_norm": "5.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.461e-01", "anc_acc": "5.174e-01", "epoch": 0.06016} {"step": 30085, "loss": 1.182, "grad_norm": "4.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.351e+00", "dlm_acc": "5.410e-01", "anc_acc": "5.158e-01", "epoch": 0.06017} {"step": 30090, "loss": 1.1682, "grad_norm": "2.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.204e-01", "anc_acc": "4.954e-01", "epoch": 0.06018} {"step": 30095, "loss": 1.1958, "grad_norm": "3.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.481e+00", "anc_loss": "1.584e+00", "dlm_acc": "5.271e-01", "anc_acc": "5.050e-01", "epoch": 0.06019} {"step": 30100, "loss": 0.7886, "grad_norm": "1.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.860e-01", "anc_loss": "5.383e-01", "dlm_acc": "8.392e-01", "anc_acc": "8.243e-01", "epoch": 0.0602} {"step": 30105, "loss": 0.9167, "grad_norm": "1.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.086e-01", "anc_loss": "8.852e-01", "dlm_acc": "7.151e-01", "anc_acc": "6.948e-01", "epoch": 0.06021} {"step": 30110, "loss": 1.2655, "grad_norm": "1.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.207e+00", "anc_loss": "1.301e+00", "dlm_acc": "5.729e-01", "anc_acc": "5.481e-01", "epoch": 0.06022} {"step": 30115, "loss": 1.4214, "grad_norm": "8.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e+00", "anc_loss": "1.493e+00", "dlm_acc": "5.435e-01", "anc_acc": "5.186e-01", "epoch": 0.06023} {"step": 30120, "loss": 1.1336, "grad_norm": "2.300e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.141e+00", "dlm_acc": "6.016e-01", "anc_acc": "5.761e-01", "epoch": 0.06024} {"step": 30125, "loss": 1.422, "grad_norm": "2.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.411e+00", "dlm_acc": "5.070e-01", "anc_acc": "4.813e-01", "epoch": 0.06025} {"step": 30130, "loss": 1.1029, "grad_norm": "2.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.181e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.507e-01", "anc_acc": "5.241e-01", "epoch": 0.06026} {"step": 30135, "loss": 1.1967, "grad_norm": "3.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.555e-01", "anc_loss": "1.040e+00", "dlm_acc": "6.898e-01", "anc_acc": "6.721e-01", "epoch": 0.06027} {"step": 30140, "loss": 1.0622, "grad_norm": "1.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.668e-01", "anc_loss": "9.570e-01", "dlm_acc": "6.851e-01", "anc_acc": "6.609e-01", "epoch": 0.06028} {"step": 30145, "loss": 0.8857, "grad_norm": "4.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.828e-01", "anc_loss": "8.584e-01", "dlm_acc": "6.993e-01", "anc_acc": "6.755e-01", "epoch": 0.06029} {"step": 30150, "loss": 1.2862, "grad_norm": "5.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.617e-01", "anc_loss": "9.125e-01", "dlm_acc": "5.980e-01", "anc_acc": "5.835e-01", "epoch": 0.0603} {"step": 30155, "loss": 0.7964, "grad_norm": "3.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.578e-01", "anc_loss": "3.727e-01", "dlm_acc": "7.629e-01", "anc_acc": "7.602e-01", "epoch": 0.06031} {"step": 30160, "loss": 0.947, "grad_norm": "2.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.848e-01", "anc_loss": "4.047e-01", "dlm_acc": "7.501e-01", "anc_acc": "7.451e-01", "epoch": 0.06032} {"step": 30165, "loss": 1.1521, "grad_norm": "2.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.065e-01", "anc_loss": "9.146e-01", "dlm_acc": "7.104e-01", "anc_acc": "6.797e-01", "epoch": 0.06033} {"step": 30170, "loss": 1.0435, "grad_norm": "2.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.129e-01", "anc_loss": "6.285e-01", "dlm_acc": "6.295e-01", "anc_acc": "6.283e-01", "epoch": 0.06034} {"step": 30175, "loss": 1.1391, "grad_norm": "4.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.949e-01", "anc_loss": "1.068e+00", "dlm_acc": "6.066e-01", "anc_acc": "5.911e-01", "epoch": 0.06035} {"step": 30180, "loss": 0.9644, "grad_norm": "5.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.721e-01", "anc_loss": "6.313e-01", "dlm_acc": "7.950e-01", "anc_acc": "7.742e-01", "epoch": 0.06036} {"step": 30185, "loss": 1.0387, "grad_norm": "3.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.117e-01", "anc_loss": "6.554e-01", "dlm_acc": "7.260e-01", "anc_acc": "7.107e-01", "epoch": 0.06037} {"step": 30190, "loss": 0.7589, "grad_norm": "2.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.645e-01", "anc_loss": "2.986e-01", "dlm_acc": "8.518e-01", "anc_acc": "8.380e-01", "epoch": 0.06038} {"step": 30195, "loss": 1.2252, "grad_norm": "7.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.373e+00", "dlm_acc": "6.358e-01", "anc_acc": "6.142e-01", "epoch": 0.06039} {"step": 30200, "loss": 1.4784, "grad_norm": "3.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.561e+00", "dlm_acc": "5.303e-01", "anc_acc": "5.061e-01", "epoch": 0.0604} {"step": 30205, "loss": 0.9403, "grad_norm": "4.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.468e-01", "anc_acc": "5.271e-01", "epoch": 0.06041} {"step": 30210, "loss": 1.0278, "grad_norm": "4.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.047e-01", "anc_loss": "9.727e-01", "dlm_acc": "6.312e-01", "anc_acc": "6.135e-01", "epoch": 0.06042} {"step": 30215, "loss": 1.8667, "grad_norm": "5.237e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.553e-01", "anc_acc": "5.359e-01", "epoch": 0.06043} {"step": 30220, "loss": 1.3515, "grad_norm": "1.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.625e-01", "anc_loss": "5.062e-01", "dlm_acc": "7.772e-01", "anc_acc": "7.610e-01", "epoch": 0.06044} {"step": 30225, "loss": 0.7976, "grad_norm": "2.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.448e-01", "anc_loss": "6.081e-01", "dlm_acc": "7.574e-01", "anc_acc": "7.399e-01", "epoch": 0.06045} {"step": 30230, "loss": 0.8503, "grad_norm": "3.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.483e-01", "anc_loss": "3.041e-01", "dlm_acc": "8.588e-01", "anc_acc": "8.324e-01", "epoch": 0.06046} {"step": 30235, "loss": 0.9533, "grad_norm": "2.846e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.940e-01", "anc_loss": "5.463e-01", "dlm_acc": "7.793e-01", "anc_acc": "7.602e-01", "epoch": 0.06047} {"step": 30240, "loss": 1.0278, "grad_norm": "2.648e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.474e-01", "anc_loss": "7.036e-01", "dlm_acc": "7.794e-01", "anc_acc": "7.661e-01", "epoch": 0.06048} {"step": 30245, "loss": 0.8117, "grad_norm": "4.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.676e-01", "anc_loss": "6.086e-01", "dlm_acc": "6.540e-01", "anc_acc": "6.454e-01", "epoch": 0.06049} {"step": 30250, "loss": 1.2566, "grad_norm": "1.079e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.936e-01", "anc_loss": "9.637e-01", "dlm_acc": "6.605e-01", "anc_acc": "6.422e-01", "epoch": 0.0605} {"step": 30255, "loss": 1.292, "grad_norm": "4.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.930e-01", "anc_loss": "5.283e-01", "dlm_acc": "7.890e-01", "anc_acc": "7.790e-01", "epoch": 0.06051} {"step": 30260, "loss": 1.3166, "grad_norm": "5.174e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.199e-01", "anc_loss": "9.141e-01", "dlm_acc": "6.782e-01", "anc_acc": "6.551e-01", "epoch": 0.06052} {"step": 30265, "loss": 1.1491, "grad_norm": "4.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.936e-01", "anc_loss": "6.301e-01", "dlm_acc": "7.548e-01", "anc_acc": "7.462e-01", "epoch": 0.06053} {"step": 30270, "loss": 1.2182, "grad_norm": "1.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.191e-01", "anc_loss": "6.805e-01", "dlm_acc": "7.002e-01", "anc_acc": "6.825e-01", "epoch": 0.06054} {"step": 30275, "loss": 0.9268, "grad_norm": "3.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.863e-01", "anc_loss": "5.441e-01", "dlm_acc": "7.502e-01", "anc_acc": "7.326e-01", "epoch": 0.06055} {"step": 30280, "loss": 1.1197, "grad_norm": "1.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.825e-01", "anc_loss": "3.274e-01", "dlm_acc": "8.550e-01", "anc_acc": "8.399e-01", "epoch": 0.06056} {"step": 30285, "loss": 0.9376, "grad_norm": "3.725e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.902e-01", "anc_loss": "3.498e-01", "dlm_acc": "8.324e-01", "anc_acc": "8.119e-01", "epoch": 0.06057} {"step": 30290, "loss": 1.533, "grad_norm": "6.939e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.186e+00", "dlm_acc": "6.169e-01", "anc_acc": "6.016e-01", "epoch": 0.06058} {"step": 30295, "loss": 1.4631, "grad_norm": "4.883e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.618e+00", "anc_loss": "1.713e+00", "dlm_acc": "5.563e-01", "anc_acc": "5.321e-01", "epoch": 0.06059} {"step": 30300, "loss": 1.1909, "grad_norm": "1.155e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.064e-01", "anc_loss": "6.530e-01", "dlm_acc": "7.153e-01", "anc_acc": "6.948e-01", "epoch": 0.0606} {"step": 30305, "loss": 1.2224, "grad_norm": "1.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.524e-01", "anc_loss": "3.733e-01", "dlm_acc": "7.713e-01", "anc_acc": "7.649e-01", "epoch": 0.06061} {"step": 30310, "loss": 1.0943, "grad_norm": "8.131e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.526e-01", "anc_loss": "1.611e-01", "dlm_acc": "8.949e-01", "anc_acc": "8.920e-01", "epoch": 0.06062} {"step": 30315, "loss": 1.0502, "grad_norm": "3.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.550e-01", "anc_loss": "2.732e-01", "dlm_acc": "8.392e-01", "anc_acc": "8.336e-01", "epoch": 0.06063} {"step": 30320, "loss": 0.9853, "grad_norm": "5.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.738e-01", "anc_loss": "2.916e-01", "dlm_acc": "8.327e-01", "anc_acc": "8.235e-01", "epoch": 0.06064} {"step": 30325, "loss": 0.6768, "grad_norm": "3.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.371e-01", "anc_loss": "3.502e-01", "dlm_acc": "7.611e-01", "anc_acc": "7.542e-01", "epoch": 0.06065} {"step": 30330, "loss": 0.9797, "grad_norm": "3.161e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.965e-01", "anc_loss": "6.270e-01", "dlm_acc": "6.523e-01", "anc_acc": "6.455e-01", "epoch": 0.06066} {"step": 30335, "loss": 1.4246, "grad_norm": "8.984e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.229e-01", "anc_loss": "6.865e-01", "dlm_acc": "7.516e-01", "anc_acc": "7.309e-01", "epoch": 0.06067} {"step": 30340, "loss": 1.4083, "grad_norm": "3.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.132e+00", "dlm_acc": "5.657e-01", "anc_acc": "5.497e-01", "epoch": 0.06068} {"step": 30345, "loss": 1.2469, "grad_norm": "3.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.947e-01", "anc_loss": "8.932e-01", "dlm_acc": "6.605e-01", "anc_acc": "6.389e-01", "epoch": 0.06069} {"step": 30350, "loss": 0.9556, "grad_norm": "1.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.872e-01", "anc_loss": "6.346e-01", "dlm_acc": "7.405e-01", "anc_acc": "7.225e-01", "epoch": 0.0607} {"step": 30355, "loss": 1.1421, "grad_norm": "4.719e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.853e-01", "anc_acc": "5.606e-01", "epoch": 0.06071} {"step": 30360, "loss": 1.0332, "grad_norm": "1.544e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.508e-01", "anc_loss": "9.625e-01", "dlm_acc": "6.756e-01", "anc_acc": "6.486e-01", "epoch": 0.06072} {"step": 30365, "loss": 1.2373, "grad_norm": "2.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.317e+00", "dlm_acc": "5.540e-01", "anc_acc": "5.329e-01", "epoch": 0.06073} {"step": 30370, "loss": 1.3177, "grad_norm": "2.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.793e-01", "anc_loss": "6.346e-01", "dlm_acc": "7.625e-01", "anc_acc": "7.447e-01", "epoch": 0.06074} {"step": 30375, "loss": 0.9685, "grad_norm": "1.065e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.072e-01", "anc_loss": "6.617e-01", "dlm_acc": "7.121e-01", "anc_acc": "6.974e-01", "epoch": 0.06075} {"step": 30380, "loss": 1.427, "grad_norm": "6.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.058e-01", "anc_loss": "5.388e-01", "dlm_acc": "8.209e-01", "anc_acc": "8.092e-01", "epoch": 0.06076} {"step": 30385, "loss": 1.1784, "grad_norm": "3.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.422e-01", "anc_loss": "9.141e-01", "dlm_acc": "6.983e-01", "anc_acc": "6.824e-01", "epoch": 0.06077} {"step": 30390, "loss": 1.3105, "grad_norm": "4.166e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.414e-01", "anc_loss": "7.945e-01", "dlm_acc": "7.343e-01", "anc_acc": "7.238e-01", "epoch": 0.06078} {"step": 30395, "loss": 1.6884, "grad_norm": "5.770e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.411e+00", "dlm_acc": "5.783e-01", "anc_acc": "5.550e-01", "epoch": 0.06079} {"step": 30400, "loss": 1.1166, "grad_norm": "3.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.125e-01", "anc_loss": "9.039e-01", "dlm_acc": "6.608e-01", "anc_acc": "6.364e-01", "epoch": 0.0608} {"step": 30405, "loss": 1.5403, "grad_norm": "3.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.219e+00", "dlm_acc": "5.569e-01", "anc_acc": "5.270e-01", "epoch": 0.06081} {"step": 30410, "loss": 1.2319, "grad_norm": "2.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.266e-01", "anc_loss": "1.044e+00", "dlm_acc": "6.111e-01", "anc_acc": "5.726e-01", "epoch": 0.06082} {"step": 30415, "loss": 1.2733, "grad_norm": "3.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.725e-01", "anc_acc": "5.470e-01", "epoch": 0.06083} {"step": 30420, "loss": 0.9049, "grad_norm": "3.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.393e-01", "anc_loss": "8.754e-01", "dlm_acc": "7.519e-01", "anc_acc": "7.453e-01", "epoch": 0.06084} {"step": 30425, "loss": 0.7589, "grad_norm": "2.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.516e-02", "anc_loss": "2.334e-02", "dlm_acc": "9.880e-01", "anc_acc": "9.878e-01", "epoch": 0.06085} {"step": 30430, "loss": 0.7785, "grad_norm": "2.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.060e-02", "anc_loss": "1.140e-02", "dlm_acc": "9.936e-01", "anc_acc": "9.934e-01", "epoch": 0.06086} {"step": 30435, "loss": 0.8187, "grad_norm": "2.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.626e-02", "anc_loss": "5.637e-02", "dlm_acc": "9.765e-01", "anc_acc": "9.763e-01", "epoch": 0.06087} {"step": 30440, "loss": 0.9929, "grad_norm": "7.405e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.730e-02", "anc_loss": "1.923e-02", "dlm_acc": "9.925e-01", "anc_acc": "9.918e-01", "epoch": 0.06088} {"step": 30445, "loss": 0.8865, "grad_norm": "4.588e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e-02", "anc_loss": "1.125e-02", "dlm_acc": "9.931e-01", "anc_acc": "9.923e-01", "epoch": 0.06089} {"step": 30450, "loss": 0.9083, "grad_norm": "3.639e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.816e-01", "anc_loss": "3.061e-01", "dlm_acc": "8.924e-01", "anc_acc": "8.862e-01", "epoch": 0.0609} {"step": 30455, "loss": 1.0076, "grad_norm": "3.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.429e-01", "epoch": 0.06091} {"step": 30460, "loss": 1.4109, "grad_norm": "1.921e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.266e-01", "anc_acc": "5.043e-01", "epoch": 0.06092} {"step": 30465, "loss": 1.4223, "grad_norm": "8.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.438e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.164e-01", "anc_acc": "4.935e-01", "epoch": 0.06093} {"step": 30470, "loss": 1.3682, "grad_norm": "2.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.660e-01", "anc_acc": "5.398e-01", "epoch": 0.06094} {"step": 30475, "loss": 1.3402, "grad_norm": "2.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.681e+00", "anc_loss": "1.809e+00", "dlm_acc": "4.260e-01", "anc_acc": "3.891e-01", "epoch": 0.06095} {"step": 30480, "loss": 1.1694, "grad_norm": "3.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.488e-01", "anc_loss": "8.516e-01", "dlm_acc": "6.750e-01", "anc_acc": "6.435e-01", "epoch": 0.06096} {"step": 30485, "loss": 1.3232, "grad_norm": "8.481e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.493e+00", "dlm_acc": "5.257e-01", "anc_acc": "4.998e-01", "epoch": 0.06097} {"step": 30490, "loss": 1.8397, "grad_norm": "3.643e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.457e+00", "anc_loss": "1.568e+00", "dlm_acc": "5.422e-01", "anc_acc": "5.189e-01", "epoch": 0.06098} {"step": 30495, "loss": 1.4563, "grad_norm": "2.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.356e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.385e-01", "anc_acc": "5.149e-01", "epoch": 0.06099} {"step": 30500, "loss": 1.2546, "grad_norm": "3.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.226e-01", "anc_acc": "4.992e-01", "epoch": 0.061} {"step": 30505, "loss": 1.4099, "grad_norm": "2.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.556e-01", "anc_acc": "5.265e-01", "epoch": 0.06101} {"step": 30510, "loss": 1.7067, "grad_norm": "2.845e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.884e+00", "anc_loss": "1.975e+00", "dlm_acc": "3.698e-01", "anc_acc": "3.531e-01", "epoch": 0.06102} {"step": 30515, "loss": 1.1195, "grad_norm": "3.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.004e-01", "anc_loss": "8.602e-01", "dlm_acc": "6.272e-01", "anc_acc": "6.120e-01", "epoch": 0.06103} {"step": 30520, "loss": 1.4331, "grad_norm": "4.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.516e+00", "anc_loss": "1.620e+00", "dlm_acc": "5.174e-01", "anc_acc": "4.949e-01", "epoch": 0.06104} {"step": 30525, "loss": 1.5939, "grad_norm": "2.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.668e+00", "dlm_acc": "5.250e-01", "anc_acc": "4.978e-01", "epoch": 0.06105} {"step": 30530, "loss": 1.9439, "grad_norm": "3.765e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.059e+00", "anc_loss": "2.169e+00", "dlm_acc": "4.197e-01", "anc_acc": "3.981e-01", "epoch": 0.06106} {"step": 30535, "loss": 1.9312, "grad_norm": "4.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.766e+00", "anc_loss": "1.881e+00", "dlm_acc": "5.026e-01", "anc_acc": "4.784e-01", "epoch": 0.06107} {"step": 30540, "loss": 1.4345, "grad_norm": "3.964e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.211e+00", "dlm_acc": "6.250e-01", "anc_acc": "6.025e-01", "epoch": 0.06108} {"step": 30545, "loss": 1.3605, "grad_norm": "3.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.569e+00", "dlm_acc": "5.292e-01", "anc_acc": "5.051e-01", "epoch": 0.06109} {"step": 30550, "loss": 1.2891, "grad_norm": "2.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.520e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.289e-01", "anc_acc": "5.048e-01", "epoch": 0.0611} {"step": 30555, "loss": 1.2365, "grad_norm": "2.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.225e-01", "anc_acc": "4.979e-01", "epoch": 0.06111} {"step": 30560, "loss": 1.2112, "grad_norm": "7.485e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.500e+00", "dlm_acc": "5.394e-01", "anc_acc": "5.122e-01", "epoch": 0.06112} {"step": 30565, "loss": 1.1506, "grad_norm": "3.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.046e+00", "anc_loss": "1.149e+00", "dlm_acc": "5.807e-01", "anc_acc": "5.537e-01", "epoch": 0.06113} {"step": 30570, "loss": 1.2923, "grad_norm": "3.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.388e+00", "anc_loss": "1.496e+00", "dlm_acc": "5.314e-01", "anc_acc": "5.057e-01", "epoch": 0.06114} {"step": 30575, "loss": 1.3223, "grad_norm": "3.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.608e+00", "dlm_acc": "4.974e-01", "anc_acc": "4.756e-01", "epoch": 0.06115} {"step": 30580, "loss": 1.0284, "grad_norm": "6.855e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.328e-01", "anc_acc": "5.099e-01", "epoch": 0.06116} {"step": 30585, "loss": 1.0437, "grad_norm": "2.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.558e+00", "dlm_acc": "5.070e-01", "anc_acc": "4.787e-01", "epoch": 0.06117} {"step": 30590, "loss": 1.1563, "grad_norm": "2.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.720e+00", "anc_loss": "1.825e+00", "dlm_acc": "4.587e-01", "anc_acc": "4.387e-01", "epoch": 0.06118} {"step": 30595, "loss": 0.9504, "grad_norm": "2.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.494e-01", "anc_acc": "5.298e-01", "epoch": 0.06119} {"step": 30600, "loss": 1.0103, "grad_norm": "2.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.545e+00", "anc_loss": "1.648e+00", "dlm_acc": "4.786e-01", "anc_acc": "4.532e-01", "epoch": 0.0612} {"step": 30605, "loss": 1.3167, "grad_norm": "7.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.242e+00", "dlm_acc": "6.116e-01", "anc_acc": "5.871e-01", "epoch": 0.06121} {"step": 30610, "loss": 1.1482, "grad_norm": "2.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.339e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.436e-01", "anc_acc": "5.187e-01", "epoch": 0.06122} {"step": 30615, "loss": 1.3191, "grad_norm": "3.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.483e+00", "anc_loss": "1.598e+00", "dlm_acc": "5.198e-01", "anc_acc": "4.931e-01", "epoch": 0.06123} {"step": 30620, "loss": 1.408, "grad_norm": "3.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.486e+00", "anc_loss": "1.619e+00", "dlm_acc": "4.968e-01", "anc_acc": "4.701e-01", "epoch": 0.06124} {"step": 30625, "loss": 0.9556, "grad_norm": "3.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.251e+00", "dlm_acc": "5.736e-01", "anc_acc": "5.533e-01", "epoch": 0.06125} {"step": 30630, "loss": 0.791, "grad_norm": "2.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.602e-01", "anc_loss": "1.050e+00", "dlm_acc": "6.118e-01", "anc_acc": "5.865e-01", "epoch": 0.06126} {"step": 30635, "loss": 0.6853, "grad_norm": "1.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.078e-01", "anc_loss": "9.043e-01", "dlm_acc": "6.750e-01", "anc_acc": "6.477e-01", "epoch": 0.06127} {"step": 30640, "loss": 1.2463, "grad_norm": "2.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.588e+00", "anc_loss": "1.703e+00", "dlm_acc": "4.920e-01", "anc_acc": "4.679e-01", "epoch": 0.06128} {"step": 30645, "loss": 1.2235, "grad_norm": "3.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.608e+00", "dlm_acc": "4.992e-01", "anc_acc": "4.771e-01", "epoch": 0.06129} {"step": 30650, "loss": 1.1334, "grad_norm": "3.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.866e-01", "anc_loss": "1.096e+00", "dlm_acc": "6.648e-01", "anc_acc": "6.372e-01", "epoch": 0.0613} {"step": 30655, "loss": 1.2484, "grad_norm": "3.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.239e+00", "dlm_acc": "5.503e-01", "anc_acc": "5.206e-01", "epoch": 0.06131} {"step": 30660, "loss": 1.4388, "grad_norm": "3.193e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.206e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.759e-01", "anc_acc": "5.541e-01", "epoch": 0.06132} {"step": 30665, "loss": 1.3379, "grad_norm": "4.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.104e+00", "anc_loss": "1.200e+00", "dlm_acc": "6.150e-01", "anc_acc": "5.897e-01", "epoch": 0.06133} {"step": 30670, "loss": 0.8423, "grad_norm": "3.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.046e+00", "anc_loss": "1.148e+00", "dlm_acc": "6.006e-01", "anc_acc": "5.740e-01", "epoch": 0.06134} {"step": 30675, "loss": 1.0823, "grad_norm": "3.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.333e-01", "anc_loss": "5.918e-01", "dlm_acc": "8.237e-01", "anc_acc": "7.758e-01", "epoch": 0.06135} {"step": 30680, "loss": 1.2052, "grad_norm": "4.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.367e-01", "anc_loss": "1.043e+00", "dlm_acc": "6.624e-01", "anc_acc": "6.312e-01", "epoch": 0.06136} {"step": 30685, "loss": 1.1974, "grad_norm": "2.964e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.670e+00", "dlm_acc": "5.187e-01", "anc_acc": "4.904e-01", "epoch": 0.06137} {"step": 30690, "loss": 1.1502, "grad_norm": "2.875e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.031e-02", "anc_loss": "4.663e-02", "dlm_acc": "9.732e-01", "anc_acc": "9.698e-01", "epoch": 0.06138} {"step": 30695, "loss": 1.2475, "grad_norm": "2.440e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.160e-02", "anc_loss": "1.112e-01", "dlm_acc": "9.429e-01", "anc_acc": "9.337e-01", "epoch": 0.06139} {"step": 30700, "loss": 1.1531, "grad_norm": "3.725e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e-01", "anc_loss": "1.552e-01", "dlm_acc": "9.100e-01", "anc_acc": "9.030e-01", "epoch": 0.0614} {"step": 30705, "loss": 1.011, "grad_norm": "4.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e-01", "anc_loss": "1.596e-01", "dlm_acc": "9.138e-01", "anc_acc": "9.020e-01", "epoch": 0.06141} {"step": 30710, "loss": 0.8571, "grad_norm": "2.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.977e-01", "anc_loss": "5.533e-01", "dlm_acc": "7.739e-01", "anc_acc": "7.556e-01", "epoch": 0.06142} {"step": 30715, "loss": 1.3914, "grad_norm": "4.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.399e+00", "dlm_acc": "5.075e-01", "anc_acc": "4.916e-01", "epoch": 0.06143} {"step": 30720, "loss": 0.9494, "grad_norm": "5.167e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.531e-01", "anc_loss": "1.013e+00", "dlm_acc": "5.580e-01", "anc_acc": "5.423e-01", "epoch": 0.06144} {"step": 30725, "loss": 0.856, "grad_norm": "1.444e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.961e-01", "anc_loss": "7.031e-01", "dlm_acc": "5.763e-01", "anc_acc": "5.703e-01", "epoch": 0.06145} {"step": 30730, "loss": 0.6642, "grad_norm": "4.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.383e-01", "anc_loss": "6.921e-01", "dlm_acc": "6.987e-01", "anc_acc": "6.799e-01", "epoch": 0.06146} {"step": 30735, "loss": 0.8529, "grad_norm": "5.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.653e-01", "anc_loss": "4.531e-01", "dlm_acc": "7.508e-01", "anc_acc": "6.904e-01", "epoch": 0.06147} {"step": 30740, "loss": 1.0216, "grad_norm": "2.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.059e-01", "anc_loss": "6.980e-01", "dlm_acc": "7.065e-01", "anc_acc": "6.763e-01", "epoch": 0.06148} {"step": 30745, "loss": 0.7536, "grad_norm": "2.401e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.523e-01", "anc_loss": "1.033e+00", "dlm_acc": "6.103e-01", "anc_acc": "5.869e-01", "epoch": 0.06149} {"step": 30750, "loss": 0.8199, "grad_norm": "3.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.559e-01", "anc_loss": "8.488e-01", "dlm_acc": "6.806e-01", "anc_acc": "6.547e-01", "epoch": 0.0615} {"step": 30755, "loss": 1.4253, "grad_norm": "3.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.492e-01", "anc_loss": "6.004e-01", "dlm_acc": "6.692e-01", "anc_acc": "6.489e-01", "epoch": 0.06151} {"step": 30760, "loss": 1.2099, "grad_norm": "3.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.578e-01", "anc_loss": "8.227e-01", "dlm_acc": "6.411e-01", "anc_acc": "6.170e-01", "epoch": 0.06152} {"step": 30765, "loss": 1.6192, "grad_norm": "4.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.738e-01", "anc_loss": "9.434e-01", "dlm_acc": "5.662e-01", "anc_acc": "5.451e-01", "epoch": 0.06153} {"step": 30770, "loss": 1.3318, "grad_norm": "4.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.176e-01", "anc_loss": "6.570e-01", "dlm_acc": "5.842e-01", "anc_acc": "5.633e-01", "epoch": 0.06154} {"step": 30775, "loss": 1.0145, "grad_norm": "3.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.801e-01", "anc_loss": "8.355e-01", "dlm_acc": "5.997e-01", "anc_acc": "5.809e-01", "epoch": 0.06155} {"step": 30780, "loss": 1.3498, "grad_norm": "5.440e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.613e-01", "anc_loss": "6.098e-01", "dlm_acc": "6.189e-01", "anc_acc": "5.882e-01", "epoch": 0.06156} {"step": 30785, "loss": 1.2369, "grad_norm": "5.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.382e+00", "anc_loss": "1.496e+00", "dlm_acc": "5.573e-01", "anc_acc": "5.328e-01", "epoch": 0.06157} {"step": 30790, "loss": 0.9953, "grad_norm": "5.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.637e-01", "anc_loss": "6.855e-01", "dlm_acc": "5.191e-01", "anc_acc": "5.034e-01", "epoch": 0.06158} {"step": 30795, "loss": 0.9043, "grad_norm": "4.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.430e-01", "anc_loss": "6.562e-01", "dlm_acc": "5.105e-01", "anc_acc": "5.021e-01", "epoch": 0.06159} {"step": 30800, "loss": 1.4349, "grad_norm": "3.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.234e-01", "anc_loss": "6.453e-01", "dlm_acc": "5.341e-01", "anc_acc": "5.230e-01", "epoch": 0.0616} {"step": 30805, "loss": 1.0337, "grad_norm": "3.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.285e-01", "anc_acc": "4.991e-01", "epoch": 0.06161} {"step": 30810, "loss": 1.0471, "grad_norm": "3.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.777e-01", "anc_loss": "1.073e+00", "dlm_acc": "5.930e-01", "anc_acc": "5.666e-01", "epoch": 0.06162} {"step": 30815, "loss": 0.9624, "grad_norm": "2.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.367e-01", "anc_loss": "6.586e-01", "dlm_acc": "5.693e-01", "anc_acc": "5.604e-01", "epoch": 0.06163} {"step": 30820, "loss": 1.1673, "grad_norm": "2.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.129e-01", "anc_loss": "6.281e-01", "dlm_acc": "5.625e-01", "anc_acc": "5.527e-01", "epoch": 0.06164} {"step": 30825, "loss": 1.1857, "grad_norm": "3.741e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.578e-01", "anc_loss": "8.945e-01", "dlm_acc": "4.964e-01", "anc_acc": "4.836e-01", "epoch": 0.06165} {"step": 30830, "loss": 0.8821, "grad_norm": "1.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.169e-01", "anc_loss": "1.256e-01", "dlm_acc": "9.428e-01", "anc_acc": "9.390e-01", "epoch": 0.06166} {"step": 30835, "loss": 1.1579, "grad_norm": "3.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.642e-01", "anc_loss": "1.811e-01", "dlm_acc": "8.921e-01", "anc_acc": "8.838e-01", "epoch": 0.06167} {"step": 30840, "loss": 1.3437, "grad_norm": "3.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.335e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.484e-01", "anc_acc": "5.285e-01", "epoch": 0.06168} {"step": 30845, "loss": 1.3464, "grad_norm": "3.452e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.614e+00", "anc_loss": "1.733e+00", "dlm_acc": "5.129e-01", "anc_acc": "4.895e-01", "epoch": 0.06169} {"step": 30850, "loss": 1.2663, "grad_norm": "4.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.122e+00", "dlm_acc": "6.022e-01", "anc_acc": "5.727e-01", "epoch": 0.0617} {"step": 30855, "loss": 1.5239, "grad_norm": "8.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.272e-01", "anc_acc": "5.041e-01", "epoch": 0.06171} {"step": 30860, "loss": 1.4241, "grad_norm": "3.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.973e-01", "anc_loss": "7.707e-01", "dlm_acc": "6.880e-01", "anc_acc": "6.634e-01", "epoch": 0.06172} {"step": 30865, "loss": 1.0828, "grad_norm": "3.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.159e+00", "dlm_acc": "6.082e-01", "anc_acc": "5.818e-01", "epoch": 0.06173} {"step": 30870, "loss": 1.156, "grad_norm": "2.547e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.219e-01", "anc_loss": "7.902e-01", "dlm_acc": "6.554e-01", "anc_acc": "6.231e-01", "epoch": 0.06174} {"step": 30875, "loss": 1.3805, "grad_norm": "5.290e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.147e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.920e-01", "anc_acc": "5.654e-01", "epoch": 0.06175} {"step": 30880, "loss": 1.2598, "grad_norm": "7.676e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.979e-01", "anc_loss": "9.885e-01", "dlm_acc": "6.722e-01", "anc_acc": "6.452e-01", "epoch": 0.06176} {"step": 30885, "loss": 1.4784, "grad_norm": "5.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.126e+00", "dlm_acc": "5.173e-01", "anc_acc": "5.038e-01", "epoch": 0.06177} {"step": 30890, "loss": 1.7002, "grad_norm": "1.140e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.777e+00", "anc_loss": "1.901e+00", "dlm_acc": "5.212e-01", "anc_acc": "4.984e-01", "epoch": 0.06178} {"step": 30895, "loss": 1.0455, "grad_norm": "3.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.578e-01", "anc_loss": "9.563e-01", "dlm_acc": "6.527e-01", "anc_acc": "6.250e-01", "epoch": 0.06179} {"step": 30900, "loss": 1.35, "grad_norm": "2.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.355e-01", "anc_loss": "6.844e-01", "dlm_acc": "6.346e-01", "anc_acc": "6.075e-01", "epoch": 0.0618} {"step": 30905, "loss": 0.8121, "grad_norm": "4.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.322e-01", "anc_loss": "5.816e-01", "dlm_acc": "6.852e-01", "anc_acc": "6.629e-01", "epoch": 0.06181} {"step": 30910, "loss": 0.7294, "grad_norm": "3.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.637e-01", "anc_loss": "5.102e-01", "dlm_acc": "7.308e-01", "anc_acc": "7.081e-01", "epoch": 0.06182} {"step": 30915, "loss": 0.9709, "grad_norm": "3.171e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.118e+00", "anc_loss": "1.238e+00", "dlm_acc": "5.946e-01", "anc_acc": "5.653e-01", "epoch": 0.06183} {"step": 30920, "loss": 1.6404, "grad_norm": "4.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.609e-01", "anc_loss": "6.668e-01", "dlm_acc": "7.956e-01", "anc_acc": "7.652e-01", "epoch": 0.06184} {"step": 30925, "loss": 1.468, "grad_norm": "3.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.116e+00", "dlm_acc": "6.672e-01", "anc_acc": "6.427e-01", "epoch": 0.06185} {"step": 30930, "loss": 1.4996, "grad_norm": "3.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.678e-01", "anc_acc": "5.397e-01", "epoch": 0.06186} {"step": 30935, "loss": 1.5533, "grad_norm": "3.361e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.606e-01", "anc_acc": "5.316e-01", "epoch": 0.06187} {"step": 30940, "loss": 1.7133, "grad_norm": "3.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.292e+00", "dlm_acc": "6.066e-01", "anc_acc": "5.765e-01", "epoch": 0.06188} {"step": 30945, "loss": 1.4535, "grad_norm": "3.601e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.332e+00", "dlm_acc": "6.007e-01", "anc_acc": "5.658e-01", "epoch": 0.06189} {"step": 30950, "loss": 1.8425, "grad_norm": "3.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.786e+00", "anc_loss": "1.914e+00", "dlm_acc": "4.783e-01", "anc_acc": "4.529e-01", "epoch": 0.0619} {"step": 30955, "loss": 1.583, "grad_norm": "2.253e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.521e-01", "anc_acc": "5.242e-01", "epoch": 0.06191} {"step": 30960, "loss": 1.5056, "grad_norm": "3.271e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.612e+00", "dlm_acc": "5.287e-01", "anc_acc": "5.032e-01", "epoch": 0.06192} {"step": 30965, "loss": 1.3197, "grad_norm": "3.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.468e-01", "anc_acc": "5.206e-01", "epoch": 0.06193} {"step": 30970, "loss": 1.157, "grad_norm": "3.185e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.196e+00", "anc_loss": "1.317e+00", "dlm_acc": "6.048e-01", "anc_acc": "5.741e-01", "epoch": 0.06194} {"step": 30975, "loss": 1.3122, "grad_norm": "2.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e+00", "anc_loss": "1.599e+00", "dlm_acc": "5.285e-01", "anc_acc": "5.024e-01", "epoch": 0.06195} {"step": 30980, "loss": 1.3344, "grad_norm": "4.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.435e+00", "anc_loss": "1.544e+00", "dlm_acc": "5.426e-01", "anc_acc": "5.189e-01", "epoch": 0.06196} {"step": 30985, "loss": 1.5025, "grad_norm": "3.601e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.382e-01", "anc_acc": "5.001e-01", "epoch": 0.06197} {"step": 30990, "loss": 1.7008, "grad_norm": "4.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.625e+00", "dlm_acc": "5.276e-01", "anc_acc": "5.036e-01", "epoch": 0.06198} {"step": 30995, "loss": 1.2556, "grad_norm": "4.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.726e-01", "anc_acc": "5.432e-01", "epoch": 0.06199} {"step": 31000, "loss": 1.124, "grad_norm": "5.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.805e-01", "anc_loss": "1.102e+00", "dlm_acc": "6.382e-01", "anc_acc": "6.070e-01", "epoch": 0.062} {"step": 31005, "loss": 1.0628, "grad_norm": "2.878e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.207e-01", "anc_acc": "5.002e-01", "epoch": 0.06201} {"step": 31010, "loss": 1.258, "grad_norm": "4.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.368e+00", "anc_loss": "1.436e+00", "dlm_acc": "3.509e-01", "anc_acc": "3.414e-01", "epoch": 0.06202} {"step": 31015, "loss": 1.062, "grad_norm": "2.792e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.477e-01", "anc_loss": "1.037e+00", "dlm_acc": "6.095e-01", "anc_acc": "5.837e-01", "epoch": 0.06203} {"step": 31020, "loss": 1.0066, "grad_norm": "1.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.850e-01", "anc_loss": "5.268e-01", "dlm_acc": "7.189e-01", "anc_acc": "6.964e-01", "epoch": 0.06204} {"step": 31025, "loss": 1.6769, "grad_norm": "4.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.578e-01", "anc_loss": "1.054e+00", "dlm_acc": "5.677e-01", "anc_acc": "5.374e-01", "epoch": 0.06205} {"step": 31030, "loss": 1.3706, "grad_norm": "3.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.186e+00", "dlm_acc": "5.222e-01", "anc_acc": "4.822e-01", "epoch": 0.06206} {"step": 31035, "loss": 1.2125, "grad_norm": "6.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.426e+00", "dlm_acc": "5.466e-01", "anc_acc": "5.157e-01", "epoch": 0.06207} {"step": 31040, "loss": 1.0804, "grad_norm": "4.883e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.404e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.217e-01", "anc_acc": "4.874e-01", "epoch": 0.06208} {"step": 31045, "loss": 0.9484, "grad_norm": "2.617e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.305e-01", "anc_loss": "1.027e+00", "dlm_acc": "6.192e-01", "anc_acc": "5.933e-01", "epoch": 0.06209} {"step": 31050, "loss": 1.051, "grad_norm": "4.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.043e-01", "anc_loss": "7.531e-01", "dlm_acc": "6.493e-01", "anc_acc": "6.291e-01", "epoch": 0.0621} {"step": 31055, "loss": 0.7066, "grad_norm": "1.066e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.734e-01", "anc_loss": "5.403e-01", "dlm_acc": "8.229e-01", "anc_acc": "8.058e-01", "epoch": 0.06211} {"step": 31060, "loss": 0.9863, "grad_norm": "2.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.827e-01", "anc_acc": "5.485e-01", "epoch": 0.06212} {"step": 31065, "loss": 1.0474, "grad_norm": "1.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.071e+00", "anc_loss": "1.184e+00", "dlm_acc": "5.958e-01", "anc_acc": "5.640e-01", "epoch": 0.06213} {"step": 31070, "loss": 1.0047, "grad_norm": "2.619e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.338e+00", "dlm_acc": "5.493e-01", "anc_acc": "5.159e-01", "epoch": 0.06214} {"step": 31075, "loss": 1.0156, "grad_norm": "3.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.174e+00", "dlm_acc": "5.805e-01", "anc_acc": "5.446e-01", "epoch": 0.06215} {"step": 31080, "loss": 1.2231, "grad_norm": "2.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.201e+00", "dlm_acc": "5.792e-01", "anc_acc": "5.478e-01", "epoch": 0.06216} {"step": 31085, "loss": 1.2681, "grad_norm": "3.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.919e-01", "anc_acc": "5.643e-01", "epoch": 0.06217} {"step": 31090, "loss": 0.8673, "grad_norm": "1.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.941e-01", "anc_loss": "9.039e-01", "dlm_acc": "6.772e-01", "anc_acc": "6.369e-01", "epoch": 0.06218} {"step": 31095, "loss": 0.8801, "grad_norm": "6.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.723e-01", "anc_loss": "8.945e-01", "dlm_acc": "6.632e-01", "anc_acc": "6.129e-01", "epoch": 0.06219} {"step": 31100, "loss": 1.109, "grad_norm": "6.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.832e-01", "anc_loss": "1.014e+00", "dlm_acc": "6.342e-01", "anc_acc": "5.861e-01", "epoch": 0.0622} {"step": 31105, "loss": 0.8579, "grad_norm": "4.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.939e-01", "anc_loss": "9.453e-01", "dlm_acc": "6.761e-01", "anc_acc": "6.213e-01", "epoch": 0.06221} {"step": 31110, "loss": 0.953, "grad_norm": "4.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.245e+00", "dlm_acc": "5.663e-01", "anc_acc": "5.299e-01", "epoch": 0.06222} {"step": 31115, "loss": 1.2116, "grad_norm": "5.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.013e+00", "anc_loss": "1.090e+00", "dlm_acc": "6.170e-01", "anc_acc": "5.973e-01", "epoch": 0.06223} {"step": 31120, "loss": 0.8481, "grad_norm": "3.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.485e-01", "anc_loss": "2.672e-01", "dlm_acc": "8.917e-01", "anc_acc": "8.860e-01", "epoch": 0.06224} {"step": 31125, "loss": 0.8235, "grad_norm": "1.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.332e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.566e-01", "anc_acc": "5.326e-01", "epoch": 0.06225} {"step": 31130, "loss": 0.5961, "grad_norm": "1.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.984e-01", "anc_loss": "1.173e+00", "dlm_acc": "6.141e-01", "anc_acc": "5.578e-01", "epoch": 0.06226} {"step": 31135, "loss": 0.8308, "grad_norm": "4.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.453e+00", "anc_loss": "1.481e+00", "dlm_acc": "4.559e-01", "anc_acc": "4.457e-01", "epoch": 0.06227} {"step": 31140, "loss": 0.8646, "grad_norm": "1.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.331e+00", "dlm_acc": "4.928e-01", "anc_acc": "4.631e-01", "epoch": 0.06228} {"step": 31145, "loss": 0.8135, "grad_norm": "2.842e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.157e+00", "dlm_acc": "5.795e-01", "anc_acc": "5.456e-01", "epoch": 0.06229} {"step": 31150, "loss": 1.4113, "grad_norm": "4.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.267e+00", "dlm_acc": "5.758e-01", "anc_acc": "5.499e-01", "epoch": 0.0623} {"step": 31155, "loss": 0.9623, "grad_norm": "5.761e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.622e+00", "anc_loss": "1.734e+00", "dlm_acc": "4.222e-01", "anc_acc": "3.965e-01", "epoch": 0.06231} {"step": 31160, "loss": 0.7534, "grad_norm": "3.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.204e+00", "dlm_acc": "5.887e-01", "anc_acc": "5.636e-01", "epoch": 0.06232} {"step": 31165, "loss": 0.9862, "grad_norm": "2.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.538e-01", "epoch": 0.06233} {"step": 31170, "loss": 1.2286, "grad_norm": "4.137e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.695e+00", "dlm_acc": "4.521e-01", "anc_acc": "4.296e-01", "epoch": 0.06234} {"step": 31175, "loss": 1.1152, "grad_norm": "3.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.047e+00", "anc_loss": "1.137e+00", "dlm_acc": "5.841e-01", "anc_acc": "5.603e-01", "epoch": 0.06235} {"step": 31180, "loss": 1.4878, "grad_norm": "3.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.023e-01", "anc_loss": "9.648e-01", "dlm_acc": "5.534e-01", "anc_acc": "5.297e-01", "epoch": 0.06236} {"step": 31185, "loss": 1.6631, "grad_norm": "3.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.043e-01", "anc_loss": "8.703e-01", "dlm_acc": "6.317e-01", "anc_acc": "6.080e-01", "epoch": 0.06237} {"step": 31190, "loss": 0.8051, "grad_norm": "2.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.410e-01", "anc_loss": "3.840e-01", "dlm_acc": "7.051e-01", "anc_acc": "6.694e-01", "epoch": 0.06238} {"step": 31195, "loss": 1.3593, "grad_norm": "5.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.148e-01", "anc_loss": "8.406e-01", "dlm_acc": "5.319e-01", "anc_acc": "5.244e-01", "epoch": 0.06239} {"step": 31200, "loss": 1.2206, "grad_norm": "1.256e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.238e+00", "dlm_acc": "6.210e-01", "anc_acc": "6.041e-01", "epoch": 0.0624} {"step": 31205, "loss": 0.6533, "grad_norm": "1.158e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.513e-01", "anc_loss": "2.681e-01", "dlm_acc": "8.482e-01", "anc_acc": "8.415e-01", "epoch": 0.06241} {"step": 31210, "loss": 1.2388, "grad_norm": "1.032e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.913e-01", "anc_acc": "5.685e-01", "epoch": 0.06242} {"step": 31215, "loss": 0.7652, "grad_norm": "3.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.541e-01", "anc_loss": "8.174e-01", "dlm_acc": "6.611e-01", "anc_acc": "6.425e-01", "epoch": 0.06243} {"step": 31220, "loss": 1.1858, "grad_norm": "6.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.341e+00", "dlm_acc": "4.913e-01", "anc_acc": "4.699e-01", "epoch": 0.06244} {"step": 31225, "loss": 1.7135, "grad_norm": "5.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.539e-01", "anc_acc": "5.257e-01", "epoch": 0.06245} {"step": 31230, "loss": 1.3043, "grad_norm": "3.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.146e+00", "dlm_acc": "6.321e-01", "anc_acc": "6.059e-01", "epoch": 0.06246} {"step": 31235, "loss": 1.4347, "grad_norm": "2.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.499e-01", "anc_acc": "5.241e-01", "epoch": 0.06247} {"step": 31240, "loss": 0.9678, "grad_norm": "5.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.938e-01", "anc_loss": "5.437e-01", "dlm_acc": "7.469e-01", "anc_acc": "7.320e-01", "epoch": 0.06248} {"step": 31245, "loss": 1.1838, "grad_norm": "5.382e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.218e+00", "dlm_acc": "5.301e-01", "anc_acc": "5.141e-01", "epoch": 0.06249} {"step": 31250, "loss": 1.1355, "grad_norm": "4.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.098e-01", "anc_loss": "6.816e-01", "dlm_acc": "6.706e-01", "anc_acc": "6.447e-01", "epoch": 0.0625} {"step": 31255, "loss": 1.0382, "grad_norm": "2.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.672e-01", "anc_loss": "9.199e-01", "dlm_acc": "5.026e-01", "anc_acc": "4.801e-01", "epoch": 0.06251} {"step": 31260, "loss": 1.0156, "grad_norm": "3.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.617e-01", "anc_loss": "5.969e-01", "dlm_acc": "5.910e-01", "anc_acc": "5.719e-01", "epoch": 0.06252} {"step": 31265, "loss": 1.1754, "grad_norm": "4.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.098e-01", "anc_loss": "6.398e-01", "dlm_acc": "5.662e-01", "anc_acc": "5.460e-01", "epoch": 0.06253} {"step": 31270, "loss": 1.111, "grad_norm": "3.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.355e-01", "anc_loss": "5.652e-01", "dlm_acc": "6.115e-01", "anc_acc": "5.922e-01", "epoch": 0.06254} {"step": 31275, "loss": 1.1367, "grad_norm": "2.837e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.703e-01", "anc_loss": "6.062e-01", "dlm_acc": "5.845e-01", "anc_acc": "5.634e-01", "epoch": 0.06255} {"step": 31280, "loss": 1.0519, "grad_norm": "3.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.156e-01", "anc_loss": "5.508e-01", "dlm_acc": "6.146e-01", "anc_acc": "5.923e-01", "epoch": 0.06256} {"step": 31285, "loss": 1.3402, "grad_norm": "3.869e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.350e+00", "anc_loss": "1.440e+00", "dlm_acc": "5.578e-01", "anc_acc": "5.355e-01", "epoch": 0.06257} {"step": 31290, "loss": 1.6143, "grad_norm": "4.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.610e+00", "anc_loss": "1.744e+00", "dlm_acc": "5.055e-01", "anc_acc": "4.775e-01", "epoch": 0.06258} {"step": 31295, "loss": 1.0001, "grad_norm": "4.461e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.625e-01", "anc_loss": "8.410e-01", "dlm_acc": "6.417e-01", "anc_acc": "6.167e-01", "epoch": 0.06259} {"step": 31300, "loss": 1.3926, "grad_norm": "3.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.094e+00", "dlm_acc": "6.550e-01", "anc_acc": "6.362e-01", "epoch": 0.0626} {"step": 31305, "loss": 1.0083, "grad_norm": "3.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.816e-01", "anc_loss": "8.391e-01", "dlm_acc": "6.281e-01", "anc_acc": "6.097e-01", "epoch": 0.06261} {"step": 31310, "loss": 0.8691, "grad_norm": "4.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.244e-01", "anc_loss": "4.408e-01", "dlm_acc": "7.170e-01", "anc_acc": "7.081e-01", "epoch": 0.06262} {"step": 31315, "loss": 0.9516, "grad_norm": "2.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.160e-01", "anc_loss": "4.344e-01", "dlm_acc": "6.866e-01", "anc_acc": "6.759e-01", "epoch": 0.06263} {"step": 31320, "loss": 1.1934, "grad_norm": "9.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.633e-01", "anc_loss": "4.938e-01", "dlm_acc": "7.503e-01", "anc_acc": "7.323e-01", "epoch": 0.06264} {"step": 31325, "loss": 0.9165, "grad_norm": "1.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.861e-01", "anc_loss": "3.057e-01", "dlm_acc": "7.765e-01", "anc_acc": "7.630e-01", "epoch": 0.06265} {"step": 31330, "loss": 1.1549, "grad_norm": "4.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.961e-01", "anc_loss": "5.191e-01", "dlm_acc": "6.712e-01", "anc_acc": "6.570e-01", "epoch": 0.06266} {"step": 31335, "loss": 0.7077, "grad_norm": "2.814e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.404e-01", "anc_loss": "3.673e-01", "dlm_acc": "7.828e-01", "anc_acc": "7.647e-01", "epoch": 0.06267} {"step": 31340, "loss": 1.073, "grad_norm": "2.707e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.969e-01", "anc_loss": "7.367e-01", "dlm_acc": "6.452e-01", "anc_acc": "6.321e-01", "epoch": 0.06268} {"step": 31345, "loss": 1.1707, "grad_norm": "3.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.496e-01", "anc_loss": "7.064e-01", "dlm_acc": "6.868e-01", "anc_acc": "6.667e-01", "epoch": 0.06269} {"step": 31350, "loss": 1.3766, "grad_norm": "3.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.556e+00", "dlm_acc": "5.189e-01", "anc_acc": "4.960e-01", "epoch": 0.0627} {"step": 31355, "loss": 0.8878, "grad_norm": "4.366e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.131e-01", "anc_loss": "4.631e-01", "dlm_acc": "7.949e-01", "anc_acc": "7.751e-01", "epoch": 0.06271} {"step": 31360, "loss": 0.9876, "grad_norm": "2.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.496e-01", "anc_loss": "1.049e+00", "dlm_acc": "6.026e-01", "anc_acc": "5.782e-01", "epoch": 0.06272} {"step": 31365, "loss": 1.1447, "grad_norm": "2.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.363e-01", "anc_loss": "7.887e-01", "dlm_acc": "6.112e-01", "anc_acc": "5.890e-01", "epoch": 0.06273} {"step": 31370, "loss": 1.1028, "grad_norm": "3.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.805e-01", "anc_loss": "8.359e-01", "dlm_acc": "5.898e-01", "anc_acc": "5.740e-01", "epoch": 0.06274} {"step": 31375, "loss": 1.0264, "grad_norm": "4.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.414e-01", "anc_loss": "9.086e-01", "dlm_acc": "6.398e-01", "anc_acc": "6.222e-01", "epoch": 0.06275} {"step": 31380, "loss": 1.1056, "grad_norm": "3.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.203e+00", "dlm_acc": "6.102e-01", "anc_acc": "5.824e-01", "epoch": 0.06276} {"step": 31385, "loss": 1.2364, "grad_norm": "4.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.061e+00", "anc_loss": "1.144e+00", "dlm_acc": "5.846e-01", "anc_acc": "5.613e-01", "epoch": 0.06277} {"step": 31390, "loss": 1.2947, "grad_norm": "2.524e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.193e+00", "dlm_acc": "6.366e-01", "anc_acc": "6.086e-01", "epoch": 0.06278} {"step": 31395, "loss": 0.7702, "grad_norm": "2.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.705e-01", "anc_loss": "8.439e-01", "dlm_acc": "6.348e-01", "anc_acc": "6.088e-01", "epoch": 0.06279} {"step": 31400, "loss": 1.0875, "grad_norm": "2.531e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.434e-01", "anc_loss": "8.953e-01", "dlm_acc": "5.467e-01", "anc_acc": "5.315e-01", "epoch": 0.0628} {"step": 31405, "loss": 1.5697, "grad_norm": "4.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.303e+00", "dlm_acc": "4.911e-01", "anc_acc": "4.676e-01", "epoch": 0.06281} {"step": 31410, "loss": 0.8832, "grad_norm": "4.234e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.060e+00", "anc_loss": "1.131e+00", "dlm_acc": "6.262e-01", "anc_acc": "6.074e-01", "epoch": 0.06282} {"step": 31415, "loss": 0.9462, "grad_norm": "3.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.150e+00", "dlm_acc": "5.419e-01", "anc_acc": "5.182e-01", "epoch": 0.06283} {"step": 31420, "loss": 0.9865, "grad_norm": "3.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.434e-01", "anc_loss": "6.578e-01", "dlm_acc": "5.364e-01", "anc_acc": "5.277e-01", "epoch": 0.06284} {"step": 31425, "loss": 1.1366, "grad_norm": "2.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.352e-01", "anc_loss": "6.516e-01", "dlm_acc": "4.983e-01", "anc_acc": "4.893e-01", "epoch": 0.06285} {"step": 31430, "loss": 1.7159, "grad_norm": "3.182e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.102e-01", "anc_loss": "9.477e-01", "dlm_acc": "5.784e-01", "anc_acc": "5.674e-01", "epoch": 0.06286} {"step": 31435, "loss": 1.1761, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.969e-01", "anc_loss": "8.582e-01", "dlm_acc": "6.159e-01", "anc_acc": "5.977e-01", "epoch": 0.06287} {"step": 31440, "loss": 1.1753, "grad_norm": "3.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.063e+00", "anc_loss": "1.142e+00", "dlm_acc": "5.678e-01", "anc_acc": "5.459e-01", "epoch": 0.06288} {"step": 31445, "loss": 0.7759, "grad_norm": "3.255e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.160e-01", "anc_loss": "5.496e-01", "dlm_acc": "5.984e-01", "anc_acc": "5.744e-01", "epoch": 0.06289} {"step": 31450, "loss": 1.2691, "grad_norm": "7.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.148e+00", "dlm_acc": "6.181e-01", "anc_acc": "5.927e-01", "epoch": 0.0629} {"step": 31455, "loss": 0.9651, "grad_norm": "4.744e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.113e-01", "anc_loss": "1.004e+00", "dlm_acc": "6.361e-01", "anc_acc": "6.086e-01", "epoch": 0.06291} {"step": 31460, "loss": 1.1858, "grad_norm": "3.516e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.641e-01", "anc_loss": "9.219e-01", "dlm_acc": "5.718e-01", "anc_acc": "5.548e-01", "epoch": 0.06292} {"step": 31465, "loss": 1.15, "grad_norm": "2.304e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.332e-01", "anc_loss": "8.770e-01", "dlm_acc": "5.843e-01", "anc_acc": "5.680e-01", "epoch": 0.06293} {"step": 31470, "loss": 1.2013, "grad_norm": "3.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.221e-01", "anc_loss": "5.613e-01", "dlm_acc": "6.714e-01", "anc_acc": "6.533e-01", "epoch": 0.06294} {"step": 31475, "loss": 1.1036, "grad_norm": "4.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.455e-01", "anc_loss": "4.672e-01", "dlm_acc": "7.301e-01", "anc_acc": "7.170e-01", "epoch": 0.06295} {"step": 31480, "loss": 1.2848, "grad_norm": "2.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.961e-01", "anc_loss": "9.766e-01", "dlm_acc": "6.481e-01", "anc_acc": "6.244e-01", "epoch": 0.06296} {"step": 31485, "loss": 1.7091, "grad_norm": "3.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.804e-01", "anc_loss": "8.762e-01", "dlm_acc": "6.924e-01", "anc_acc": "6.624e-01", "epoch": 0.06297} {"step": 31490, "loss": 1.006, "grad_norm": "2.908e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.945e-01", "anc_loss": "6.594e-01", "dlm_acc": "6.481e-01", "anc_acc": "6.239e-01", "epoch": 0.06298} {"step": 31495, "loss": 1.3136, "grad_norm": "4.050e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.164e+00", "dlm_acc": "6.166e-01", "anc_acc": "5.954e-01", "epoch": 0.06299} {"step": 31500, "loss": 1.3135, "grad_norm": "3.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.456e-01", "anc_loss": "8.416e-01", "dlm_acc": "7.693e-01", "anc_acc": "7.445e-01", "epoch": 0.063} {"step": 31505, "loss": 1.0844, "grad_norm": "4.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.141e-01", "anc_loss": "8.961e-01", "dlm_acc": "6.448e-01", "anc_acc": "6.224e-01", "epoch": 0.06301} {"step": 31510, "loss": 1.3145, "grad_norm": "3.602e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.602e-01", "anc_loss": "8.250e-01", "dlm_acc": "6.019e-01", "anc_acc": "5.731e-01", "epoch": 0.06302} {"step": 31515, "loss": 1.0455, "grad_norm": "4.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.197e+00", "dlm_acc": "5.742e-01", "anc_acc": "5.537e-01", "epoch": 0.06303} {"step": 31520, "loss": 1.1751, "grad_norm": "6.312e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.480e-01", "anc_loss": "6.746e-01", "dlm_acc": "5.611e-01", "anc_acc": "5.487e-01", "epoch": 0.06304} {"step": 31525, "loss": 0.9714, "grad_norm": "3.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.887e-01", "anc_loss": "1.067e+00", "dlm_acc": "5.790e-01", "anc_acc": "5.547e-01", "epoch": 0.06305} {"step": 31530, "loss": 0.7151, "grad_norm": "2.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.851e-01", "anc_loss": "3.246e-01", "dlm_acc": "8.547e-01", "anc_acc": "8.417e-01", "epoch": 0.06306} {"step": 31535, "loss": 0.9484, "grad_norm": "4.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.800e-01", "anc_loss": "3.126e-01", "dlm_acc": "8.853e-01", "anc_acc": "8.755e-01", "epoch": 0.06307} {"step": 31540, "loss": 1.1981, "grad_norm": "6.958e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.092e-01", "anc_loss": "6.711e-01", "dlm_acc": "8.040e-01", "anc_acc": "7.884e-01", "epoch": 0.06308} {"step": 31545, "loss": 1.2485, "grad_norm": "2.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.474e+00", "dlm_acc": "5.083e-01", "anc_acc": "4.890e-01", "epoch": 0.06309} {"step": 31550, "loss": 1.0864, "grad_norm": "3.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.260e+00", "dlm_acc": "5.378e-01", "anc_acc": "5.108e-01", "epoch": 0.0631} {"step": 31555, "loss": 1.2101, "grad_norm": "2.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.104e+00", "dlm_acc": "5.057e-01", "anc_acc": "4.854e-01", "epoch": 0.06311} {"step": 31560, "loss": 1.2915, "grad_norm": "1.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.469e-01", "anc_loss": "1.032e+00", "dlm_acc": "6.182e-01", "anc_acc": "5.967e-01", "epoch": 0.06312} {"step": 31565, "loss": 0.8336, "grad_norm": "4.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.902e-01", "anc_loss": "5.367e-01", "dlm_acc": "7.431e-01", "anc_acc": "7.330e-01", "epoch": 0.06313} {"step": 31570, "loss": 0.9675, "grad_norm": "3.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.358e+00", "anc_loss": "1.474e+00", "dlm_acc": "5.196e-01", "anc_acc": "4.942e-01", "epoch": 0.06314} {"step": 31575, "loss": 1.0493, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.424e-01", "anc_loss": "7.973e-01", "dlm_acc": "6.373e-01", "anc_acc": "6.179e-01", "epoch": 0.06315} {"step": 31580, "loss": 0.882, "grad_norm": "4.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.350e-01", "anc_loss": "5.726e-01", "dlm_acc": "7.006e-01", "anc_acc": "6.820e-01", "epoch": 0.06316} {"step": 31585, "loss": 1.291, "grad_norm": "3.792e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.072e+00", "dlm_acc": "4.258e-01", "anc_acc": "4.131e-01", "epoch": 0.06317} {"step": 31590, "loss": 1.0248, "grad_norm": "4.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.180e-01", "anc_loss": "9.563e-01", "dlm_acc": "4.685e-01", "anc_acc": "4.523e-01", "epoch": 0.06318} {"step": 31595, "loss": 0.7513, "grad_norm": "1.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.785e-01", "anc_loss": "8.258e-01", "dlm_acc": "5.645e-01", "anc_acc": "5.453e-01", "epoch": 0.06319} {"step": 31600, "loss": 0.884, "grad_norm": "3.267e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.070e-01", "anc_loss": "7.760e-01", "dlm_acc": "7.194e-01", "anc_acc": "7.013e-01", "epoch": 0.0632} {"step": 31605, "loss": 1.1147, "grad_norm": "3.813e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.136e+00", "dlm_acc": "6.765e-01", "anc_acc": "6.687e-01", "epoch": 0.06321} {"step": 31610, "loss": 1.212, "grad_norm": "5.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.047e-01", "anc_loss": "8.396e-01", "dlm_acc": "5.663e-01", "anc_acc": "5.569e-01", "epoch": 0.06322} {"step": 31615, "loss": 1.3531, "grad_norm": "3.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.984e-01", "anc_loss": "9.031e-01", "dlm_acc": "3.330e-01", "anc_acc": "3.315e-01", "epoch": 0.06323} {"step": 31620, "loss": 1.3043, "grad_norm": "3.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.992e-01", "anc_loss": "9.062e-01", "dlm_acc": "3.453e-01", "anc_acc": "3.423e-01", "epoch": 0.06324} {"step": 31625, "loss": 1.152, "grad_norm": "3.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.961e-01", "anc_loss": "8.000e-01", "dlm_acc": "3.563e-01", "anc_acc": "3.538e-01", "epoch": 0.06325} {"step": 31630, "loss": 1.1254, "grad_norm": "2.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.789e-01", "anc_loss": "7.859e-01", "dlm_acc": "3.590e-01", "anc_acc": "3.539e-01", "epoch": 0.06326} {"step": 31635, "loss": 1.151, "grad_norm": "2.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.781e-01", "anc_loss": "7.812e-01", "dlm_acc": "3.539e-01", "anc_acc": "3.491e-01", "epoch": 0.06327} {"step": 31640, "loss": 1.1255, "grad_norm": "4.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.359e-01", "anc_loss": "8.414e-01", "dlm_acc": "3.446e-01", "anc_acc": "3.421e-01", "epoch": 0.06328} {"step": 31645, "loss": 1.3581, "grad_norm": "7.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.098e-01", "anc_loss": "8.199e-01", "dlm_acc": "4.417e-01", "anc_acc": "4.368e-01", "epoch": 0.06329} {"step": 31650, "loss": 0.8842, "grad_norm": "2.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.902e-01", "anc_loss": "1.079e+00", "dlm_acc": "6.226e-01", "anc_acc": "6.023e-01", "epoch": 0.0633} {"step": 31655, "loss": 0.8677, "grad_norm": "4.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.527e-01", "anc_loss": "3.838e-01", "dlm_acc": "7.799e-01", "anc_acc": "7.663e-01", "epoch": 0.06331} {"step": 31660, "loss": 1.1826, "grad_norm": "4.173e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.734e-01", "anc_loss": "4.045e-01", "dlm_acc": "7.442e-01", "anc_acc": "7.253e-01", "epoch": 0.06332} {"step": 31665, "loss": 1.0693, "grad_norm": "3.911e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.120e-01", "anc_loss": "6.803e-01", "dlm_acc": "7.655e-01", "anc_acc": "7.495e-01", "epoch": 0.06333} {"step": 31670, "loss": 1.5721, "grad_norm": "5.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.260e-01", "epoch": 0.06334} {"step": 31675, "loss": 1.0443, "grad_norm": "1.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.779e-01", "anc_loss": "7.483e-01", "dlm_acc": "7.303e-01", "anc_acc": "7.083e-01", "epoch": 0.06335} {"step": 31680, "loss": 1.1839, "grad_norm": "2.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.961e-01", "anc_loss": "6.410e-01", "dlm_acc": "6.940e-01", "anc_acc": "6.758e-01", "epoch": 0.06336} {"step": 31685, "loss": 1.0336, "grad_norm": "1.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.762e-01", "anc_loss": "6.941e-01", "dlm_acc": "6.070e-01", "anc_acc": "6.007e-01", "epoch": 0.06337} {"step": 31690, "loss": 1.0754, "grad_norm": "2.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.571e-01", "anc_loss": "2.663e-01", "dlm_acc": "8.345e-01", "anc_acc": "8.295e-01", "epoch": 0.06338} {"step": 31695, "loss": 1.1636, "grad_norm": "6.516e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.822e-01", "anc_loss": "2.941e-01", "dlm_acc": "8.270e-01", "anc_acc": "8.206e-01", "epoch": 0.06339} {"step": 31700, "loss": 0.8829, "grad_norm": "6.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.711e-01", "anc_loss": "2.877e-01", "dlm_acc": "8.171e-01", "anc_acc": "8.108e-01", "epoch": 0.0634} {"step": 31705, "loss": 1.1843, "grad_norm": "2.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.764e-01", "anc_loss": "2.848e-01", "dlm_acc": "8.264e-01", "anc_acc": "8.219e-01", "epoch": 0.06341} {"step": 31710, "loss": 0.9067, "grad_norm": "2.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.867e-01", "anc_loss": "2.990e-01", "dlm_acc": "8.151e-01", "anc_acc": "8.111e-01", "epoch": 0.06342} {"step": 31715, "loss": 1.2195, "grad_norm": "4.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.467e-01", "anc_acc": "5.293e-01", "epoch": 0.06343} {"step": 31720, "loss": 1.371, "grad_norm": "6.041e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.037e-01", "anc_acc": "4.807e-01", "epoch": 0.06344} {"step": 31725, "loss": 1.1548, "grad_norm": "4.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.809e-01", "anc_loss": "9.516e-01", "dlm_acc": "5.628e-01", "anc_acc": "5.389e-01", "epoch": 0.06345} {"step": 31730, "loss": 1.2267, "grad_norm": "3.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.834e-01", "anc_acc": "5.587e-01", "epoch": 0.06346} {"step": 31735, "loss": 1.2354, "grad_norm": "3.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.657e-01", "anc_loss": "8.314e-01", "dlm_acc": "7.297e-01", "anc_acc": "7.140e-01", "epoch": 0.06347} {"step": 31740, "loss": 1.2151, "grad_norm": "4.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.883e-01", "anc_loss": "9.984e-01", "dlm_acc": "6.787e-01", "anc_acc": "6.514e-01", "epoch": 0.06348} {"step": 31745, "loss": 1.1153, "grad_norm": "4.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.158e+00", "dlm_acc": "6.101e-01", "anc_acc": "5.860e-01", "epoch": 0.06349} {"step": 31750, "loss": 1.5213, "grad_norm": "6.088e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.772e-01", "anc_acc": "5.567e-01", "epoch": 0.0635} {"step": 31755, "loss": 1.0412, "grad_norm": "2.787e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.812e-01", "anc_loss": "3.834e-01", "dlm_acc": "7.243e-01", "anc_acc": "7.221e-01", "epoch": 0.06351} {"step": 31760, "loss": 1.5433, "grad_norm": "6.694e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.031e-01", "anc_loss": "6.051e-01", "dlm_acc": "6.835e-01", "anc_acc": "6.795e-01", "epoch": 0.06352} {"step": 31765, "loss": 1.2296, "grad_norm": "4.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.930e-01", "anc_loss": "8.434e-01", "dlm_acc": "4.568e-01", "anc_acc": "4.430e-01", "epoch": 0.06353} {"step": 31770, "loss": 0.9978, "grad_norm": "2.952e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.379e-01", "anc_loss": "1.007e+00", "dlm_acc": "6.438e-01", "anc_acc": "6.265e-01", "epoch": 0.06354} {"step": 31775, "loss": 1.1606, "grad_norm": "7.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.865e-01", "anc_acc": "5.615e-01", "epoch": 0.06355} {"step": 31780, "loss": 1.0817, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.180e-01", "anc_loss": "6.629e-01", "dlm_acc": "7.630e-01", "anc_acc": "7.489e-01", "epoch": 0.06356} {"step": 31785, "loss": 1.1745, "grad_norm": "4.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.881e-01", "anc_loss": "9.656e-01", "dlm_acc": "6.831e-01", "anc_acc": "6.647e-01", "epoch": 0.06357} {"step": 31790, "loss": 1.4974, "grad_norm": "4.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.089e+00", "anc_loss": "1.152e+00", "dlm_acc": "5.840e-01", "anc_acc": "5.670e-01", "epoch": 0.06358} {"step": 31795, "loss": 0.8538, "grad_norm": "1.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.965e-01", "anc_loss": "4.199e-01", "dlm_acc": "7.004e-01", "anc_acc": "6.867e-01", "epoch": 0.06359} {"step": 31800, "loss": 1.0017, "grad_norm": "3.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.273e-01", "anc_loss": "1.013e+00", "dlm_acc": "6.582e-01", "anc_acc": "6.340e-01", "epoch": 0.0636} {"step": 31805, "loss": 0.9574, "grad_norm": "2.832e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.133e-01", "anc_loss": "7.953e-01", "dlm_acc": "7.258e-01", "anc_acc": "7.019e-01", "epoch": 0.06361} {"step": 31810, "loss": 1.1778, "grad_norm": "1.007e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.087e+00", "dlm_acc": "5.959e-01", "anc_acc": "5.779e-01", "epoch": 0.06362} {"step": 31815, "loss": 0.8054, "grad_norm": "3.252e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.079e-01", "anc_loss": "7.678e-01", "dlm_acc": "7.288e-01", "anc_acc": "7.138e-01", "epoch": 0.06363} {"step": 31820, "loss": 0.9488, "grad_norm": "6.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.703e-01", "anc_loss": "9.430e-01", "dlm_acc": "5.921e-01", "anc_acc": "5.740e-01", "epoch": 0.06364} {"step": 31825, "loss": 0.7229, "grad_norm": "4.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.623e-01", "anc_loss": "8.268e-01", "dlm_acc": "6.564e-01", "anc_acc": "6.384e-01", "epoch": 0.06365} {"step": 31830, "loss": 1.1171, "grad_norm": "6.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.222e+00", "dlm_acc": "6.456e-01", "anc_acc": "6.311e-01", "epoch": 0.06366} {"step": 31835, "loss": 1.2879, "grad_norm": "5.166e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.015e+00", "anc_loss": "1.097e+00", "dlm_acc": "6.221e-01", "anc_acc": "6.014e-01", "epoch": 0.06367} {"step": 31840, "loss": 0.8639, "grad_norm": "4.273e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.666e-01", "anc_loss": "8.443e-01", "dlm_acc": "7.299e-01", "anc_acc": "7.073e-01", "epoch": 0.06368} {"step": 31845, "loss": 0.9069, "grad_norm": "3.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.633e-01", "anc_loss": "8.730e-01", "dlm_acc": "6.938e-01", "anc_acc": "6.647e-01", "epoch": 0.06369} {"step": 31850, "loss": 0.8901, "grad_norm": "3.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.289e-01", "anc_loss": "5.927e-01", "dlm_acc": "7.673e-01", "anc_acc": "7.479e-01", "epoch": 0.0637} {"step": 31855, "loss": 0.9525, "grad_norm": "2.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.973e-01", "anc_loss": "6.469e-01", "dlm_acc": "6.158e-01", "anc_acc": "5.950e-01", "epoch": 0.06371} {"step": 31860, "loss": 0.9289, "grad_norm": "2.979e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.633e-01", "anc_loss": "4.844e-01", "dlm_acc": "6.470e-01", "anc_acc": "6.386e-01", "epoch": 0.06372} {"step": 31865, "loss": 1.2293, "grad_norm": "6.478e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.367e-01", "anc_loss": "5.648e-01", "dlm_acc": "6.070e-01", "anc_acc": "5.967e-01", "epoch": 0.06373} {"step": 31870, "loss": 0.9846, "grad_norm": "2.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.281e-01", "anc_loss": "4.561e-01", "dlm_acc": "6.619e-01", "anc_acc": "6.476e-01", "epoch": 0.06374} {"step": 31875, "loss": 1.0385, "grad_norm": "3.436e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.680e-01", "anc_loss": "4.898e-01", "dlm_acc": "6.515e-01", "anc_acc": "6.417e-01", "epoch": 0.06375} {"step": 31880, "loss": 1.2349, "grad_norm": "2.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.711e-01", "anc_loss": "6.039e-01", "dlm_acc": "6.192e-01", "anc_acc": "6.056e-01", "epoch": 0.06376} {"step": 31885, "loss": 1.1703, "grad_norm": "4.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.512e-01", "anc_loss": "5.809e-01", "dlm_acc": "6.168e-01", "anc_acc": "6.060e-01", "epoch": 0.06377} {"step": 31890, "loss": 1.1911, "grad_norm": "3.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.863e-01", "anc_loss": "7.719e-01", "dlm_acc": "5.786e-01", "anc_acc": "5.508e-01", "epoch": 0.06378} {"step": 31895, "loss": 1.0878, "grad_norm": "2.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.372e-01", "anc_acc": "5.110e-01", "epoch": 0.06379} {"step": 31900, "loss": 1.5917, "grad_norm": "5.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.409e-01", "anc_acc": "5.156e-01", "epoch": 0.0638} {"step": 31905, "loss": 1.1957, "grad_norm": "6.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.709e-01", "anc_acc": "5.301e-01", "epoch": 0.06381} {"step": 31910, "loss": 1.0353, "grad_norm": "2.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.248e+00", "dlm_acc": "5.228e-01", "anc_acc": "4.967e-01", "epoch": 0.06382} {"step": 31915, "loss": 1.2319, "grad_norm": "3.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.754e+00", "anc_loss": "1.845e+00", "dlm_acc": "4.395e-01", "anc_acc": "4.199e-01", "epoch": 0.06383} {"step": 31920, "loss": 0.916, "grad_norm": "5.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.333e+00", "dlm_acc": "4.865e-01", "anc_acc": "4.638e-01", "epoch": 0.06384} {"step": 31925, "loss": 1.2054, "grad_norm": "3.108e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e+00", "anc_loss": "1.705e+00", "dlm_acc": "4.630e-01", "anc_acc": "4.417e-01", "epoch": 0.06385} {"step": 31930, "loss": 1.1229, "grad_norm": "6.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.302e-01", "anc_loss": "8.928e-01", "dlm_acc": "7.293e-01", "anc_acc": "7.127e-01", "epoch": 0.06386} {"step": 31935, "loss": 0.8485, "grad_norm": "6.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.172e-01", "anc_loss": "1.032e+00", "dlm_acc": "6.236e-01", "anc_acc": "6.010e-01", "epoch": 0.06387} {"step": 31940, "loss": 1.3585, "grad_norm": "4.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.859e-01", "anc_loss": "4.063e-01", "dlm_acc": "8.782e-01", "anc_acc": "8.742e-01", "epoch": 0.06388} {"step": 31945, "loss": 1.37, "grad_norm": "3.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.512e+00", "anc_loss": "1.646e+00", "dlm_acc": "5.226e-01", "anc_acc": "4.927e-01", "epoch": 0.06389} {"step": 31950, "loss": 1.5774, "grad_norm": "5.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.418e+00", "anc_loss": "1.534e+00", "dlm_acc": "5.057e-01", "anc_acc": "4.779e-01", "epoch": 0.0639} {"step": 31955, "loss": 1.0401, "grad_norm": "2.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.293e+00", "dlm_acc": "5.304e-01", "anc_acc": "5.027e-01", "epoch": 0.06391} {"step": 31960, "loss": 1.1315, "grad_norm": "3.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.346e+00", "dlm_acc": "5.791e-01", "anc_acc": "5.504e-01", "epoch": 0.06392} {"step": 31965, "loss": 1.3734, "grad_norm": "4.836e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.831e+00", "anc_loss": "1.930e+00", "dlm_acc": "3.301e-01", "anc_acc": "3.121e-01", "epoch": 0.06393} {"step": 31970, "loss": 1.1668, "grad_norm": "2.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.276e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.223e-01", "anc_acc": "5.005e-01", "epoch": 0.06394} {"step": 31975, "loss": 1.3533, "grad_norm": "3.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.472e+00", "dlm_acc": "5.261e-01", "anc_acc": "4.991e-01", "epoch": 0.06395} {"step": 31980, "loss": 1.2232, "grad_norm": "4.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.595e+00", "dlm_acc": "5.364e-01", "anc_acc": "5.050e-01", "epoch": 0.06396} {"step": 31985, "loss": 1.0549, "grad_norm": "3.961e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.730e-01", "anc_acc": "5.475e-01", "epoch": 0.06397} {"step": 31990, "loss": 1.1284, "grad_norm": "2.347e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.367e+00", "dlm_acc": "5.859e-01", "anc_acc": "5.657e-01", "epoch": 0.06398} {"step": 31995, "loss": 1.2589, "grad_norm": "5.845e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.797e-01", "anc_loss": "7.684e-01", "dlm_acc": "7.140e-01", "anc_acc": "6.911e-01", "epoch": 0.06399} {"step": 32000, "loss": 0.9532, "grad_norm": "2.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.039e-01", "anc_loss": "6.168e-01", "dlm_acc": "7.696e-01", "anc_acc": "7.376e-01", "epoch": 0.064} {"step": 32005, "loss": 1.1271, "grad_norm": "4.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.297e-01", "anc_loss": "8.184e-01", "dlm_acc": "6.610e-01", "anc_acc": "6.327e-01", "epoch": 0.06401} {"step": 32010, "loss": 1.4491, "grad_norm": "4.602e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.109e-01", "anc_loss": "9.641e-01", "dlm_acc": "5.227e-01", "anc_acc": "5.008e-01", "epoch": 0.06402} {"step": 32015, "loss": 0.7711, "grad_norm": "2.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.199e-01", "anc_loss": "5.465e-01", "dlm_acc": "5.622e-01", "anc_acc": "5.440e-01", "epoch": 0.06403} {"step": 32020, "loss": 0.8591, "grad_norm": "5.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.535e-01", "anc_loss": "5.797e-01", "dlm_acc": "5.740e-01", "anc_acc": "5.572e-01", "epoch": 0.06404} {"step": 32025, "loss": 1.207, "grad_norm": "3.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.305e-01", "anc_loss": "6.531e-01", "dlm_acc": "5.170e-01", "anc_acc": "5.075e-01", "epoch": 0.06405} {"step": 32030, "loss": 1.0017, "grad_norm": "4.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.203e-01", "anc_loss": "9.516e-01", "dlm_acc": "4.305e-01", "anc_acc": "4.209e-01", "epoch": 0.06406} {"step": 32035, "loss": 1.2161, "grad_norm": "2.557e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.094e-01", "anc_loss": "1.079e+00", "dlm_acc": "6.276e-01", "anc_acc": "5.726e-01", "epoch": 0.06407} {"step": 32040, "loss": 1.0976, "grad_norm": "4.092e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.248e+00", "dlm_acc": "5.735e-01", "anc_acc": "5.427e-01", "epoch": 0.06408} {"step": 32045, "loss": 0.93, "grad_norm": "4.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.180e-01", "anc_loss": "1.016e+00", "dlm_acc": "6.134e-01", "anc_acc": "5.879e-01", "epoch": 0.06409} {"step": 32050, "loss": 1.2701, "grad_norm": "7.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.398e+00", "anc_loss": "1.520e+00", "dlm_acc": "4.583e-01", "anc_acc": "4.174e-01", "epoch": 0.0641} {"step": 32055, "loss": 1.2562, "grad_norm": "4.109e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.091e+00", "anc_loss": "2.201e+00", "dlm_acc": "2.967e-01", "anc_acc": "2.660e-01", "epoch": 0.06411} {"step": 32060, "loss": 1.5959, "grad_norm": "2.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.545e+00", "anc_loss": "2.623e+00", "dlm_acc": "1.458e-01", "anc_acc": "1.243e-01", "epoch": 0.06412} {"step": 32065, "loss": 1.149, "grad_norm": "3.157e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.205e+00", "dlm_acc": "6.171e-01", "anc_acc": "5.815e-01", "epoch": 0.06413} {"step": 32070, "loss": 1.4522, "grad_norm": "4.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.802e+00", "anc_loss": "1.891e+00", "dlm_acc": "3.858e-01", "anc_acc": "3.624e-01", "epoch": 0.06414} {"step": 32075, "loss": 1.4877, "grad_norm": "4.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.162e+00", "dlm_acc": "5.251e-01", "anc_acc": "4.937e-01", "epoch": 0.06415} {"step": 32080, "loss": 1.0725, "grad_norm": "2.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.191e-01", "anc_loss": "6.586e-01", "dlm_acc": "5.563e-01", "anc_acc": "5.287e-01", "epoch": 0.06416} {"step": 32085, "loss": 1.0547, "grad_norm": "1.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.141e-01", "anc_loss": "7.664e-01", "dlm_acc": "5.337e-01", "anc_acc": "5.126e-01", "epoch": 0.06417} {"step": 32090, "loss": 0.9936, "grad_norm": "3.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.152e+00", "dlm_acc": "5.272e-01", "anc_acc": "5.090e-01", "epoch": 0.06418} {"step": 32095, "loss": 0.9285, "grad_norm": "3.059e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.232e-01", "anc_loss": "1.002e+00", "dlm_acc": "6.560e-01", "anc_acc": "6.372e-01", "epoch": 0.06419} {"step": 32100, "loss": 1.0272, "grad_norm": "6.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.146e-01", "anc_loss": "5.544e-01", "dlm_acc": "8.032e-01", "anc_acc": "7.938e-01", "epoch": 0.0642} {"step": 32105, "loss": 1.113, "grad_norm": "5.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.123e+00", "dlm_acc": "6.268e-01", "anc_acc": "5.980e-01", "epoch": 0.06421} {"step": 32110, "loss": 1.0412, "grad_norm": "4.406e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.256e-01", "anc_loss": "4.593e-01", "dlm_acc": "6.831e-01", "anc_acc": "6.657e-01", "epoch": 0.06422} {"step": 32115, "loss": 1.2818, "grad_norm": "2.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.174e+00", "dlm_acc": "5.848e-01", "anc_acc": "5.594e-01", "epoch": 0.06423} {"step": 32120, "loss": 1.308, "grad_norm": "5.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.424e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.288e-01", "anc_acc": "5.025e-01", "epoch": 0.06424} {"step": 32125, "loss": 1.1724, "grad_norm": "5.581e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.477e-01", "anc_loss": "1.046e+00", "dlm_acc": "6.331e-01", "anc_acc": "6.078e-01", "epoch": 0.06425} {"step": 32130, "loss": 1.3358, "grad_norm": "7.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.331e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.468e-01", "anc_acc": "5.191e-01", "epoch": 0.06426} {"step": 32135, "loss": 1.3365, "grad_norm": "3.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.543e-01", "anc_loss": "9.266e-01", "dlm_acc": "6.072e-01", "anc_acc": "5.780e-01", "epoch": 0.06427} {"step": 32140, "loss": 0.8832, "grad_norm": "5.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.932e-01", "anc_loss": "4.293e-01", "dlm_acc": "7.227e-01", "anc_acc": "6.952e-01", "epoch": 0.06428} {"step": 32145, "loss": 1.0061, "grad_norm": "2.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.527e-01", "anc_loss": "9.156e-01", "dlm_acc": "5.914e-01", "anc_acc": "5.689e-01", "epoch": 0.06429} {"step": 32150, "loss": 1.393, "grad_norm": "5.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.265e+00", "dlm_acc": "6.323e-01", "anc_acc": "6.039e-01", "epoch": 0.0643} {"step": 32155, "loss": 1.5101, "grad_norm": "7.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.270e+00", "dlm_acc": "5.966e-01", "anc_acc": "5.711e-01", "epoch": 0.06431} {"step": 32160, "loss": 1.7073, "grad_norm": "6.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.074e+00", "dlm_acc": "4.515e-01", "anc_acc": "4.379e-01", "epoch": 0.06432} {"step": 32165, "loss": 1.9169, "grad_norm": "5.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.310e+00", "dlm_acc": "5.652e-01", "anc_acc": "5.379e-01", "epoch": 0.06433} {"step": 32170, "loss": 0.779, "grad_norm": "2.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.442e-01", "anc_loss": "7.180e-01", "dlm_acc": "6.955e-01", "anc_acc": "6.721e-01", "epoch": 0.06434} {"step": 32175, "loss": 1.2808, "grad_norm": "4.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.236e+00", "dlm_acc": "6.357e-01", "anc_acc": "6.080e-01", "epoch": 0.06435} {"step": 32180, "loss": 1.315, "grad_norm": "4.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.203e-01", "anc_loss": "7.266e-01", "dlm_acc": "7.124e-01", "anc_acc": "6.740e-01", "epoch": 0.06436} {"step": 32185, "loss": 1.3896, "grad_norm": "4.185e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.130e+00", "dlm_acc": "5.514e-01", "anc_acc": "5.320e-01", "epoch": 0.06437} {"step": 32190, "loss": 0.7413, "grad_norm": "2.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.492e-01", "anc_loss": "1.070e+00", "dlm_acc": "6.390e-01", "anc_acc": "6.081e-01", "epoch": 0.06438} {"step": 32195, "loss": 1.0587, "grad_norm": "3.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.340e+00", "dlm_acc": "4.031e-01", "anc_acc": "3.914e-01", "epoch": 0.06439} {"step": 32200, "loss": 0.8952, "grad_norm": "2.752e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.344e-01", "anc_loss": "7.668e-01", "dlm_acc": "4.573e-01", "anc_acc": "4.484e-01", "epoch": 0.0644} {"step": 32205, "loss": 1.6117, "grad_norm": "8.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.654e-01", "anc_loss": "1.060e+00", "dlm_acc": "6.218e-01", "anc_acc": "5.983e-01", "epoch": 0.06441} {"step": 32210, "loss": 1.2788, "grad_norm": "1.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.006e+00", "anc_loss": "1.105e+00", "dlm_acc": "6.151e-01", "anc_acc": "5.884e-01", "epoch": 0.06442} {"step": 32215, "loss": 1.0874, "grad_norm": "4.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.496e-01", "anc_loss": "9.020e-01", "dlm_acc": "6.408e-01", "anc_acc": "6.247e-01", "epoch": 0.06443} {"step": 32220, "loss": 1.4413, "grad_norm": "3.075e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.838e-01", "anc_acc": "5.653e-01", "epoch": 0.06444} {"step": 32225, "loss": 1.004, "grad_norm": "6.351e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.255e+00", "dlm_acc": "5.724e-01", "anc_acc": "5.469e-01", "epoch": 0.06445} {"step": 32230, "loss": 1.2502, "grad_norm": "2.461e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.019e+00", "anc_loss": "1.109e+00", "dlm_acc": "5.969e-01", "anc_acc": "5.732e-01", "epoch": 0.06446} {"step": 32235, "loss": 1.3593, "grad_norm": "3.325e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.101e+00", "dlm_acc": "6.449e-01", "anc_acc": "6.147e-01", "epoch": 0.06447} {"step": 32240, "loss": 1.4849, "grad_norm": "2.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.794e-01", "anc_acc": "5.580e-01", "epoch": 0.06448} {"step": 32245, "loss": 1.3251, "grad_norm": "1.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.424e+00", "dlm_acc": "5.571e-01", "anc_acc": "5.324e-01", "epoch": 0.06449} {"step": 32250, "loss": 1.2734, "grad_norm": "7.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.173e-01", "anc_acc": "4.919e-01", "epoch": 0.0645} {"step": 32255, "loss": 1.5122, "grad_norm": "3.159e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.370e+00", "anc_loss": "1.506e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.190e-01", "epoch": 0.06451} {"step": 32260, "loss": 1.083, "grad_norm": "3.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.062e-01", "anc_loss": "1.014e+00", "dlm_acc": "6.403e-01", "anc_acc": "6.094e-01", "epoch": 0.06452} {"step": 32265, "loss": 1.6145, "grad_norm": "4.798e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.619e+00", "anc_loss": "1.745e+00", "dlm_acc": "5.297e-01", "anc_acc": "5.031e-01", "epoch": 0.06453} {"step": 32270, "loss": 1.3871, "grad_norm": "2.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.097e+00", "anc_loss": "1.221e+00", "dlm_acc": "6.243e-01", "anc_acc": "5.933e-01", "epoch": 0.06454} {"step": 32275, "loss": 1.6233, "grad_norm": "3.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.897e+00", "anc_loss": "2.025e+00", "dlm_acc": "4.471e-01", "anc_acc": "4.239e-01", "epoch": 0.06455} {"step": 32280, "loss": 1.5292, "grad_norm": "1.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.415e-01", "anc_acc": "5.241e-01", "epoch": 0.06456} {"step": 32285, "loss": 1.8756, "grad_norm": "2.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.861e+00", "anc_loss": "1.981e+00", "dlm_acc": "4.529e-01", "anc_acc": "4.293e-01", "epoch": 0.06457} {"step": 32290, "loss": 1.1271, "grad_norm": "3.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.586e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.259e-01", "anc_acc": "5.971e-01", "epoch": 0.06458} {"step": 32295, "loss": 1.3828, "grad_norm": "3.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.511e+00", "anc_loss": "1.628e+00", "dlm_acc": "5.062e-01", "anc_acc": "4.779e-01", "epoch": 0.06459} {"step": 32300, "loss": 1.273, "grad_norm": "5.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.649e-01", "anc_acc": "5.330e-01", "epoch": 0.0646} {"step": 32305, "loss": 1.1223, "grad_norm": "2.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.081e-01", "anc_loss": "9.905e-01", "dlm_acc": "6.982e-01", "anc_acc": "6.761e-01", "epoch": 0.06461} {"step": 32310, "loss": 1.1272, "grad_norm": "2.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.268e+00", "dlm_acc": "5.781e-01", "anc_acc": "5.480e-01", "epoch": 0.06462} {"step": 32315, "loss": 1.1782, "grad_norm": "4.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.404e+00", "dlm_acc": "5.957e-01", "anc_acc": "5.643e-01", "epoch": 0.06463} {"step": 32320, "loss": 1.1712, "grad_norm": "3.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.518e+00", "dlm_acc": "5.384e-01", "anc_acc": "5.112e-01", "epoch": 0.06464} {"step": 32325, "loss": 1.2924, "grad_norm": "6.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.260e+00", "dlm_acc": "6.276e-01", "anc_acc": "5.952e-01", "epoch": 0.06465} {"step": 32330, "loss": 1.1014, "grad_norm": "3.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.511e+00", "anc_loss": "1.619e+00", "dlm_acc": "4.841e-01", "anc_acc": "4.596e-01", "epoch": 0.06466} {"step": 32335, "loss": 1.0546, "grad_norm": "3.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.575e+00", "dlm_acc": "5.225e-01", "anc_acc": "4.949e-01", "epoch": 0.06467} {"step": 32340, "loss": 1.6016, "grad_norm": "3.382e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.485e+00", "anc_loss": "1.628e+00", "dlm_acc": "5.776e-01", "anc_acc": "5.480e-01", "epoch": 0.06468} {"step": 32345, "loss": 1.2768, "grad_norm": "4.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.665e+00", "dlm_acc": "5.194e-01", "anc_acc": "4.966e-01", "epoch": 0.06469} {"step": 32350, "loss": 1.1118, "grad_norm": "3.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.923e-01", "anc_acc": "5.675e-01", "epoch": 0.0647} {"step": 32355, "loss": 1.0053, "grad_norm": "2.619e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.915e-01", "anc_acc": "5.667e-01", "epoch": 0.06471} {"step": 32360, "loss": 0.9827, "grad_norm": "4.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.369e+00", "dlm_acc": "5.628e-01", "anc_acc": "5.336e-01", "epoch": 0.06472} {"step": 32365, "loss": 0.9949, "grad_norm": "3.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.353e+00", "dlm_acc": "6.020e-01", "anc_acc": "5.772e-01", "epoch": 0.06473} {"step": 32370, "loss": 1.2038, "grad_norm": "3.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.691e+00", "dlm_acc": "5.202e-01", "anc_acc": "4.931e-01", "epoch": 0.06474} {"step": 32375, "loss": 0.8824, "grad_norm": "4.331e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.922e-01", "anc_loss": "9.918e-01", "dlm_acc": "6.667e-01", "anc_acc": "6.316e-01", "epoch": 0.06475} {"step": 32380, "loss": 0.7214, "grad_norm": "2.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.165e+00", "anc_loss": "1.253e+00", "dlm_acc": "5.483e-01", "anc_acc": "5.259e-01", "epoch": 0.06476} {"step": 32385, "loss": 0.8454, "grad_norm": "2.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.013e+00", "anc_loss": "1.084e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.870e-01", "epoch": 0.06477} {"step": 32390, "loss": 1.3466, "grad_norm": "6.349e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.487e+00", "anc_loss": "1.602e+00", "dlm_acc": "4.849e-01", "anc_acc": "4.564e-01", "epoch": 0.06478} {"step": 32395, "loss": 1.7028, "grad_norm": "3.836e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.367e+00", "anc_loss": "1.497e+00", "dlm_acc": "5.483e-01", "anc_acc": "5.200e-01", "epoch": 0.06479} {"step": 32400, "loss": 1.1528, "grad_norm": "3.470e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "1.065e+00", "dlm_acc": "6.708e-01", "anc_acc": "6.237e-01", "epoch": 0.0648} {"step": 32405, "loss": 1.0476, "grad_norm": "4.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.762e-01", "anc_loss": "9.641e-01", "dlm_acc": "6.020e-01", "anc_acc": "5.712e-01", "epoch": 0.06481} {"step": 32410, "loss": 1.1712, "grad_norm": "4.070e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.874e-01", "anc_acc": "5.580e-01", "epoch": 0.06482} {"step": 32415, "loss": 1.1643, "grad_norm": "3.780e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.074e-01", "anc_loss": "9.977e-01", "dlm_acc": "6.618e-01", "anc_acc": "6.401e-01", "epoch": 0.06483} {"step": 32420, "loss": 1.8161, "grad_norm": "4.315e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.800e+00", "dlm_acc": "5.429e-01", "anc_acc": "5.235e-01", "epoch": 0.06484} {"step": 32425, "loss": 1.6171, "grad_norm": "3.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.091e+00", "anc_loss": "2.158e+00", "dlm_acc": "3.234e-01", "anc_acc": "3.119e-01", "epoch": 0.06485} {"step": 32430, "loss": 0.8691, "grad_norm": "3.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.516e-01", "anc_loss": "1.068e+00", "dlm_acc": "6.614e-01", "anc_acc": "6.308e-01", "epoch": 0.06486} {"step": 32435, "loss": 0.9775, "grad_norm": "3.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.039e-01", "anc_loss": "8.281e-01", "dlm_acc": "4.569e-01", "anc_acc": "4.479e-01", "epoch": 0.06487} {"step": 32440, "loss": 0.7652, "grad_norm": "3.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.635e-01", "anc_loss": "5.230e-01", "dlm_acc": "6.836e-01", "anc_acc": "6.475e-01", "epoch": 0.06488} {"step": 32445, "loss": 0.6484, "grad_norm": "2.907e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.636e-01", "anc_loss": "3.086e-01", "dlm_acc": "7.273e-01", "anc_acc": "6.947e-01", "epoch": 0.06489} {"step": 32450, "loss": 0.7909, "grad_norm": "4.525e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.398e-01", "anc_loss": "5.633e-01", "dlm_acc": "5.554e-01", "anc_acc": "5.415e-01", "epoch": 0.0649} {"step": 32455, "loss": 0.9343, "grad_norm": "2.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.150e-01", "anc_loss": "3.809e-01", "dlm_acc": "7.737e-01", "anc_acc": "7.293e-01", "epoch": 0.06491} {"step": 32460, "loss": 1.0312, "grad_norm": "5.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.903e-01", "anc_loss": "4.561e-01", "dlm_acc": "7.426e-01", "anc_acc": "7.012e-01", "epoch": 0.06492} {"step": 32465, "loss": 1.2816, "grad_norm": "5.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.485e+00", "anc_loss": "1.532e+00", "dlm_acc": "4.674e-01", "anc_acc": "4.536e-01", "epoch": 0.06493} {"step": 32470, "loss": 1.2771, "grad_norm": "3.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.084e+00", "dlm_acc": "3.488e-01", "anc_acc": "3.349e-01", "epoch": 0.06494} {"step": 32475, "loss": 1.1292, "grad_norm": "6.114e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.176e+00", "dlm_acc": "5.849e-01", "anc_acc": "5.493e-01", "epoch": 0.06495} {"step": 32480, "loss": 1.3661, "grad_norm": "3.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.811e+00", "anc_loss": "1.970e+00", "dlm_acc": "4.688e-01", "anc_acc": "4.368e-01", "epoch": 0.06496} {"step": 32485, "loss": 0.7938, "grad_norm": "1.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.232e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.510e-01", "anc_acc": "5.198e-01", "epoch": 0.06497} {"step": 32490, "loss": 0.6323, "grad_norm": "1.912e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.758e-01", "anc_loss": "1.153e+00", "dlm_acc": "6.317e-01", "anc_acc": "5.790e-01", "epoch": 0.06498} {"step": 32495, "loss": 1.0283, "grad_norm": "3.478e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.793e-01", "anc_loss": "1.061e+00", "dlm_acc": "6.139e-01", "anc_acc": "5.883e-01", "epoch": 0.06499} {"step": 32500, "loss": 1.0474, "grad_norm": "3.759e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.268e+00", "dlm_acc": "6.030e-01", "anc_acc": "5.697e-01", "epoch": 0.065} {"step": 32505, "loss": 1.3325, "grad_norm": "2.370e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.353e+00", "dlm_acc": "5.732e-01", "anc_acc": "5.432e-01", "epoch": 0.06501} {"step": 32510, "loss": 1.2156, "grad_norm": "4.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.567e+00", "anc_loss": "1.697e+00", "dlm_acc": "4.987e-01", "anc_acc": "4.677e-01", "epoch": 0.06502} {"step": 32515, "loss": 1.1678, "grad_norm": "4.088e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.977e-01", "anc_loss": "1.104e+00", "dlm_acc": "6.340e-01", "anc_acc": "6.068e-01", "epoch": 0.06503} {"step": 32520, "loss": 0.7129, "grad_norm": "5.186e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.469e-01", "anc_loss": "1.046e+00", "dlm_acc": "5.630e-01", "anc_acc": "5.342e-01", "epoch": 0.06504} {"step": 32525, "loss": 1.0104, "grad_norm": "2.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.606e+00", "dlm_acc": "4.208e-01", "anc_acc": "3.979e-01", "epoch": 0.06505} {"step": 32530, "loss": 1.3065, "grad_norm": "6.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.858e+00", "anc_loss": "1.964e+00", "dlm_acc": "4.104e-01", "anc_acc": "3.870e-01", "epoch": 0.06506} {"step": 32535, "loss": 1.1666, "grad_norm": "2.395e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.163e+00", "anc_loss": "1.293e+00", "dlm_acc": "5.876e-01", "anc_acc": "5.486e-01", "epoch": 0.06507} {"step": 32540, "loss": 1.0911, "grad_norm": "2.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.509e+00", "dlm_acc": "4.979e-01", "anc_acc": "4.718e-01", "epoch": 0.06508} {"step": 32545, "loss": 1.2225, "grad_norm": "2.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.505e-01", "anc_acc": "5.171e-01", "epoch": 0.06509} {"step": 32550, "loss": 0.8251, "grad_norm": "1.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.087e-01", "anc_loss": "1.002e+00", "dlm_acc": "6.428e-01", "anc_acc": "6.185e-01", "epoch": 0.0651} {"step": 32555, "loss": 1.1477, "grad_norm": "2.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.648e-01", "anc_acc": "5.370e-01", "epoch": 0.06511} {"step": 32560, "loss": 1.1923, "grad_norm": "6.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.977e-01", "anc_loss": "1.134e+00", "dlm_acc": "6.299e-01", "anc_acc": "5.904e-01", "epoch": 0.06512} {"step": 32565, "loss": 1.2324, "grad_norm": "1.002e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.363e+00", "dlm_acc": "4.799e-01", "anc_acc": "4.527e-01", "epoch": 0.06513} {"step": 32570, "loss": 1.0117, "grad_norm": "1.874e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.891e-01", "anc_acc": "5.659e-01", "epoch": 0.06514} {"step": 32575, "loss": 0.9775, "grad_norm": "2.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.191e-01", "anc_loss": "1.034e+00", "dlm_acc": "6.778e-01", "anc_acc": "6.451e-01", "epoch": 0.06515} {"step": 32580, "loss": 1.1035, "grad_norm": "8.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.735e+00", "dlm_acc": "4.909e-01", "anc_acc": "4.640e-01", "epoch": 0.06516} {"step": 32585, "loss": 0.8157, "grad_norm": "2.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.742e-01", "anc_acc": "5.499e-01", "epoch": 0.06517} {"step": 32590, "loss": 0.9104, "grad_norm": "3.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.156e+00", "dlm_acc": "6.179e-01", "anc_acc": "5.876e-01", "epoch": 0.06518} {"step": 32595, "loss": 0.7711, "grad_norm": "1.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.596e-01", "anc_acc": "5.325e-01", "epoch": 0.06519} {"step": 32600, "loss": 0.7797, "grad_norm": "1.648e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.317e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.785e-01", "anc_acc": "5.511e-01", "epoch": 0.0652} {"step": 32605, "loss": 0.5074, "grad_norm": "1.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.848e-01", "anc_loss": "9.781e-01", "dlm_acc": "6.477e-01", "anc_acc": "6.196e-01", "epoch": 0.06521} {"step": 32610, "loss": 0.9787, "grad_norm": "2.572e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.311e+00", "dlm_acc": "5.911e-01", "anc_acc": "5.604e-01", "epoch": 0.06522} {"step": 32615, "loss": 0.9736, "grad_norm": "2.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.198e+00", "dlm_acc": "5.824e-01", "anc_acc": "5.561e-01", "epoch": 0.06523} {"step": 32620, "loss": 1.1416, "grad_norm": "3.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.392e-01", "epoch": 0.06524} {"step": 32625, "loss": 1.1721, "grad_norm": "4.283e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.397e+00", "anc_loss": "1.534e+00", "dlm_acc": "5.562e-01", "anc_acc": "5.277e-01", "epoch": 0.06525} {"step": 32630, "loss": 1.0209, "grad_norm": "4.228e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.830e-01", "anc_loss": "1.077e+00", "dlm_acc": "6.456e-01", "anc_acc": "6.189e-01", "epoch": 0.06526} {"step": 32635, "loss": 1.0364, "grad_norm": "4.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.382e+00", "dlm_acc": "5.571e-01", "anc_acc": "5.286e-01", "epoch": 0.06527} {"step": 32640, "loss": 1.4468, "grad_norm": "4.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.250e+00", "anc_loss": "2.373e+00", "dlm_acc": "3.251e-01", "anc_acc": "3.060e-01", "epoch": 0.06528} {"step": 32645, "loss": 1.1175, "grad_norm": "3.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.758e-01", "anc_loss": "1.089e+00", "dlm_acc": "5.726e-01", "anc_acc": "5.379e-01", "epoch": 0.06529} {"step": 32650, "loss": 1.0267, "grad_norm": "5.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.253e-01", "anc_loss": "1.012e+00", "dlm_acc": "6.702e-01", "anc_acc": "6.477e-01", "epoch": 0.0653} {"step": 32655, "loss": 1.1882, "grad_norm": "8.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.298e+00", "dlm_acc": "6.033e-01", "anc_acc": "5.530e-01", "epoch": 0.06531} {"step": 32660, "loss": 1.1349, "grad_norm": "6.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.515e+00", "dlm_acc": "5.459e-01", "anc_acc": "5.245e-01", "epoch": 0.06532} {"step": 32665, "loss": 1.0066, "grad_norm": "2.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.199e-01", "anc_loss": "9.508e-01", "dlm_acc": "6.115e-01", "anc_acc": "5.541e-01", "epoch": 0.06533} {"step": 32670, "loss": 1.4581, "grad_norm": "3.911e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.445e+00", "dlm_acc": "4.961e-01", "anc_acc": "4.631e-01", "epoch": 0.06534} {"step": 32675, "loss": 1.4031, "grad_norm": "3.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.641e-01", "anc_loss": "1.014e+00", "dlm_acc": "4.097e-01", "anc_acc": "3.842e-01", "epoch": 0.06535} {"step": 32680, "loss": 1.0359, "grad_norm": "3.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.241e+00", "dlm_acc": "5.660e-01", "anc_acc": "5.348e-01", "epoch": 0.06536} {"step": 32685, "loss": 1.4933, "grad_norm": "4.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.383e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.286e-01", "anc_acc": "4.944e-01", "epoch": 0.06537} {"step": 32690, "loss": 1.632, "grad_norm": "4.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.411e+00", "anc_loss": "2.466e+00", "dlm_acc": "2.703e-01", "anc_acc": "2.568e-01", "epoch": 0.06538} {"step": 32695, "loss": 1.0553, "grad_norm": "2.006e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.440e+00", "dlm_acc": "5.113e-01", "anc_acc": "4.713e-01", "epoch": 0.06539} {"step": 32700, "loss": 1.1191, "grad_norm": "4.408e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.354e+00", "dlm_acc": "5.858e-01", "anc_acc": "5.517e-01", "epoch": 0.0654} {"step": 32705, "loss": 1.2541, "grad_norm": "8.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.534e+00", "anc_loss": "1.717e+00", "dlm_acc": "4.994e-01", "anc_acc": "4.693e-01", "epoch": 0.06541} {"step": 32710, "loss": 1.1568, "grad_norm": "2.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.610e+00", "anc_loss": "1.755e+00", "dlm_acc": "4.548e-01", "anc_acc": "4.218e-01", "epoch": 0.06542} {"step": 32715, "loss": 1.0467, "grad_norm": "2.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.727e-01", "anc_loss": "1.102e+00", "dlm_acc": "6.649e-01", "anc_acc": "6.280e-01", "epoch": 0.06543} {"step": 32720, "loss": 0.9662, "grad_norm": "5.587e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.410e+00", "dlm_acc": "5.154e-01", "anc_acc": "4.807e-01", "epoch": 0.06544} {"step": 32725, "loss": 1.7562, "grad_norm": "6.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.194e+00", "anc_loss": "2.384e+00", "dlm_acc": "2.757e-01", "anc_acc": "2.373e-01", "epoch": 0.06545} {"step": 32730, "loss": 0.9635, "grad_norm": "3.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.431e+00", "anc_loss": "1.631e+00", "dlm_acc": "4.551e-01", "anc_acc": "4.057e-01", "epoch": 0.06546} {"step": 32735, "loss": 0.9395, "grad_norm": "2.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.633e-01", "anc_acc": "5.289e-01", "epoch": 0.06547} {"step": 32740, "loss": 1.0552, "grad_norm": "3.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.137e+00", "dlm_acc": "5.579e-01", "anc_acc": "5.308e-01", "epoch": 0.06548} {"step": 32745, "loss": 1.3072, "grad_norm": "2.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.569e+00", "anc_loss": "1.689e+00", "dlm_acc": "4.787e-01", "anc_acc": "4.538e-01", "epoch": 0.06549} {"step": 32750, "loss": 1.3649, "grad_norm": "2.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.176e+00", "anc_loss": "1.332e+00", "dlm_acc": "5.984e-01", "anc_acc": "5.562e-01", "epoch": 0.0655} {"step": 32755, "loss": 1.4144, "grad_norm": "8.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.454e+00", "anc_loss": "1.618e+00", "dlm_acc": "5.202e-01", "anc_acc": "4.833e-01", "epoch": 0.06551} {"step": 32760, "loss": 1.1709, "grad_norm": "3.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.111e+00", "anc_loss": "1.181e+00", "dlm_acc": "6.759e-01", "anc_acc": "6.631e-01", "epoch": 0.06552} {"step": 32765, "loss": 1.1108, "grad_norm": "2.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.799e-01", "anc_loss": "7.509e-01", "dlm_acc": "7.567e-01", "anc_acc": "7.399e-01", "epoch": 0.06553} {"step": 32770, "loss": 0.8555, "grad_norm": "1.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.102e-01", "anc_loss": "8.242e-01", "dlm_acc": "7.036e-01", "anc_acc": "6.657e-01", "epoch": 0.06554} {"step": 32775, "loss": 1.0375, "grad_norm": "2.450e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.577e+00", "dlm_acc": "4.847e-01", "anc_acc": "4.618e-01", "epoch": 0.06555} {"step": 32780, "loss": 0.9748, "grad_norm": "3.719e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.125e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.958e-01", "anc_acc": "5.694e-01", "epoch": 0.06556} {"step": 32785, "loss": 1.5316, "grad_norm": "4.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.703e+00", "anc_loss": "1.837e+00", "dlm_acc": "4.844e-01", "anc_acc": "4.562e-01", "epoch": 0.06557} {"step": 32790, "loss": 0.9734, "grad_norm": "2.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.992e-01", "anc_loss": "1.110e+00", "dlm_acc": "6.354e-01", "anc_acc": "6.080e-01", "epoch": 0.06558} {"step": 32795, "loss": 1.5272, "grad_norm": "6.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.959e+00", "anc_loss": "2.083e+00", "dlm_acc": "4.337e-01", "anc_acc": "4.050e-01", "epoch": 0.06559} {"step": 32800, "loss": 0.8494, "grad_norm": "2.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.414e-01", "anc_loss": "1.039e+00", "dlm_acc": "6.099e-01", "anc_acc": "5.799e-01", "epoch": 0.0656} {"step": 32805, "loss": 1.4197, "grad_norm": "4.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.864e+00", "anc_loss": "1.966e+00", "dlm_acc": "4.109e-01", "anc_acc": "3.886e-01", "epoch": 0.06561} {"step": 32810, "loss": 0.9868, "grad_norm": "3.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.805e-01", "anc_loss": "1.142e+00", "dlm_acc": "5.963e-01", "anc_acc": "5.458e-01", "epoch": 0.06562} {"step": 32815, "loss": 1.3884, "grad_norm": "3.527e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.369e+00", "anc_loss": "1.543e+00", "dlm_acc": "5.310e-01", "anc_acc": "4.849e-01", "epoch": 0.06563} {"step": 32820, "loss": 1.0756, "grad_norm": "3.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.422e+00", "dlm_acc": "4.969e-01", "anc_acc": "4.680e-01", "epoch": 0.06564} {"step": 32825, "loss": 1.153, "grad_norm": "4.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.346e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.526e-01", "anc_acc": "5.300e-01", "epoch": 0.06565} {"step": 32830, "loss": 1.5354, "grad_norm": "3.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.904e+00", "anc_loss": "1.997e+00", "dlm_acc": "3.932e-01", "anc_acc": "3.745e-01", "epoch": 0.06566} {"step": 32835, "loss": 1.5894, "grad_norm": "3.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.825e+00", "anc_loss": "1.941e+00", "dlm_acc": "4.819e-01", "anc_acc": "4.584e-01", "epoch": 0.06567} {"step": 32840, "loss": 0.7956, "grad_norm": "3.230e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.892e-01", "anc_loss": "7.879e-01", "dlm_acc": "7.305e-01", "anc_acc": "7.012e-01", "epoch": 0.06568} {"step": 32845, "loss": 1.4494, "grad_norm": "4.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.451e+00", "dlm_acc": "5.719e-01", "anc_acc": "5.458e-01", "epoch": 0.06569} {"step": 32850, "loss": 1.1754, "grad_norm": "4.971e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.236e+00", "dlm_acc": "5.980e-01", "anc_acc": "5.697e-01", "epoch": 0.0657} {"step": 32855, "loss": 1.3943, "grad_norm": "3.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.583e+00", "dlm_acc": "5.311e-01", "anc_acc": "5.074e-01", "epoch": 0.06571} {"step": 32860, "loss": 1.2735, "grad_norm": "2.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.648e+00", "dlm_acc": "4.982e-01", "anc_acc": "4.739e-01", "epoch": 0.06572} {"step": 32865, "loss": 1.1466, "grad_norm": "3.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.836e-01", "anc_loss": "1.109e+00", "dlm_acc": "6.194e-01", "anc_acc": "5.857e-01", "epoch": 0.06573} {"step": 32870, "loss": 1.6431, "grad_norm": "2.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.484e-01", "anc_loss": "9.125e-01", "dlm_acc": "7.354e-01", "anc_acc": "6.925e-01", "epoch": 0.06574} {"step": 32875, "loss": 1.7526, "grad_norm": "3.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.494e+00", "anc_loss": "1.628e+00", "dlm_acc": "5.610e-01", "anc_acc": "5.359e-01", "epoch": 0.06575} {"step": 32880, "loss": 1.7226, "grad_norm": "3.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.528e-01", "anc_acc": "5.263e-01", "epoch": 0.06576} {"step": 32885, "loss": 0.93, "grad_norm": "2.158e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.209e+00", "dlm_acc": "5.736e-01", "anc_acc": "5.459e-01", "epoch": 0.06577} {"step": 32890, "loss": 1.352, "grad_norm": "4.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.364e+00", "anc_loss": "1.506e+00", "dlm_acc": "5.650e-01", "anc_acc": "5.335e-01", "epoch": 0.06578} {"step": 32895, "loss": 1.4354, "grad_norm": "3.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.726e+00", "anc_loss": "1.831e+00", "dlm_acc": "4.515e-01", "anc_acc": "4.291e-01", "epoch": 0.06579} {"step": 32900, "loss": 1.451, "grad_norm": "3.411e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.628e-01", "anc_acc": "5.381e-01", "epoch": 0.0658} {"step": 32905, "loss": 1.3619, "grad_norm": "3.067e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.148e-01", "anc_loss": "9.992e-01", "dlm_acc": "6.121e-01", "anc_acc": "5.879e-01", "epoch": 0.06581} {"step": 32910, "loss": 1.565, "grad_norm": "2.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.283e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.516e-01", "anc_acc": "5.280e-01", "epoch": 0.06582} {"step": 32915, "loss": 1.2788, "grad_norm": "2.524e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.070e-01", "anc_loss": "6.328e-01", "dlm_acc": "6.390e-01", "anc_acc": "6.291e-01", "epoch": 0.06583} {"step": 32920, "loss": 1.1926, "grad_norm": "4.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.320e-01", "anc_loss": "5.555e-01", "dlm_acc": "6.590e-01", "anc_acc": "6.472e-01", "epoch": 0.06584} {"step": 32925, "loss": 1.2891, "grad_norm": "4.552e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.586e-01", "anc_loss": "1.034e+00", "dlm_acc": "6.030e-01", "anc_acc": "5.817e-01", "epoch": 0.06585} {"step": 32930, "loss": 1.3834, "grad_norm": "3.617e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.945e-01", "anc_loss": "1.093e+00", "dlm_acc": "5.884e-01", "anc_acc": "5.648e-01", "epoch": 0.06586} {"step": 32935, "loss": 1.3295, "grad_norm": "3.456e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.570e-01", "anc_loss": "8.055e-01", "dlm_acc": "6.074e-01", "anc_acc": "5.895e-01", "epoch": 0.06587} {"step": 32940, "loss": 1.0946, "grad_norm": "3.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.582e-01", "anc_loss": "9.246e-01", "dlm_acc": "6.026e-01", "anc_acc": "5.829e-01", "epoch": 0.06588} {"step": 32945, "loss": 1.3903, "grad_norm": "5.411e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.469e-01", "anc_loss": "9.570e-01", "dlm_acc": "3.062e-01", "anc_acc": "3.015e-01", "epoch": 0.06589} {"step": 32950, "loss": 1.6368, "grad_norm": "4.432e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.025e+00", "dlm_acc": "3.111e-01", "anc_acc": "3.091e-01", "epoch": 0.0659} {"step": 32955, "loss": 1.3401, "grad_norm": "4.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.812e-01", "anc_loss": "9.914e-01", "dlm_acc": "3.097e-01", "anc_acc": "3.077e-01", "epoch": 0.06591} {"step": 32960, "loss": 1.3834, "grad_norm": "2.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.246e+00", "dlm_acc": "4.356e-01", "anc_acc": "4.215e-01", "epoch": 0.06592} {"step": 32965, "loss": 1.012, "grad_norm": "4.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.477e-01", "anc_loss": "1.020e+00", "dlm_acc": "5.866e-01", "anc_acc": "5.683e-01", "epoch": 0.06593} {"step": 32970, "loss": 0.9963, "grad_norm": "2.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.645e-01", "anc_loss": "7.230e-01", "dlm_acc": "6.463e-01", "anc_acc": "6.233e-01", "epoch": 0.06594} {"step": 32975, "loss": 1.0442, "grad_norm": "3.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.197e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.547e-01", "anc_acc": "5.297e-01", "epoch": 0.06595} {"step": 32980, "loss": 1.17, "grad_norm": "3.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.664e-01", "anc_loss": "9.297e-01", "dlm_acc": "5.590e-01", "anc_acc": "5.368e-01", "epoch": 0.06596} {"step": 32985, "loss": 1.1482, "grad_norm": "4.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.900e-01", "anc_loss": "1.073e+00", "dlm_acc": "6.421e-01", "anc_acc": "6.214e-01", "epoch": 0.06597} {"step": 32990, "loss": 1.2056, "grad_norm": "3.406e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.288e+00", "dlm_acc": "4.994e-01", "anc_acc": "4.812e-01", "epoch": 0.06598} {"step": 32995, "loss": 1.599, "grad_norm": "5.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.031e-01", "anc_loss": "1.005e+00", "dlm_acc": "6.061e-01", "anc_acc": "5.756e-01", "epoch": 0.06599} {"step": 33000, "loss": 1.2329, "grad_norm": "3.389e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.321e+00", "anc_loss": "1.410e+00", "dlm_acc": "5.454e-01", "anc_acc": "5.242e-01", "epoch": 0.066} {"step": 33005, "loss": 1.262, "grad_norm": "3.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.133e-01", "anc_loss": "1.010e+00", "dlm_acc": "6.405e-01", "anc_acc": "6.168e-01", "epoch": 0.06601} {"step": 33010, "loss": 1.4717, "grad_norm": "5.010e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.305e-01", "anc_loss": "9.563e-01", "dlm_acc": "6.710e-01", "anc_acc": "6.320e-01", "epoch": 0.06602} {"step": 33015, "loss": 1.1339, "grad_norm": "3.526e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.549e-01", "anc_loss": "9.012e-01", "dlm_acc": "5.964e-01", "anc_acc": "5.772e-01", "epoch": 0.06603} {"step": 33020, "loss": 1.1941, "grad_norm": "3.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.836e-01", "anc_loss": "9.711e-01", "dlm_acc": "6.545e-01", "anc_acc": "6.307e-01", "epoch": 0.06604} {"step": 33025, "loss": 1.4347, "grad_norm": "6.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.492e-01", "anc_acc": "5.284e-01", "epoch": 0.06605} {"step": 33030, "loss": 0.9839, "grad_norm": "2.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.500e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.234e-01", "anc_acc": "5.995e-01", "epoch": 0.06606} {"step": 33035, "loss": 1.0017, "grad_norm": "2.803e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.695e-01", "anc_loss": "5.949e-01", "dlm_acc": "5.399e-01", "anc_acc": "5.234e-01", "epoch": 0.06607} {"step": 33040, "loss": 1.5279, "grad_norm": "5.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.970e-01", "anc_acc": "5.681e-01", "epoch": 0.06608} {"step": 33045, "loss": 0.984, "grad_norm": "3.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.934e-01", "anc_loss": "7.445e-01", "dlm_acc": "5.852e-01", "anc_acc": "5.646e-01", "epoch": 0.06609} {"step": 33050, "loss": 1.0701, "grad_norm": "3.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.277e-01", "anc_loss": "7.824e-01", "dlm_acc": "5.817e-01", "anc_acc": "5.620e-01", "epoch": 0.0661} {"step": 33055, "loss": 1.2227, "grad_norm": "4.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.398e-01", "anc_loss": "9.156e-01", "dlm_acc": "6.300e-01", "anc_acc": "6.070e-01", "epoch": 0.06611} {"step": 33060, "loss": 1.542, "grad_norm": "4.116e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.285e+00", "dlm_acc": "5.101e-01", "anc_acc": "4.788e-01", "epoch": 0.06612} {"step": 33065, "loss": 1.3078, "grad_norm": "3.036e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.239e+00", "dlm_acc": "5.966e-01", "anc_acc": "5.711e-01", "epoch": 0.06613} {"step": 33070, "loss": 1.0432, "grad_norm": "5.010e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.108e-01", "anc_loss": "2.477e-01", "dlm_acc": "9.028e-01", "anc_acc": "8.857e-01", "epoch": 0.06614} {"step": 33075, "loss": 1.3216, "grad_norm": "5.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.075e-01", "anc_loss": "2.537e-01", "dlm_acc": "9.097e-01", "anc_acc": "8.866e-01", "epoch": 0.06615} {"step": 33080, "loss": 1.6947, "grad_norm": "3.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.129e+00", "dlm_acc": "6.270e-01", "anc_acc": "5.952e-01", "epoch": 0.06616} {"step": 33085, "loss": 1.2423, "grad_norm": "2.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.091e-01", "anc_loss": "9.812e-01", "dlm_acc": "7.157e-01", "anc_acc": "7.007e-01", "epoch": 0.06617} {"step": 33090, "loss": 1.2597, "grad_norm": "1.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.732e-01", "anc_acc": "5.470e-01", "epoch": 0.06618} {"step": 33095, "loss": 1.614, "grad_norm": "4.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.540e+00", "anc_loss": "1.648e+00", "dlm_acc": "5.134e-01", "anc_acc": "4.880e-01", "epoch": 0.06619} {"step": 33100, "loss": 1.6489, "grad_norm": "4.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.927e+00", "anc_loss": "2.039e+00", "dlm_acc": "4.428e-01", "anc_acc": "4.208e-01", "epoch": 0.0662} {"step": 33105, "loss": 1.0181, "grad_norm": "3.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.698e-01", "anc_acc": "5.400e-01", "epoch": 0.06621} {"step": 33110, "loss": 1.8054, "grad_norm": "3.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.970e+00", "anc_loss": "2.092e+00", "dlm_acc": "4.601e-01", "anc_acc": "4.369e-01", "epoch": 0.06622} {"step": 33115, "loss": 0.92, "grad_norm": "2.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.605e-01", "anc_loss": "9.656e-01", "dlm_acc": "6.333e-01", "anc_acc": "6.027e-01", "epoch": 0.06623} {"step": 33120, "loss": 1.331, "grad_norm": "2.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.292e+00", "dlm_acc": "5.849e-01", "anc_acc": "5.590e-01", "epoch": 0.06624} {"step": 33125, "loss": 1.3948, "grad_norm": "4.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.786e+00", "anc_loss": "1.857e+00", "dlm_acc": "3.677e-01", "anc_acc": "3.533e-01", "epoch": 0.06625} {"step": 33130, "loss": 1.2246, "grad_norm": "2.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.028e+00", "anc_loss": "1.137e+00", "dlm_acc": "6.147e-01", "anc_acc": "5.859e-01", "epoch": 0.06626} {"step": 33135, "loss": 1.5151, "grad_norm": "5.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.478e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.086e-01", "anc_acc": "4.862e-01", "epoch": 0.06627} {"step": 33140, "loss": 1.0561, "grad_norm": "3.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.076e+00", "anc_loss": "1.172e+00", "dlm_acc": "6.103e-01", "anc_acc": "5.867e-01", "epoch": 0.06628} {"step": 33145, "loss": 1.1908, "grad_norm": "4.905e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.517e-01", "anc_acc": "5.258e-01", "epoch": 0.06629} {"step": 33150, "loss": 1.2684, "grad_norm": "1.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.446e+00", "dlm_acc": "5.617e-01", "anc_acc": "5.350e-01", "epoch": 0.0663} {"step": 33155, "loss": 1.2565, "grad_norm": "2.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.740e-01", "anc_acc": "5.493e-01", "epoch": 0.06631} {"step": 33160, "loss": 1.2898, "grad_norm": "6.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.789e-01", "anc_acc": "5.536e-01", "epoch": 0.06632} {"step": 33165, "loss": 1.6257, "grad_norm": "5.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.622e+00", "anc_loss": "1.752e+00", "dlm_acc": "5.289e-01", "anc_acc": "5.042e-01", "epoch": 0.06633} {"step": 33170, "loss": 1.2782, "grad_norm": "2.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.979e-01", "anc_loss": "8.852e-01", "dlm_acc": "6.755e-01", "anc_acc": "6.439e-01", "epoch": 0.06634} {"step": 33175, "loss": 1.2923, "grad_norm": "6.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.248e+00", "dlm_acc": "6.038e-01", "anc_acc": "5.658e-01", "epoch": 0.06635} {"step": 33180, "loss": 1.1583, "grad_norm": "3.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.356e+00", "dlm_acc": "5.446e-01", "anc_acc": "5.059e-01", "epoch": 0.06636} {"step": 33185, "loss": 0.8001, "grad_norm": "4.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.719e-01", "anc_loss": "7.578e-01", "dlm_acc": "6.852e-01", "anc_acc": "6.505e-01", "epoch": 0.06637} {"step": 33190, "loss": 1.2171, "grad_norm": "5.174e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.131e+00", "dlm_acc": "6.321e-01", "anc_acc": "5.989e-01", "epoch": 0.06638} {"step": 33195, "loss": 1.1768, "grad_norm": "3.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.167e+00", "anc_loss": "1.268e+00", "dlm_acc": "5.635e-01", "anc_acc": "5.393e-01", "epoch": 0.06639} {"step": 33200, "loss": 1.5332, "grad_norm": "2.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.750e-01", "anc_loss": "1.083e+00", "dlm_acc": "6.620e-01", "anc_acc": "6.326e-01", "epoch": 0.0664} {"step": 33205, "loss": 0.9305, "grad_norm": "3.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.547e-01", "anc_loss": "7.703e-01", "dlm_acc": "7.133e-01", "anc_acc": "6.729e-01", "epoch": 0.06641} {"step": 33210, "loss": 1.2514, "grad_norm": "3.341e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.456e+00", "anc_loss": "1.503e+00", "dlm_acc": "4.372e-01", "anc_acc": "4.268e-01", "epoch": 0.06642} {"step": 33215, "loss": 1.2001, "grad_norm": "2.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.797e-01", "anc_loss": "1.075e+00", "dlm_acc": "5.659e-01", "anc_acc": "5.350e-01", "epoch": 0.06643} {"step": 33220, "loss": 1.0992, "grad_norm": "2.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.015e+00", "anc_loss": "1.131e+00", "dlm_acc": "6.040e-01", "anc_acc": "5.663e-01", "epoch": 0.06644} {"step": 33225, "loss": 1.5322, "grad_norm": "3.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.666e+00", "dlm_acc": "5.313e-01", "anc_acc": "4.894e-01", "epoch": 0.06645} {"step": 33230, "loss": 1.7136, "grad_norm": "8.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.231e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.982e-01", "anc_acc": "5.667e-01", "epoch": 0.06646} {"step": 33235, "loss": 1.002, "grad_norm": "2.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.297e-01", "anc_acc": "5.016e-01", "epoch": 0.06647} {"step": 33240, "loss": 1.3788, "grad_norm": "2.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.260e+00", "anc_loss": "1.356e+00", "dlm_acc": "5.031e-01", "anc_acc": "4.742e-01", "epoch": 0.06648} {"step": 33245, "loss": 1.6521, "grad_norm": "5.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.540e-01", "anc_acc": "5.150e-01", "epoch": 0.06649} {"step": 33250, "loss": 1.566, "grad_norm": "6.048e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.756e+00", "anc_loss": "1.909e+00", "dlm_acc": "4.484e-01", "anc_acc": "4.111e-01", "epoch": 0.0665} {"step": 33255, "loss": 1.2197, "grad_norm": "2.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.328e+00", "dlm_acc": "5.696e-01", "anc_acc": "5.451e-01", "epoch": 0.06651} {"step": 33260, "loss": 1.4442, "grad_norm": "4.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.734e-01", "anc_loss": "1.200e+00", "dlm_acc": "6.254e-01", "anc_acc": "5.504e-01", "epoch": 0.06652} {"step": 33265, "loss": 0.988, "grad_norm": "2.804e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.441e-01", "anc_loss": "9.082e-01", "dlm_acc": "6.712e-01", "anc_acc": "6.070e-01", "epoch": 0.06653} {"step": 33270, "loss": 1.5437, "grad_norm": "3.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.528e+00", "anc_loss": "1.687e+00", "dlm_acc": "5.174e-01", "anc_acc": "4.752e-01", "epoch": 0.06654} {"step": 33275, "loss": 1.0266, "grad_norm": "3.089e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.766e-01", "anc_loss": "9.023e-01", "dlm_acc": "6.064e-01", "anc_acc": "5.645e-01", "epoch": 0.06655} {"step": 33280, "loss": 1.4926, "grad_norm": "5.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.827e+00", "anc_loss": "1.936e+00", "dlm_acc": "3.437e-01", "anc_acc": "3.197e-01", "epoch": 0.06656} {"step": 33285, "loss": 1.3249, "grad_norm": "3.883e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.523e+00", "anc_loss": "1.714e+00", "dlm_acc": "3.914e-01", "anc_acc": "3.475e-01", "epoch": 0.06657} {"step": 33290, "loss": 1.4773, "grad_norm": "8.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.506e+00", "anc_loss": "1.688e+00", "dlm_acc": "4.073e-01", "anc_acc": "3.616e-01", "epoch": 0.06658} {"step": 33295, "loss": 1.3098, "grad_norm": "5.696e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.534e+00", "anc_loss": "1.694e+00", "dlm_acc": "3.671e-01", "anc_acc": "3.258e-01", "epoch": 0.06659} {"step": 33300, "loss": 1.612, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.682e+00", "anc_loss": "1.802e+00", "dlm_acc": "4.555e-01", "anc_acc": "4.305e-01", "epoch": 0.0666} {"step": 33305, "loss": 1.3592, "grad_norm": "8.676e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.172e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.788e-01", "anc_acc": "5.514e-01", "epoch": 0.06661} {"step": 33310, "loss": 1.3638, "grad_norm": "8.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.225e+00", "dlm_acc": "6.177e-01", "anc_acc": "5.942e-01", "epoch": 0.06662} {"step": 33315, "loss": 1.075, "grad_norm": "2.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.591e-01", "anc_acc": "5.312e-01", "epoch": 0.06663} {"step": 33320, "loss": 0.9616, "grad_norm": "4.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.195e-01", "anc_loss": "1.014e+00", "dlm_acc": "6.306e-01", "anc_acc": "6.038e-01", "epoch": 0.06664} {"step": 33325, "loss": 1.267, "grad_norm": "3.778e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.436e+00", "dlm_acc": "5.724e-01", "anc_acc": "5.324e-01", "epoch": 0.06665} {"step": 33330, "loss": 1.3583, "grad_norm": "7.320e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.235e+00", "anc_loss": "1.317e+00", "dlm_acc": "5.117e-01", "anc_acc": "4.902e-01", "epoch": 0.06666} {"step": 33335, "loss": 1.0271, "grad_norm": "2.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.289e-01", "anc_loss": "8.625e-01", "dlm_acc": "3.584e-01", "anc_acc": "3.458e-01", "epoch": 0.06667} {"step": 33340, "loss": 1.266, "grad_norm": "4.794e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.502e-01", "anc_acc": "5.264e-01", "epoch": 0.06668} {"step": 33345, "loss": 1.2128, "grad_norm": "5.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.346e+00", "dlm_acc": "4.661e-01", "anc_acc": "4.437e-01", "epoch": 0.06669} {"step": 33350, "loss": 1.0311, "grad_norm": "3.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.566e-01", "anc_loss": "8.562e-01", "dlm_acc": "6.527e-01", "anc_acc": "6.174e-01", "epoch": 0.0667} {"step": 33355, "loss": 1.1081, "grad_norm": "2.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.555e-01", "anc_loss": "1.062e+00", "dlm_acc": "6.514e-01", "anc_acc": "6.189e-01", "epoch": 0.06671} {"step": 33360, "loss": 1.202, "grad_norm": "1.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.131e+00", "dlm_acc": "5.580e-01", "anc_acc": "5.281e-01", "epoch": 0.06672} {"step": 33365, "loss": 1.4838, "grad_norm": "3.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.791e+00", "anc_loss": "1.887e+00", "dlm_acc": "4.480e-01", "anc_acc": "4.243e-01", "epoch": 0.06673} {"step": 33370, "loss": 1.3166, "grad_norm": "3.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.545e-01", "anc_acc": "5.137e-01", "epoch": 0.06674} {"step": 33375, "loss": 1.6732, "grad_norm": "4.748e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.482e+00", "anc_loss": "1.627e+00", "dlm_acc": "5.286e-01", "anc_acc": "4.972e-01", "epoch": 0.06675} {"step": 33380, "loss": 1.159, "grad_norm": "2.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.074e-01", "anc_loss": "7.609e-01", "dlm_acc": "6.443e-01", "anc_acc": "6.287e-01", "epoch": 0.06676} {"step": 33385, "loss": 1.4025, "grad_norm": "8.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.668e-01", "anc_loss": "8.289e-01", "dlm_acc": "6.321e-01", "anc_acc": "6.097e-01", "epoch": 0.06677} {"step": 33390, "loss": 1.1629, "grad_norm": "3.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.688e-01", "anc_loss": "8.234e-01", "dlm_acc": "5.975e-01", "anc_acc": "5.830e-01", "epoch": 0.06678} {"step": 33395, "loss": 0.8598, "grad_norm": "2.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.652e-01", "anc_loss": "7.199e-01", "dlm_acc": "6.310e-01", "anc_acc": "6.135e-01", "epoch": 0.06679} {"step": 33400, "loss": 1.1002, "grad_norm": "4.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.484e-01", "anc_loss": "8.047e-01", "dlm_acc": "6.081e-01", "anc_acc": "5.902e-01", "epoch": 0.0668} {"step": 33405, "loss": 1.0225, "grad_norm": "2.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.731e-01", "anc_acc": "5.485e-01", "epoch": 0.06681} {"step": 33410, "loss": 1.038, "grad_norm": "3.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.176e-01", "anc_loss": "5.492e-01", "dlm_acc": "6.855e-01", "anc_acc": "6.712e-01", "epoch": 0.06682} {"step": 33415, "loss": 1.091, "grad_norm": "5.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.957e-01", "anc_loss": "4.375e-01", "dlm_acc": "7.459e-01", "anc_acc": "7.278e-01", "epoch": 0.06683} {"step": 33420, "loss": 1.0919, "grad_norm": "5.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.141e-01", "anc_loss": "5.824e-01", "dlm_acc": "6.994e-01", "anc_acc": "6.768e-01", "epoch": 0.06684} {"step": 33425, "loss": 1.2719, "grad_norm": "2.945e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.863e-01", "anc_loss": "6.359e-01", "dlm_acc": "6.718e-01", "anc_acc": "6.511e-01", "epoch": 0.06685} {"step": 33430, "loss": 1.0613, "grad_norm": "3.234e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.292e-01", "anc_loss": "5.827e-01", "dlm_acc": "7.670e-01", "anc_acc": "7.538e-01", "epoch": 0.06686} {"step": 33435, "loss": 1.4999, "grad_norm": "2.896e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.566e+00", "anc_loss": "1.692e+00", "dlm_acc": "4.815e-01", "anc_acc": "4.481e-01", "epoch": 0.06687} {"step": 33440, "loss": 1.5289, "grad_norm": "4.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.526e+00", "anc_loss": "1.627e+00", "dlm_acc": "4.860e-01", "anc_acc": "4.625e-01", "epoch": 0.06688} {"step": 33445, "loss": 1.3578, "grad_norm": "3.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.914e-01", "anc_loss": "1.077e+00", "dlm_acc": "6.096e-01", "anc_acc": "5.858e-01", "epoch": 0.06689} {"step": 33450, "loss": 1.2749, "grad_norm": "4.110e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.206e+00", "dlm_acc": "5.267e-01", "anc_acc": "5.000e-01", "epoch": 0.0669} {"step": 33455, "loss": 1.4495, "grad_norm": "4.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.601e-01", "anc_acc": "5.330e-01", "epoch": 0.06691} {"step": 33460, "loss": 1.2504, "grad_norm": "3.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.033e-01", "anc_loss": "1.022e+00", "dlm_acc": "6.649e-01", "anc_acc": "6.311e-01", "epoch": 0.06692} {"step": 33465, "loss": 1.0727, "grad_norm": "1.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.078e+00", "anc_loss": "1.177e+00", "dlm_acc": "5.891e-01", "anc_acc": "5.633e-01", "epoch": 0.06693} {"step": 33470, "loss": 1.4496, "grad_norm": "5.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e+00", "anc_loss": "1.595e+00", "dlm_acc": "5.201e-01", "anc_acc": "4.959e-01", "epoch": 0.06694} {"step": 33475, "loss": 1.2942, "grad_norm": "3.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.039e+00", "anc_loss": "2.089e+00", "dlm_acc": "2.481e-01", "anc_acc": "2.334e-01", "epoch": 0.06695} {"step": 33480, "loss": 1.5144, "grad_norm": "3.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.341e+00", "anc_loss": "1.453e+00", "dlm_acc": "4.865e-01", "anc_acc": "4.583e-01", "epoch": 0.06696} {"step": 33485, "loss": 1.3488, "grad_norm": "2.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.635e+00", "anc_loss": "1.736e+00", "dlm_acc": "4.163e-01", "anc_acc": "3.911e-01", "epoch": 0.06697} {"step": 33490, "loss": 1.1536, "grad_norm": "6.385e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.236e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.761e-01", "epoch": 0.06698} {"step": 33495, "loss": 1.222, "grad_norm": "3.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.284e-01", "anc_loss": "9.177e-01", "dlm_acc": "7.035e-01", "anc_acc": "6.805e-01", "epoch": 0.06699} {"step": 33500, "loss": 0.8561, "grad_norm": "3.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.039e-01", "anc_loss": "2.588e-01", "dlm_acc": "8.893e-01", "anc_acc": "8.669e-01", "epoch": 0.067} {"step": 33505, "loss": 1.0946, "grad_norm": "5.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.090e+00", "anc_loss": "1.203e+00", "dlm_acc": "6.286e-01", "anc_acc": "5.972e-01", "epoch": 0.06701} {"step": 33510, "loss": 1.335, "grad_norm": "3.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.015e+00", "anc_loss": "1.109e+00", "dlm_acc": "5.952e-01", "anc_acc": "5.698e-01", "epoch": 0.06702} {"step": 33515, "loss": 1.3862, "grad_norm": "3.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.206e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.427e-01", "anc_acc": "5.153e-01", "epoch": 0.06703} {"step": 33520, "loss": 1.5894, "grad_norm": "1.004e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.343e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.262e-01", "anc_acc": "4.994e-01", "epoch": 0.06704} {"step": 33525, "loss": 1.3173, "grad_norm": "2.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.442e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.168e-01", "anc_acc": "4.914e-01", "epoch": 0.06705} {"step": 33530, "loss": 1.6213, "grad_norm": "4.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.588e+00", "anc_loss": "1.721e+00", "dlm_acc": "4.345e-01", "anc_acc": "3.906e-01", "epoch": 0.06706} {"step": 33535, "loss": 1.348, "grad_norm": "2.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.677e-01", "anc_acc": "5.447e-01", "epoch": 0.06707} {"step": 33540, "loss": 1.4236, "grad_norm": "5.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.227e+00", "dlm_acc": "6.036e-01", "anc_acc": "5.768e-01", "epoch": 0.06708} {"step": 33545, "loss": 1.3902, "grad_norm": "2.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.275e+00", "dlm_acc": "5.608e-01", "anc_acc": "5.247e-01", "epoch": 0.06709} {"step": 33550, "loss": 1.3858, "grad_norm": "5.862e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.126e+00", "dlm_acc": "6.452e-01", "anc_acc": "6.266e-01", "epoch": 0.0671} {"step": 33555, "loss": 1.2519, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.097e-01", "anc_acc": "4.867e-01", "epoch": 0.06711} {"step": 33560, "loss": 1.2722, "grad_norm": "2.573e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.389e+00", "dlm_acc": "5.932e-01", "anc_acc": "5.609e-01", "epoch": 0.06712} {"step": 33565, "loss": 1.2524, "grad_norm": "4.059e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.625e-01", "anc_loss": "9.289e-01", "dlm_acc": "5.273e-01", "anc_acc": "5.108e-01", "epoch": 0.06713} {"step": 33570, "loss": 1.3197, "grad_norm": "2.395e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.613e-01", "anc_loss": "7.098e-01", "dlm_acc": "5.903e-01", "anc_acc": "5.817e-01", "epoch": 0.06714} {"step": 33575, "loss": 1.2887, "grad_norm": "3.678e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.238e-01", "anc_loss": "8.047e-01", "dlm_acc": "6.562e-01", "anc_acc": "6.190e-01", "epoch": 0.06715} {"step": 33580, "loss": 1.1601, "grad_norm": "9.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.555e-01", "anc_loss": "7.977e-01", "dlm_acc": "5.800e-01", "anc_acc": "5.609e-01", "epoch": 0.06716} {"step": 33585, "loss": 0.9662, "grad_norm": "2.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.375e-01", "anc_loss": "8.141e-01", "dlm_acc": "5.989e-01", "anc_acc": "5.712e-01", "epoch": 0.06717} {"step": 33590, "loss": 0.6518, "grad_norm": "2.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.928e-01", "anc_loss": "4.480e-01", "dlm_acc": "7.972e-01", "anc_acc": "7.784e-01", "epoch": 0.06718} {"step": 33595, "loss": 1.122, "grad_norm": "2.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.551e-01", "anc_loss": "9.242e-01", "dlm_acc": "5.797e-01", "anc_acc": "5.545e-01", "epoch": 0.06719} {"step": 33600, "loss": 1.1966, "grad_norm": "2.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.245e+00", "dlm_acc": "5.866e-01", "anc_acc": "5.612e-01", "epoch": 0.0672} {"step": 33605, "loss": 1.1366, "grad_norm": "3.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.234e+00", "dlm_acc": "6.153e-01", "anc_acc": "5.884e-01", "epoch": 0.06721} {"step": 33610, "loss": 1.5829, "grad_norm": "3.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.012e-01", "anc_loss": "6.508e-01", "dlm_acc": "6.667e-01", "anc_acc": "6.457e-01", "epoch": 0.06722} {"step": 33615, "loss": 1.0235, "grad_norm": "3.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.828e-01", "anc_loss": "6.453e-01", "dlm_acc": "6.810e-01", "anc_acc": "6.473e-01", "epoch": 0.06723} {"step": 33620, "loss": 0.7402, "grad_norm": "8.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.563e-01", "anc_loss": "5.953e-01", "dlm_acc": "5.998e-01", "anc_acc": "5.817e-01", "epoch": 0.06724} {"step": 33625, "loss": 1.5319, "grad_norm": "4.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.552e+00", "anc_loss": "1.643e+00", "dlm_acc": "4.689e-01", "anc_acc": "4.470e-01", "epoch": 0.06725} {"step": 33630, "loss": 1.5239, "grad_norm": "1.628e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.435e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.545e-01", "anc_acc": "5.237e-01", "epoch": 0.06726} {"step": 33635, "loss": 1.3457, "grad_norm": "2.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.250e-01", "anc_loss": "8.941e-01", "dlm_acc": "6.386e-01", "anc_acc": "6.189e-01", "epoch": 0.06727} {"step": 33640, "loss": 1.4101, "grad_norm": "4.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.112e+00", "dlm_acc": "5.860e-01", "anc_acc": "5.590e-01", "epoch": 0.06728} {"step": 33645, "loss": 1.4661, "grad_norm": "3.456e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.208e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.692e-01", "anc_acc": "5.464e-01", "epoch": 0.06729} {"step": 33650, "loss": 1.6117, "grad_norm": "4.094e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.868e+00", "anc_loss": "1.871e+00", "dlm_acc": "3.456e-01", "anc_acc": "3.450e-01", "epoch": 0.0673} {"step": 33655, "loss": 1.5863, "grad_norm": "5.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.388e+00", "anc_loss": "2.441e+00", "dlm_acc": "2.196e-01", "anc_acc": "2.077e-01", "epoch": 0.06731} {"step": 33660, "loss": 1.4584, "grad_norm": "4.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.016e-01", "anc_loss": "9.883e-01", "dlm_acc": "6.245e-01", "anc_acc": "6.025e-01", "epoch": 0.06732} {"step": 33665, "loss": 1.2486, "grad_norm": "3.370e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.422e-01", "anc_loss": "5.539e-01", "dlm_acc": "7.773e-01", "anc_acc": "7.393e-01", "epoch": 0.06733} {"step": 33670, "loss": 1.2205, "grad_norm": "2.365e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.715e-01", "anc_loss": "9.078e-01", "dlm_acc": "6.801e-01", "anc_acc": "6.414e-01", "epoch": 0.06734} {"step": 33675, "loss": 1.334, "grad_norm": "5.132e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.113e-01", "anc_acc": "4.812e-01", "epoch": 0.06735} {"step": 33680, "loss": 1.2084, "grad_norm": "4.956e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.133e+00", "dlm_acc": "6.434e-01", "anc_acc": "6.201e-01", "epoch": 0.06736} {"step": 33685, "loss": 1.2832, "grad_norm": "3.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.703e-01", "anc_loss": "5.941e-01", "dlm_acc": "5.950e-01", "anc_acc": "5.801e-01", "epoch": 0.06737} {"step": 33690, "loss": 0.8491, "grad_norm": "3.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.955e-01", "anc_loss": "1.002e+00", "dlm_acc": "6.526e-01", "anc_acc": "6.239e-01", "epoch": 0.06738} {"step": 33695, "loss": 0.8712, "grad_norm": "2.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.309e-01", "anc_loss": "8.078e-01", "dlm_acc": "6.926e-01", "anc_acc": "6.695e-01", "epoch": 0.06739} {"step": 33700, "loss": 1.2798, "grad_norm": "4.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.305e-01", "anc_loss": "7.855e-01", "dlm_acc": "6.103e-01", "anc_acc": "5.882e-01", "epoch": 0.0674} {"step": 33705, "loss": 1.6215, "grad_norm": "6.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.245e+00", "dlm_acc": "5.871e-01", "anc_acc": "5.684e-01", "epoch": 0.06741} {"step": 33710, "loss": 1.6781, "grad_norm": "5.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.464e-01", "anc_acc": "5.230e-01", "epoch": 0.06742} {"step": 33715, "loss": 1.5538, "grad_norm": "2.622e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.200e+00", "dlm_acc": "5.869e-01", "anc_acc": "5.535e-01", "epoch": 0.06743} {"step": 33720, "loss": 1.5411, "grad_norm": "4.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.389e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.138e-01", "anc_acc": "4.920e-01", "epoch": 0.06744} {"step": 33725, "loss": 1.5617, "grad_norm": "4.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.050e+00", "anc_loss": "1.125e+00", "dlm_acc": "5.430e-01", "anc_acc": "5.233e-01", "epoch": 0.06745} {"step": 33730, "loss": 1.4912, "grad_norm": "2.632e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.277e+00", "dlm_acc": "4.484e-01", "anc_acc": "4.353e-01", "epoch": 0.06746} {"step": 33735, "loss": 1.4884, "grad_norm": "3.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.150e-01", "anc_acc": "4.841e-01", "epoch": 0.06747} {"step": 33740, "loss": 1.3784, "grad_norm": "4.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.297e+00", "dlm_acc": "5.472e-01", "anc_acc": "5.165e-01", "epoch": 0.06748} {"step": 33745, "loss": 1.4507, "grad_norm": "3.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.299e+00", "anc_loss": "1.470e+00", "dlm_acc": "5.310e-01", "anc_acc": "4.994e-01", "epoch": 0.06749} {"step": 33750, "loss": 1.0729, "grad_norm": "2.732e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.758e-01", "anc_loss": "1.051e+00", "dlm_acc": "6.482e-01", "anc_acc": "5.903e-01", "epoch": 0.0675} {"step": 33755, "loss": 1.0151, "grad_norm": "7.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.007e+00", "anc_loss": "1.137e+00", "dlm_acc": "5.983e-01", "anc_acc": "5.577e-01", "epoch": 0.06751} {"step": 33760, "loss": 1.1322, "grad_norm": "3.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.158e+00", "dlm_acc": "6.170e-01", "anc_acc": "5.919e-01", "epoch": 0.06752} {"step": 33765, "loss": 1.1092, "grad_norm": "3.101e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.095e-01", "anc_loss": "8.804e-01", "dlm_acc": "6.406e-01", "anc_acc": "6.217e-01", "epoch": 0.06753} {"step": 33770, "loss": 1.2839, "grad_norm": "3.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.047e+00", "anc_loss": "1.135e+00", "dlm_acc": "5.372e-01", "anc_acc": "5.153e-01", "epoch": 0.06754} {"step": 33775, "loss": 1.4748, "grad_norm": "3.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.622e-01", "anc_acc": "5.326e-01", "epoch": 0.06755} {"step": 33780, "loss": 1.2554, "grad_norm": "2.231e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.527e-01", "anc_loss": "6.535e-01", "dlm_acc": "7.971e-01", "anc_acc": "7.632e-01", "epoch": 0.06756} {"step": 33785, "loss": 1.51, "grad_norm": "2.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.255e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.015e-01", "anc_acc": "4.636e-01", "epoch": 0.06757} {"step": 33790, "loss": 1.3067, "grad_norm": "3.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.146e+00", "anc_loss": "1.251e+00", "dlm_acc": "5.509e-01", "anc_acc": "5.138e-01", "epoch": 0.06758} {"step": 33795, "loss": 1.6406, "grad_norm": "2.930e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.536e+00", "dlm_acc": "5.044e-01", "anc_acc": "4.513e-01", "epoch": 0.06759} {"step": 33800, "loss": 1.5661, "grad_norm": "3.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.544e+00", "dlm_acc": "4.706e-01", "anc_acc": "4.410e-01", "epoch": 0.0676} {"step": 33805, "loss": 1.7097, "grad_norm": "3.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.606e+00", "dlm_acc": "5.403e-01", "anc_acc": "4.962e-01", "epoch": 0.06761} {"step": 33810, "loss": 1.4299, "grad_norm": "4.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.448e-01", "anc_acc": "4.997e-01", "epoch": 0.06762} {"step": 33815, "loss": 1.3966, "grad_norm": "2.918e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.481e+00", "dlm_acc": "5.325e-01", "anc_acc": "5.092e-01", "epoch": 0.06763} {"step": 33820, "loss": 1.4509, "grad_norm": "2.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.476e-01", "anc_acc": "5.186e-01", "epoch": 0.06764} {"step": 33825, "loss": 1.1641, "grad_norm": "2.173e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.844e-01", "anc_loss": "1.064e+00", "dlm_acc": "5.747e-01", "anc_acc": "5.538e-01", "epoch": 0.06765} {"step": 33830, "loss": 1.0784, "grad_norm": "5.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.996e-01", "anc_loss": "7.754e-01", "dlm_acc": "6.969e-01", "anc_acc": "6.722e-01", "epoch": 0.06766} {"step": 33835, "loss": 1.0932, "grad_norm": "4.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.130e+00", "dlm_acc": "6.123e-01", "anc_acc": "5.717e-01", "epoch": 0.06767} {"step": 33840, "loss": 1.2533, "grad_norm": "2.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.400e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.115e-01", "epoch": 0.06768} {"step": 33845, "loss": 0.9842, "grad_norm": "3.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.203e-01", "anc_loss": "8.648e-01", "dlm_acc": "7.033e-01", "anc_acc": "6.415e-01", "epoch": 0.06769} {"step": 33850, "loss": 1.3734, "grad_norm": "4.440e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.651e+00", "anc_loss": "1.749e+00", "dlm_acc": "3.962e-01", "anc_acc": "3.716e-01", "epoch": 0.0677} {"step": 33855, "loss": 1.314, "grad_norm": "2.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.460e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.368e-01", "epoch": 0.06771} {"step": 33860, "loss": 1.5286, "grad_norm": "2.273e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.503e-01", "anc_loss": "8.992e-01", "dlm_acc": "7.398e-01", "anc_acc": "7.316e-01", "epoch": 0.06772} {"step": 33865, "loss": 0.937, "grad_norm": "3.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.369e-01", "anc_loss": "5.027e-01", "dlm_acc": "7.600e-01", "anc_acc": "7.348e-01", "epoch": 0.06773} {"step": 33870, "loss": 1.0167, "grad_norm": "3.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.047e-01", "anc_loss": "4.369e-01", "dlm_acc": "7.193e-01", "anc_acc": "7.012e-01", "epoch": 0.06774} {"step": 33875, "loss": 0.8129, "grad_norm": "1.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.471e-01", "anc_loss": "4.771e-01", "dlm_acc": "6.603e-01", "anc_acc": "6.388e-01", "epoch": 0.06775} {"step": 33880, "loss": 0.8017, "grad_norm": "4.545e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.666e-01", "anc_loss": "2.996e-01", "dlm_acc": "8.101e-01", "anc_acc": "7.851e-01", "epoch": 0.06776} {"step": 33885, "loss": 0.995, "grad_norm": "3.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.312e-01", "anc_loss": "3.641e-01", "dlm_acc": "7.777e-01", "anc_acc": "7.553e-01", "epoch": 0.06777} {"step": 33890, "loss": 0.9747, "grad_norm": "2.238e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.488e-01", "anc_loss": "5.602e-01", "dlm_acc": "7.603e-01", "anc_acc": "7.153e-01", "epoch": 0.06778} {"step": 33895, "loss": 1.2896, "grad_norm": "4.557e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.696e-01", "anc_acc": "5.235e-01", "epoch": 0.06779} {"step": 33900, "loss": 1.3545, "grad_norm": "3.207e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.338e+00", "dlm_acc": "5.569e-01", "anc_acc": "5.324e-01", "epoch": 0.0678} {"step": 33905, "loss": 1.5051, "grad_norm": "3.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.798e+00", "anc_loss": "1.862e+00", "dlm_acc": "3.780e-01", "anc_acc": "3.622e-01", "epoch": 0.06781} {"step": 33910, "loss": 1.3261, "grad_norm": "2.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.477e+00", "anc_loss": "2.498e+00", "dlm_acc": "1.116e-01", "anc_acc": "9.784e-02", "epoch": 0.06782} {"step": 33915, "loss": 1.1165, "grad_norm": "3.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.723e-01", "anc_loss": "8.031e-01", "dlm_acc": "4.391e-01", "anc_acc": "4.168e-01", "epoch": 0.06783} {"step": 33920, "loss": 0.9452, "grad_norm": "2.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.449e-01", "anc_loss": "6.617e-01", "dlm_acc": "5.170e-01", "anc_acc": "5.053e-01", "epoch": 0.06784} {"step": 33925, "loss": 1.2076, "grad_norm": "3.332e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.258e-01", "anc_loss": "7.469e-01", "dlm_acc": "5.022e-01", "anc_acc": "4.897e-01", "epoch": 0.06785} {"step": 33930, "loss": 0.8702, "grad_norm": "2.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.320e-01", "anc_loss": "5.484e-01", "dlm_acc": "5.363e-01", "anc_acc": "5.195e-01", "epoch": 0.06786} {"step": 33935, "loss": 1.1434, "grad_norm": "3.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.082e-01", "anc_loss": "6.328e-01", "dlm_acc": "5.130e-01", "anc_acc": "4.909e-01", "epoch": 0.06787} {"step": 33940, "loss": 1.1283, "grad_norm": "2.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.141e-01", "anc_loss": "7.383e-01", "dlm_acc": "4.951e-01", "anc_acc": "4.775e-01", "epoch": 0.06788} {"step": 33945, "loss": 1.1872, "grad_norm": "4.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.026e+00", "anc_loss": "1.055e+00", "dlm_acc": "4.009e-01", "anc_acc": "3.775e-01", "epoch": 0.06789} {"step": 33950, "loss": 1.3196, "grad_norm": "3.471e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.376e-01", "anc_acc": "5.117e-01", "epoch": 0.0679} {"step": 33955, "loss": 1.4368, "grad_norm": "3.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.600e-01", "anc_acc": "5.295e-01", "epoch": 0.06791} {"step": 33960, "loss": 1.3564, "grad_norm": "3.263e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.768e-01", "anc_loss": "8.988e-01", "dlm_acc": "6.994e-01", "anc_acc": "6.665e-01", "epoch": 0.06792} {"step": 33965, "loss": 1.3526, "grad_norm": "3.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.727e-01", "anc_acc": "5.320e-01", "epoch": 0.06793} {"step": 33970, "loss": 1.4462, "grad_norm": "4.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.613e-01", "anc_acc": "5.305e-01", "epoch": 0.06794} {"step": 33975, "loss": 1.6497, "grad_norm": "4.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.431e-01", "anc_acc": "5.192e-01", "epoch": 0.06795} {"step": 33980, "loss": 1.4706, "grad_norm": "3.473e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.525e+00", "dlm_acc": "5.248e-01", "anc_acc": "4.901e-01", "epoch": 0.06796} {"step": 33985, "loss": 1.2738, "grad_norm": "4.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.633e+00", "dlm_acc": "5.210e-01", "anc_acc": "4.903e-01", "epoch": 0.06797} {"step": 33990, "loss": 0.841, "grad_norm": "3.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.162e+00", "dlm_acc": "5.808e-01", "anc_acc": "5.569e-01", "epoch": 0.06798} {"step": 33995, "loss": 1.2733, "grad_norm": "4.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.198e+00", "dlm_acc": "6.330e-01", "anc_acc": "6.035e-01", "epoch": 0.06799} {"step": 34000, "loss": 0.959, "grad_norm": "3.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.486e+00", "anc_loss": "1.573e+00", "dlm_acc": "4.915e-01", "anc_acc": "4.694e-01", "epoch": 0.068} {"step": 34005, "loss": 1.3313, "grad_norm": "3.879e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.465e+00", "dlm_acc": "5.753e-01", "anc_acc": "5.342e-01", "epoch": 0.06801} {"step": 34010, "loss": 1.1245, "grad_norm": "2.324e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.460e+00", "dlm_acc": "5.747e-01", "anc_acc": "5.447e-01", "epoch": 0.06802} {"step": 34015, "loss": 1.1835, "grad_norm": "3.569e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.938e+00", "anc_loss": "2.011e+00", "dlm_acc": "3.626e-01", "anc_acc": "3.448e-01", "epoch": 0.06803} {"step": 34020, "loss": 1.0099, "grad_norm": "3.525e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.705e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.595e-01", "anc_acc": "6.380e-01", "epoch": 0.06804} {"step": 34025, "loss": 1.0583, "grad_norm": "2.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.258e-01", "anc_loss": "7.859e-01", "dlm_acc": "6.714e-01", "anc_acc": "6.513e-01", "epoch": 0.06805} {"step": 34030, "loss": 1.0914, "grad_norm": "3.006e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.680e-01", "anc_loss": "1.087e+00", "dlm_acc": "6.250e-01", "anc_acc": "5.914e-01", "epoch": 0.06806} {"step": 34035, "loss": 1.2381, "grad_norm": "2.598e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.250e+00", "dlm_acc": "6.055e-01", "anc_acc": "5.641e-01", "epoch": 0.06807} {"step": 34040, "loss": 1.5754, "grad_norm": "3.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.628e-01", "anc_acc": "5.263e-01", "epoch": 0.06808} {"step": 34045, "loss": 1.6827, "grad_norm": "3.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.725e-01", "anc_loss": "8.982e-01", "dlm_acc": "7.307e-01", "anc_acc": "6.894e-01", "epoch": 0.06809} {"step": 34050, "loss": 1.3399, "grad_norm": "2.590e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.436e-01", "anc_acc": "5.184e-01", "epoch": 0.0681} {"step": 34055, "loss": 1.1383, "grad_norm": "1.887e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.973e-01", "anc_loss": "9.771e-01", "dlm_acc": "6.518e-01", "anc_acc": "6.291e-01", "epoch": 0.06811} {"step": 34060, "loss": 1.9039, "grad_norm": "3.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.407e+00", "dlm_acc": "5.815e-01", "anc_acc": "5.570e-01", "epoch": 0.06812} {"step": 34065, "loss": 1.4373, "grad_norm": "2.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.101e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.332e-01", "epoch": 0.06813} {"step": 34070, "loss": 1.5272, "grad_norm": "3.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.675e+00", "dlm_acc": "5.037e-01", "anc_acc": "4.681e-01", "epoch": 0.06814} {"step": 34075, "loss": 1.4181, "grad_norm": "5.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.646e-01", "anc_loss": "1.057e+00", "dlm_acc": "6.754e-01", "anc_acc": "6.475e-01", "epoch": 0.06815} {"step": 34080, "loss": 1.1219, "grad_norm": "3.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.028e+00", "anc_loss": "1.183e+00", "dlm_acc": "6.190e-01", "anc_acc": "5.760e-01", "epoch": 0.06816} {"step": 34085, "loss": 1.2502, "grad_norm": "5.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.251e+00", "anc_loss": "1.326e+00", "dlm_acc": "5.184e-01", "anc_acc": "5.022e-01", "epoch": 0.06817} {"step": 34090, "loss": 1.2094, "grad_norm": "3.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.289e+00", "dlm_acc": "5.963e-01", "anc_acc": "5.534e-01", "epoch": 0.06818} {"step": 34095, "loss": 1.4042, "grad_norm": "3.997e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.238e-01", "anc_loss": "1.004e+00", "dlm_acc": "6.339e-01", "anc_acc": "6.099e-01", "epoch": 0.06819} {"step": 34100, "loss": 1.5609, "grad_norm": "4.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.409e+00", "anc_loss": "2.422e+00", "dlm_acc": "2.733e-02", "anc_acc": "2.575e-02", "epoch": 0.0682} {"step": 34105, "loss": 1.7896, "grad_norm": "5.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.148e+00", "anc_loss": "2.234e+00", "dlm_acc": "3.205e-01", "anc_acc": "3.017e-01", "epoch": 0.06821} {"step": 34110, "loss": 1.5951, "grad_norm": "2.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.794e+00", "anc_loss": "1.892e+00", "dlm_acc": "4.168e-01", "anc_acc": "3.932e-01", "epoch": 0.06822} {"step": 34115, "loss": 1.1143, "grad_norm": "2.481e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.152e+00", "dlm_acc": "5.954e-01", "anc_acc": "5.670e-01", "epoch": 0.06823} {"step": 34120, "loss": 1.2424, "grad_norm": "4.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.388e+00", "dlm_acc": "5.243e-01", "anc_acc": "5.004e-01", "epoch": 0.06824} {"step": 34125, "loss": 1.4239, "grad_norm": "7.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.164e+00", "dlm_acc": "6.733e-01", "anc_acc": "6.546e-01", "epoch": 0.06825} {"step": 34130, "loss": 1.2216, "grad_norm": "2.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.818e-01", "anc_acc": "5.537e-01", "epoch": 0.06826} {"step": 34135, "loss": 1.3961, "grad_norm": "2.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.511e+00", "dlm_acc": "5.531e-01", "anc_acc": "5.296e-01", "epoch": 0.06827} {"step": 34140, "loss": 1.5655, "grad_norm": "2.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.561e+00", "dlm_acc": "5.080e-01", "anc_acc": "4.841e-01", "epoch": 0.06828} {"step": 34145, "loss": 1.4383, "grad_norm": "4.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.607e+00", "dlm_acc": "4.991e-01", "anc_acc": "4.746e-01", "epoch": 0.06829} {"step": 34150, "loss": 1.557, "grad_norm": "3.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.720e+00", "anc_loss": "1.847e+00", "dlm_acc": "4.873e-01", "anc_acc": "4.614e-01", "epoch": 0.0683} {"step": 34155, "loss": 1.4492, "grad_norm": "3.879e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.617e-01", "anc_acc": "5.382e-01", "epoch": 0.06831} {"step": 34160, "loss": 1.5396, "grad_norm": "3.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.958e+00", "anc_loss": "2.019e+00", "dlm_acc": "3.360e-01", "anc_acc": "3.224e-01", "epoch": 0.06832} {"step": 34165, "loss": 1.0107, "grad_norm": "2.713e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.039e-01", "anc_loss": "3.262e-01", "dlm_acc": "8.588e-01", "anc_acc": "8.474e-01", "epoch": 0.06833} {"step": 34170, "loss": 0.9183, "grad_norm": "4.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.699e-02", "anc_loss": "7.231e-02", "dlm_acc": "9.796e-01", "anc_acc": "9.776e-01", "epoch": 0.06834} {"step": 34175, "loss": 1.4292, "grad_norm": "5.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.288e+00", "dlm_acc": "5.888e-01", "anc_acc": "5.688e-01", "epoch": 0.06835} {"step": 34180, "loss": 1.433, "grad_norm": "4.095e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.716e+00", "anc_loss": "1.847e+00", "dlm_acc": "5.041e-01", "anc_acc": "4.757e-01", "epoch": 0.06836} {"step": 34185, "loss": 1.5667, "grad_norm": "3.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.511e+00", "dlm_acc": "5.147e-01", "anc_acc": "4.886e-01", "epoch": 0.06837} {"step": 34190, "loss": 1.745, "grad_norm": "5.573e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.613e+00", "dlm_acc": "5.107e-01", "anc_acc": "4.827e-01", "epoch": 0.06838} {"step": 34195, "loss": 1.6264, "grad_norm": "2.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.178e+00", "anc_loss": "2.275e+00", "dlm_acc": "2.436e-01", "anc_acc": "2.252e-01", "epoch": 0.06839} {"step": 34200, "loss": 1.3604, "grad_norm": "3.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.482e-01", "anc_acc": "5.226e-01", "epoch": 0.0684} {"step": 34205, "loss": 1.3146, "grad_norm": "2.550e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.494e+00", "anc_loss": "1.607e+00", "dlm_acc": "5.177e-01", "anc_acc": "4.931e-01", "epoch": 0.06841} {"step": 34210, "loss": 1.3134, "grad_norm": "2.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.346e-01", "anc_acc": "5.076e-01", "epoch": 0.06842} {"step": 34215, "loss": 1.3335, "grad_norm": "4.048e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.188e-01", "epoch": 0.06843} {"step": 34220, "loss": 1.2942, "grad_norm": "3.403e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.865e-01", "anc_acc": "5.545e-01", "epoch": 0.06844} {"step": 34225, "loss": 1.2696, "grad_norm": "2.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.163e+00", "dlm_acc": "6.417e-01", "anc_acc": "6.103e-01", "epoch": 0.06845} {"step": 34230, "loss": 1.6132, "grad_norm": "3.263e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.566e+00", "dlm_acc": "5.670e-01", "anc_acc": "5.381e-01", "epoch": 0.06846} {"step": 34235, "loss": 1.2986, "grad_norm": "2.608e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.340e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.352e-01", "anc_acc": "5.113e-01", "epoch": 0.06847} {"step": 34240, "loss": 1.4811, "grad_norm": "3.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.429e-01", "anc_acc": "5.175e-01", "epoch": 0.06848} {"step": 34245, "loss": 1.3332, "grad_norm": "3.306e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.635e-01", "anc_acc": "5.367e-01", "epoch": 0.06849} {"step": 34250, "loss": 1.9719, "grad_norm": "3.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.863e+00", "anc_loss": "1.980e+00", "dlm_acc": "4.481e-01", "anc_acc": "4.255e-01", "epoch": 0.0685} {"step": 34255, "loss": 1.1035, "grad_norm": "2.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.110e+00", "dlm_acc": "5.894e-01", "anc_acc": "5.587e-01", "epoch": 0.06851} {"step": 34260, "loss": 1.4516, "grad_norm": "4.276e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.415e+00", "dlm_acc": "6.170e-01", "anc_acc": "5.895e-01", "epoch": 0.06852} {"step": 34265, "loss": 1.1214, "grad_norm": "2.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.163e+00", "anc_loss": "1.273e+00", "dlm_acc": "5.806e-01", "anc_acc": "5.506e-01", "epoch": 0.06853} {"step": 34270, "loss": 1.4312, "grad_norm": "3.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.522e+00", "anc_loss": "1.642e+00", "dlm_acc": "5.027e-01", "anc_acc": "4.791e-01", "epoch": 0.06854} {"step": 34275, "loss": 1.3616, "grad_norm": "4.053e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.484e+00", "anc_loss": "1.604e+00", "dlm_acc": "5.047e-01", "anc_acc": "4.787e-01", "epoch": 0.06855} {"step": 34280, "loss": 1.2188, "grad_norm": "2.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.228e+00", "dlm_acc": "5.958e-01", "anc_acc": "5.648e-01", "epoch": 0.06856} {"step": 34285, "loss": 1.1505, "grad_norm": "3.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.436e-01", "anc_acc": "5.175e-01", "epoch": 0.06857} {"step": 34290, "loss": 0.8225, "grad_norm": "2.048e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.365e-01", "anc_loss": "5.232e-01", "dlm_acc": "8.239e-01", "anc_acc": "8.024e-01", "epoch": 0.06858} {"step": 34295, "loss": 1.2242, "grad_norm": "3.431e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.852e-01", "anc_acc": "5.573e-01", "epoch": 0.06859} {"step": 34300, "loss": 1.328, "grad_norm": "3.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.175e+00", "dlm_acc": "6.085e-01", "anc_acc": "5.810e-01", "epoch": 0.0686} {"step": 34305, "loss": 1.1701, "grad_norm": "2.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.289e-01", "anc_loss": "1.009e+00", "dlm_acc": "6.104e-01", "anc_acc": "5.887e-01", "epoch": 0.06861} {"step": 34310, "loss": 1.6066, "grad_norm": "2.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.556e+00", "dlm_acc": "5.277e-01", "anc_acc": "5.072e-01", "epoch": 0.06862} {"step": 34315, "loss": 1.6094, "grad_norm": "3.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.580e+00", "anc_loss": "1.720e+00", "dlm_acc": "5.291e-01", "anc_acc": "5.020e-01", "epoch": 0.06863} {"step": 34320, "loss": 1.1473, "grad_norm": "5.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.226e+00", "dlm_acc": "5.885e-01", "anc_acc": "5.630e-01", "epoch": 0.06864} {"step": 34325, "loss": 1.2746, "grad_norm": "3.245e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.564e+00", "anc_loss": "1.691e+00", "dlm_acc": "5.155e-01", "anc_acc": "4.846e-01", "epoch": 0.06865} {"step": 34330, "loss": 1.091, "grad_norm": "2.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.664e-01", "anc_loss": "8.582e-01", "dlm_acc": "7.032e-01", "anc_acc": "6.812e-01", "epoch": 0.06866} {"step": 34335, "loss": 1.8851, "grad_norm": "3.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.395e-01", "anc_loss": "5.520e-01", "dlm_acc": "6.626e-01", "anc_acc": "6.555e-01", "epoch": 0.06867} {"step": 34340, "loss": 0.9829, "grad_norm": "5.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.027e-01", "anc_loss": "4.145e-01", "dlm_acc": "6.991e-01", "anc_acc": "6.946e-01", "epoch": 0.06868} {"step": 34345, "loss": 1.3282, "grad_norm": "4.388e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.051e-01", "anc_loss": "4.180e-01", "dlm_acc": "6.794e-01", "anc_acc": "6.738e-01", "epoch": 0.06869} {"step": 34350, "loss": 1.2256, "grad_norm": "5.928e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.416e-01", "anc_loss": "8.061e-01", "dlm_acc": "6.764e-01", "anc_acc": "6.585e-01", "epoch": 0.0687} {"step": 34355, "loss": 1.4983, "grad_norm": "5.636e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.680e+00", "anc_loss": "1.803e+00", "dlm_acc": "5.031e-01", "anc_acc": "4.753e-01", "epoch": 0.06871} {"step": 34360, "loss": 1.2574, "grad_norm": "2.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.279e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.233e-01", "epoch": 0.06872} {"step": 34365, "loss": 1.2804, "grad_norm": "3.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.072e+00", "anc_loss": "1.209e+00", "dlm_acc": "6.074e-01", "anc_acc": "5.746e-01", "epoch": 0.06873} {"step": 34370, "loss": 1.5593, "grad_norm": "3.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.638e+00", "dlm_acc": "4.165e-01", "anc_acc": "3.965e-01", "epoch": 0.06874} {"step": 34375, "loss": 1.2448, "grad_norm": "2.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.061e+00", "anc_loss": "1.182e+00", "dlm_acc": "6.250e-01", "anc_acc": "5.961e-01", "epoch": 0.06875} {"step": 34380, "loss": 1.1347, "grad_norm": "3.149e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.902e-01", "anc_loss": "2.203e-01", "dlm_acc": "8.988e-01", "anc_acc": "8.884e-01", "epoch": 0.06876} {"step": 34385, "loss": 1.6096, "grad_norm": "3.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.281e+00", "dlm_acc": "6.281e-01", "anc_acc": "6.017e-01", "epoch": 0.06877} {"step": 34390, "loss": 1.4087, "grad_norm": "4.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.303e+00", "dlm_acc": "5.861e-01", "anc_acc": "5.493e-01", "epoch": 0.06878} {"step": 34395, "loss": 1.6794, "grad_norm": "3.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.020e+00", "anc_loss": "1.080e+00", "dlm_acc": "5.080e-01", "anc_acc": "4.886e-01", "epoch": 0.06879} {"step": 34400, "loss": 0.9745, "grad_norm": "1.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.047e-01", "anc_loss": "8.074e-01", "dlm_acc": "6.771e-01", "anc_acc": "6.445e-01", "epoch": 0.0688} {"step": 34405, "loss": 1.0267, "grad_norm": "1.485e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.215e-01", "anc_loss": "6.719e-01", "dlm_acc": "5.529e-01", "anc_acc": "5.299e-01", "epoch": 0.06881} {"step": 34410, "loss": 1.0592, "grad_norm": "3.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.172e+00", "dlm_acc": "4.307e-01", "anc_acc": "4.142e-01", "epoch": 0.06882} {"step": 34415, "loss": 1.231, "grad_norm": "9.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.450e+00", "dlm_acc": "4.480e-01", "anc_acc": "4.280e-01", "epoch": 0.06883} {"step": 34420, "loss": 1.2076, "grad_norm": "4.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.278e+00", "anc_loss": "1.351e+00", "dlm_acc": "4.923e-01", "anc_acc": "4.741e-01", "epoch": 0.06884} {"step": 34425, "loss": 1.3873, "grad_norm": "2.856e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.444e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.033e-01", "anc_acc": "4.801e-01", "epoch": 0.06885} {"step": 34430, "loss": 1.4468, "grad_norm": "3.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.739e-01", "anc_acc": "5.505e-01", "epoch": 0.06886} {"step": 34435, "loss": 1.8576, "grad_norm": "2.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.180e-01", "anc_acc": "4.798e-01", "epoch": 0.06887} {"step": 34440, "loss": 1.1148, "grad_norm": "2.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.216e+00", "dlm_acc": "6.084e-01", "anc_acc": "5.830e-01", "epoch": 0.06888} {"step": 34445, "loss": 1.1932, "grad_norm": "3.632e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.548e+00", "dlm_acc": "5.229e-01", "anc_acc": "4.990e-01", "epoch": 0.06889} {"step": 34450, "loss": 1.6169, "grad_norm": "2.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.719e+00", "dlm_acc": "4.980e-01", "anc_acc": "4.624e-01", "epoch": 0.0689} {"step": 34455, "loss": 1.825, "grad_norm": "3.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.444e+00", "anc_loss": "1.556e+00", "dlm_acc": "5.273e-01", "anc_acc": "5.039e-01", "epoch": 0.06891} {"step": 34460, "loss": 1.6712, "grad_norm": "4.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.670e+00", "anc_loss": "1.805e+00", "dlm_acc": "4.894e-01", "anc_acc": "4.582e-01", "epoch": 0.06892} {"step": 34465, "loss": 1.3769, "grad_norm": "4.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.331e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.394e-01", "anc_acc": "5.091e-01", "epoch": 0.06893} {"step": 34470, "loss": 1.2249, "grad_norm": "2.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.787e-01", "anc_loss": "9.603e-01", "dlm_acc": "6.581e-01", "anc_acc": "6.322e-01", "epoch": 0.06894} {"step": 34475, "loss": 1.0289, "grad_norm": "2.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.357e-01", "anc_loss": "5.071e-01", "dlm_acc": "7.917e-01", "anc_acc": "7.649e-01", "epoch": 0.06895} {"step": 34480, "loss": 1.2268, "grad_norm": "3.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.128e+00", "anc_loss": "1.228e+00", "dlm_acc": "6.134e-01", "anc_acc": "5.894e-01", "epoch": 0.06896} {"step": 34485, "loss": 1.1572, "grad_norm": "3.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.354e+00", "dlm_acc": "5.793e-01", "anc_acc": "5.257e-01", "epoch": 0.06897} {"step": 34490, "loss": 1.0972, "grad_norm": "5.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.777e-01", "anc_loss": "9.930e-01", "dlm_acc": "6.915e-01", "anc_acc": "6.558e-01", "epoch": 0.06898} {"step": 34495, "loss": 1.2702, "grad_norm": "2.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.664e-01", "anc_loss": "1.065e+00", "dlm_acc": "6.346e-01", "anc_acc": "6.061e-01", "epoch": 0.06899} {"step": 34500, "loss": 0.8867, "grad_norm": "3.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.695e-01", "anc_loss": "1.063e+00", "dlm_acc": "5.811e-01", "anc_acc": "5.516e-01", "epoch": 0.069} {"step": 34505, "loss": 1.1814, "grad_norm": "5.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.658e+00", "anc_loss": "1.769e+00", "dlm_acc": "5.109e-01", "anc_acc": "4.859e-01", "epoch": 0.06901} {"step": 34510, "loss": 0.9525, "grad_norm": "3.516e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.495e-01", "anc_acc": "5.170e-01", "epoch": 0.06902} {"step": 34515, "loss": 1.1048, "grad_norm": "3.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.266e+00", "dlm_acc": "6.316e-01", "anc_acc": "6.026e-01", "epoch": 0.06903} {"step": 34520, "loss": 0.9634, "grad_norm": "3.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.478e+00", "dlm_acc": "5.591e-01", "anc_acc": "5.297e-01", "epoch": 0.06904} {"step": 34525, "loss": 1.2715, "grad_norm": "4.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.408e-01", "anc_acc": "5.135e-01", "epoch": 0.06905} {"step": 34530, "loss": 0.8552, "grad_norm": "7.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.758e-01", "anc_loss": "9.844e-01", "dlm_acc": "6.568e-01", "anc_acc": "6.229e-01", "epoch": 0.06906} {"step": 34535, "loss": 0.9822, "grad_norm": "2.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.321e-01", "anc_acc": "5.088e-01", "epoch": 0.06907} {"step": 34540, "loss": 1.0444, "grad_norm": "3.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.564e+00", "dlm_acc": "5.503e-01", "anc_acc": "5.201e-01", "epoch": 0.06908} {"step": 34545, "loss": 0.9167, "grad_norm": "3.146e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.283e+00", "anc_loss": "1.399e+00", "dlm_acc": "5.549e-01", "anc_acc": "5.267e-01", "epoch": 0.06909} {"step": 34550, "loss": 0.8323, "grad_norm": "5.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.534e-01", "anc_acc": "5.290e-01", "epoch": 0.0691} {"step": 34555, "loss": 1.2321, "grad_norm": "2.983e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.392e+00", "anc_loss": "1.508e+00", "dlm_acc": "5.389e-01", "anc_acc": "5.116e-01", "epoch": 0.06911} {"step": 34560, "loss": 1.0366, "grad_norm": "3.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.584e+00", "dlm_acc": "5.375e-01", "anc_acc": "5.068e-01", "epoch": 0.06912} {"step": 34565, "loss": 1.1604, "grad_norm": "2.791e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.404e+00", "dlm_acc": "5.779e-01", "anc_acc": "5.521e-01", "epoch": 0.06913} {"step": 34570, "loss": 1.2727, "grad_norm": "6.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.331e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.588e-01", "anc_acc": "5.282e-01", "epoch": 0.06914} {"step": 34575, "loss": 0.9963, "grad_norm": "7.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.556e-01", "anc_acc": "5.267e-01", "epoch": 0.06915} {"step": 34580, "loss": 1.1087, "grad_norm": "5.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.385e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.159e-01", "anc_acc": "4.861e-01", "epoch": 0.06916} {"step": 34585, "loss": 0.9462, "grad_norm": "3.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.321e+00", "anc_loss": "1.390e+00", "dlm_acc": "4.377e-01", "anc_acc": "4.172e-01", "epoch": 0.06917} {"step": 34590, "loss": 0.8155, "grad_norm": "4.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.231e+00", "anc_loss": "1.389e+00", "dlm_acc": "5.746e-01", "anc_acc": "5.280e-01", "epoch": 0.06918} {"step": 34595, "loss": 0.547, "grad_norm": "3.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.239e+00", "dlm_acc": "4.979e-01", "anc_acc": "4.780e-01", "epoch": 0.06919} {"step": 34600, "loss": 1.1309, "grad_norm": "2.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.313e+00", "dlm_acc": "5.957e-01", "anc_acc": "5.646e-01", "epoch": 0.0692} {"step": 34605, "loss": 0.979, "grad_norm": "4.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.211e+00", "dlm_acc": "5.426e-01", "anc_acc": "5.187e-01", "epoch": 0.06921} {"step": 34610, "loss": 1.1989, "grad_norm": "1.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.435e+00", "anc_loss": "1.551e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.181e-01", "epoch": 0.06922} {"step": 34615, "loss": 0.7153, "grad_norm": "9.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.395e-01", "anc_loss": "7.168e-01", "dlm_acc": "6.942e-01", "anc_acc": "6.692e-01", "epoch": 0.06923} {"step": 34620, "loss": 0.8885, "grad_norm": "2.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.445e-01", "anc_loss": "1.083e+00", "dlm_acc": "6.224e-01", "anc_acc": "5.826e-01", "epoch": 0.06924} {"step": 34625, "loss": 0.9638, "grad_norm": "4.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.734e-01", "anc_loss": "1.091e+00", "dlm_acc": "5.864e-01", "anc_acc": "5.520e-01", "epoch": 0.06925} {"step": 34630, "loss": 1.0917, "grad_norm": "3.220e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.707e-01", "anc_acc": "5.406e-01", "epoch": 0.06926} {"step": 34635, "loss": 1.0323, "grad_norm": "3.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.891e-01", "anc_loss": "1.065e+00", "dlm_acc": "6.556e-01", "anc_acc": "5.958e-01", "epoch": 0.06927} {"step": 34640, "loss": 1.2467, "grad_norm": "9.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.701e-01", "anc_acc": "5.230e-01", "epoch": 0.06928} {"step": 34645, "loss": 1.2282, "grad_norm": "3.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.741e+00", "dlm_acc": "3.970e-01", "anc_acc": "3.646e-01", "epoch": 0.06929} {"step": 34650, "loss": 1.0591, "grad_norm": "4.846e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.288e-01", "epoch": 0.0693} {"step": 34655, "loss": 1.0325, "grad_norm": "2.114e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.164e+00", "dlm_acc": "5.852e-01", "anc_acc": "5.475e-01", "epoch": 0.06931} {"step": 34660, "loss": 1.0757, "grad_norm": "4.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.620e-01", "anc_acc": "5.321e-01", "epoch": 0.06932} {"step": 34665, "loss": 1.3146, "grad_norm": "5.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.437e+00", "dlm_acc": "5.317e-01", "anc_acc": "4.952e-01", "epoch": 0.06933} {"step": 34670, "loss": 1.2319, "grad_norm": "5.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.610e-01", "anc_acc": "5.285e-01", "epoch": 0.06934} {"step": 34675, "loss": 0.8316, "grad_norm": "4.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.258e-01", "anc_loss": "9.648e-01", "dlm_acc": "5.726e-01", "anc_acc": "5.234e-01", "epoch": 0.06935} {"step": 34680, "loss": 1.2803, "grad_norm": "3.670e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.512e+00", "dlm_acc": "4.520e-01", "anc_acc": "4.168e-01", "epoch": 0.06936} {"step": 34685, "loss": 0.6714, "grad_norm": "2.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.379e-01", "anc_loss": "7.059e-01", "dlm_acc": "7.607e-01", "anc_acc": "7.242e-01", "epoch": 0.06937} {"step": 34690, "loss": 1.3068, "grad_norm": "5.095e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.844e-01", "anc_loss": "1.041e+00", "dlm_acc": "7.080e-01", "anc_acc": "6.486e-01", "epoch": 0.06938} {"step": 34695, "loss": 1.1038, "grad_norm": "4.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.804e-01", "anc_acc": "5.484e-01", "epoch": 0.06939} {"step": 34700, "loss": 1.0846, "grad_norm": "2.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.552e+00", "dlm_acc": "4.510e-01", "anc_acc": "4.284e-01", "epoch": 0.0694} {"step": 34705, "loss": 1.1918, "grad_norm": "3.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.250e+00", "dlm_acc": "6.082e-01", "anc_acc": "5.508e-01", "epoch": 0.06941} {"step": 34710, "loss": 0.91, "grad_norm": "3.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.250e-01", "anc_loss": "1.032e+00", "dlm_acc": "6.208e-01", "anc_acc": "5.832e-01", "epoch": 0.06942} {"step": 34715, "loss": 1.1446, "grad_norm": "3.456e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.859e-01", "anc_acc": "5.518e-01", "epoch": 0.06943} {"step": 34720, "loss": 1.0731, "grad_norm": "3.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.146e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.728e-01", "anc_acc": "5.246e-01", "epoch": 0.06944} {"step": 34725, "loss": 1.2156, "grad_norm": "2.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.379e+00", "dlm_acc": "5.743e-01", "anc_acc": "5.364e-01", "epoch": 0.06945} {"step": 34730, "loss": 1.3647, "grad_norm": "3.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.755e+00", "anc_loss": "1.829e+00", "dlm_acc": "3.057e-01", "anc_acc": "2.903e-01", "epoch": 0.06946} {"step": 34735, "loss": 1.7942, "grad_norm": "1.189e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.991e+00", "anc_loss": "2.028e+00", "dlm_acc": "2.994e-01", "anc_acc": "2.867e-01", "epoch": 0.06947} {"step": 34740, "loss": 1.8531, "grad_norm": "4.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.375e+00", "anc_loss": "2.475e+00", "dlm_acc": "2.216e-01", "anc_acc": "2.001e-01", "epoch": 0.06948} {"step": 34745, "loss": 1.0698, "grad_norm": "3.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.408e-01", "anc_loss": "3.563e-01", "dlm_acc": "7.217e-01", "anc_acc": "7.121e-01", "epoch": 0.06949} {"step": 34750, "loss": 1.4638, "grad_norm": "3.119e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.844e-01", "anc_acc": "5.558e-01", "epoch": 0.0695} {"step": 34755, "loss": 1.062, "grad_norm": "2.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.835e-01", "anc_loss": "8.547e-01", "dlm_acc": "7.086e-01", "anc_acc": "6.919e-01", "epoch": 0.06951} {"step": 34760, "loss": 1.7311, "grad_norm": "1.039e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.652e+00", "anc_loss": "1.769e+00", "dlm_acc": "4.711e-01", "anc_acc": "4.479e-01", "epoch": 0.06952} {"step": 34765, "loss": 1.4006, "grad_norm": "3.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.944e-01", "anc_acc": "5.753e-01", "epoch": 0.06953} {"step": 34770, "loss": 1.0227, "grad_norm": "3.358e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.571e-01", "anc_acc": "5.300e-01", "epoch": 0.06954} {"step": 34775, "loss": 1.2822, "grad_norm": "4.487e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.352e-01", "anc_loss": "8.109e-01", "dlm_acc": "6.464e-01", "anc_acc": "6.274e-01", "epoch": 0.06955} {"step": 34780, "loss": 1.824, "grad_norm": "3.325e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.863e+00", "anc_loss": "1.988e+00", "dlm_acc": "4.630e-01", "anc_acc": "4.390e-01", "epoch": 0.06956} {"step": 34785, "loss": 1.1111, "grad_norm": "2.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.035e-01", "anc_loss": "1.000e+00", "dlm_acc": "6.153e-01", "anc_acc": "5.876e-01", "epoch": 0.06957} {"step": 34790, "loss": 1.2317, "grad_norm": "5.132e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.750e-01", "anc_loss": "9.828e-01", "dlm_acc": "6.345e-01", "anc_acc": "6.090e-01", "epoch": 0.06958} {"step": 34795, "loss": 1.3369, "grad_norm": "3.762e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.161e-01", "anc_loss": "6.600e-01", "dlm_acc": "7.884e-01", "anc_acc": "7.698e-01", "epoch": 0.06959} {"step": 34800, "loss": 1.3407, "grad_norm": "4.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.090e+00", "dlm_acc": "6.016e-01", "anc_acc": "5.857e-01", "epoch": 0.0696} {"step": 34805, "loss": 1.5353, "grad_norm": "3.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.630e-01", "anc_acc": "5.350e-01", "epoch": 0.06961} {"step": 34810, "loss": 1.1475, "grad_norm": "4.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.238e+00", "dlm_acc": "5.392e-01", "anc_acc": "5.188e-01", "epoch": 0.06962} {"step": 34815, "loss": 1.3101, "grad_norm": "2.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.973e-01", "anc_loss": "9.602e-01", "dlm_acc": "4.707e-01", "anc_acc": "4.524e-01", "epoch": 0.06963} {"step": 34820, "loss": 1.6978, "grad_norm": "5.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.621e+00", "dlm_acc": "5.203e-01", "anc_acc": "4.948e-01", "epoch": 0.06964} {"step": 34825, "loss": 0.9503, "grad_norm": "3.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.430e-01", "anc_loss": "2.836e-01", "dlm_acc": "8.814e-01", "anc_acc": "8.669e-01", "epoch": 0.06965} {"step": 34830, "loss": 1.7285, "grad_norm": "4.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.112e+00", "anc_loss": "1.191e+00", "dlm_acc": "6.440e-01", "anc_acc": "6.255e-01", "epoch": 0.06966} {"step": 34835, "loss": 1.4874, "grad_norm": "4.245e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.248e-01", "anc_loss": "5.986e-01", "dlm_acc": "7.741e-01", "anc_acc": "7.501e-01", "epoch": 0.06967} {"step": 34840, "loss": 0.78, "grad_norm": "6.339e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.254e-01", "anc_loss": "6.752e-01", "dlm_acc": "6.787e-01", "anc_acc": "6.643e-01", "epoch": 0.06968} {"step": 34845, "loss": 0.9732, "grad_norm": "4.331e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.300e-01", "anc_loss": "4.632e-01", "dlm_acc": "8.198e-01", "anc_acc": "8.110e-01", "epoch": 0.06969} {"step": 34850, "loss": 1.0806, "grad_norm": "2.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.176e-01", "anc_loss": "8.082e-01", "dlm_acc": "7.620e-01", "anc_acc": "7.407e-01", "epoch": 0.0697} {"step": 34855, "loss": 1.2482, "grad_norm": "2.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.326e-01", "anc_acc": "5.104e-01", "epoch": 0.06971} {"step": 34860, "loss": 1.3241, "grad_norm": "2.731e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.255e+00", "dlm_acc": "5.558e-01", "anc_acc": "5.337e-01", "epoch": 0.06972} {"step": 34865, "loss": 0.9646, "grad_norm": "2.792e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.544e-01", "anc_loss": "1.848e-01", "dlm_acc": "9.027e-01", "anc_acc": "8.850e-01", "epoch": 0.06973} {"step": 34870, "loss": 1.0133, "grad_norm": "3.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e-01", "anc_loss": "1.842e-01", "dlm_acc": "9.086e-01", "anc_acc": "8.824e-01", "epoch": 0.06974} {"step": 34875, "loss": 0.8692, "grad_norm": "2.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.341e-01", "anc_loss": "1.686e-01", "dlm_acc": "9.146e-01", "anc_acc": "8.923e-01", "epoch": 0.06975} {"step": 34880, "loss": 1.1391, "grad_norm": "7.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.422e-01", "anc_loss": "8.656e-01", "dlm_acc": "5.498e-01", "anc_acc": "5.400e-01", "epoch": 0.06976} {"step": 34885, "loss": 0.8407, "grad_norm": "2.136e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.211e-01", "anc_loss": "5.234e-01", "dlm_acc": "5.727e-01", "anc_acc": "5.722e-01", "epoch": 0.06977} {"step": 34890, "loss": 1.2503, "grad_norm": "4.969e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.047e-01", "anc_loss": "8.531e-01", "dlm_acc": "6.466e-01", "anc_acc": "6.328e-01", "epoch": 0.06978} {"step": 34895, "loss": 1.0995, "grad_norm": "2.075e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.797e-01", "anc_loss": "8.461e-01", "dlm_acc": "6.506e-01", "anc_acc": "6.324e-01", "epoch": 0.06979} {"step": 34900, "loss": 1.6614, "grad_norm": "6.258e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.192e-01", "anc_loss": "2.421e-01", "dlm_acc": "8.517e-01", "anc_acc": "8.419e-01", "epoch": 0.0698} {"step": 34905, "loss": 1.4886, "grad_norm": "3.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.107e-02", "anc_loss": "7.448e-02", "dlm_acc": "9.711e-01", "anc_acc": "9.657e-01", "epoch": 0.06981} {"step": 34910, "loss": 0.7619, "grad_norm": "1.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e-02", "anc_loss": "2.104e-02", "dlm_acc": "9.916e-01", "anc_acc": "9.874e-01", "epoch": 0.06982} {"step": 34915, "loss": 0.7511, "grad_norm": "3.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.910e-03", "anc_loss": "1.000e-02", "dlm_acc": "9.980e-01", "anc_acc": "9.965e-01", "epoch": 0.06983} {"step": 34920, "loss": 0.816, "grad_norm": "2.149e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.825e-04", "anc_loss": "1.839e-02", "dlm_acc": "9.998e-01", "anc_acc": "9.934e-01", "epoch": 0.06984} {"step": 34925, "loss": 0.9006, "grad_norm": "3.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.768e-01", "anc_loss": "6.191e-01", "dlm_acc": "8.031e-01", "anc_acc": "7.899e-01", "epoch": 0.06985} {"step": 34930, "loss": 0.968, "grad_norm": "2.083e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.328e-01", "anc_loss": "8.950e-01", "dlm_acc": "6.903e-01", "anc_acc": "6.724e-01", "epoch": 0.06986} {"step": 34935, "loss": 0.7903, "grad_norm": "2.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.229e-01", "anc_loss": "2.533e-01", "dlm_acc": "8.852e-01", "anc_acc": "8.765e-01", "epoch": 0.06987} {"step": 34940, "loss": 1.1964, "grad_norm": "7.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.822e+00", "anc_loss": "1.940e+00", "dlm_acc": "5.239e-01", "anc_acc": "5.030e-01", "epoch": 0.06988} {"step": 34945, "loss": 0.9159, "grad_norm": "3.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.508e-01", "anc_loss": "1.053e+00", "dlm_acc": "6.529e-01", "anc_acc": "6.296e-01", "epoch": 0.06989} {"step": 34950, "loss": 1.2411, "grad_norm": "4.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.137e-01", "anc_loss": "7.625e-01", "dlm_acc": "5.685e-01", "anc_acc": "5.541e-01", "epoch": 0.0699} {"step": 34955, "loss": 1.0715, "grad_norm": "3.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.852e-01", "anc_loss": "8.734e-01", "dlm_acc": "6.831e-01", "anc_acc": "6.570e-01", "epoch": 0.06991} {"step": 34960, "loss": 0.8697, "grad_norm": "3.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.534e-01", "anc_loss": "6.248e-01", "dlm_acc": "7.785e-01", "anc_acc": "7.538e-01", "epoch": 0.06992} {"step": 34965, "loss": 1.2428, "grad_norm": "5.330e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e+00", "anc_loss": "1.745e+00", "dlm_acc": "4.918e-01", "anc_acc": "4.707e-01", "epoch": 0.06993} {"step": 34970, "loss": 0.8065, "grad_norm": "2.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.054e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.287e-01", "anc_acc": "6.023e-01", "epoch": 0.06994} {"step": 34975, "loss": 0.9501, "grad_norm": "3.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.700e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.002e-01", "epoch": 0.06995} {"step": 34980, "loss": 0.9037, "grad_norm": "4.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.254e+00", "dlm_acc": "6.096e-01", "anc_acc": "5.819e-01", "epoch": 0.06996} {"step": 34985, "loss": 0.9882, "grad_norm": "3.321e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.269e+00", "anc_loss": "1.376e+00", "dlm_acc": "5.755e-01", "anc_acc": "5.518e-01", "epoch": 0.06997} {"step": 34990, "loss": 1.322, "grad_norm": "3.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.539e+00", "anc_loss": "1.655e+00", "dlm_acc": "5.065e-01", "anc_acc": "4.808e-01", "epoch": 0.06998} {"step": 34995, "loss": 0.902, "grad_norm": "2.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.169e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.559e-01", "anc_acc": "5.276e-01", "epoch": 0.06999} {"step": 35000, "loss": 1.2382, "grad_norm": "3.914e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.832e-01", "anc_loss": "9.281e-01", "dlm_acc": "7.112e-01", "anc_acc": "6.739e-01", "epoch": 0.07} {"step": 35005, "loss": 1.1367, "grad_norm": "3.545e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.250e-01", "anc_loss": "8.348e-01", "dlm_acc": "7.019e-01", "anc_acc": "6.700e-01", "epoch": 0.07001} {"step": 35010, "loss": 1.3649, "grad_norm": "4.434e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.427e-01", "anc_acc": "5.176e-01", "epoch": 0.07002} {"step": 35015, "loss": 1.0425, "grad_norm": "1.271e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.458e+00", "dlm_acc": "5.461e-01", "anc_acc": "5.180e-01", "epoch": 0.07003} {"step": 35020, "loss": 1.3442, "grad_norm": "3.845e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.144e-01", "anc_acc": "4.936e-01", "epoch": 0.07004} {"step": 35025, "loss": 1.7342, "grad_norm": "3.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.600e+00", "dlm_acc": "5.339e-01", "anc_acc": "5.016e-01", "epoch": 0.07005} {"step": 35030, "loss": 1.2864, "grad_norm": "2.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.770e-01", "anc_loss": "8.812e-01", "dlm_acc": "7.128e-01", "anc_acc": "6.817e-01", "epoch": 0.07006} {"step": 35035, "loss": 0.9817, "grad_norm": "2.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.987e-01", "anc_acc": "5.703e-01", "epoch": 0.07007} {"step": 35040, "loss": 1.2121, "grad_norm": "3.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.194e+00", "anc_loss": "1.301e+00", "dlm_acc": "5.453e-01", "anc_acc": "5.174e-01", "epoch": 0.07008} {"step": 35045, "loss": 1.4741, "grad_norm": "6.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.728e+00", "anc_loss": "1.833e+00", "dlm_acc": "4.568e-01", "anc_acc": "4.333e-01", "epoch": 0.07009} {"step": 35050, "loss": 1.6762, "grad_norm": "3.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.580e+00", "anc_loss": "2.631e+00", "dlm_acc": "1.252e-01", "anc_acc": "1.193e-01", "epoch": 0.0701} {"step": 35055, "loss": 1.2888, "grad_norm": "3.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.450e+00", "dlm_acc": "5.399e-01", "anc_acc": "5.136e-01", "epoch": 0.07011} {"step": 35060, "loss": 1.2057, "grad_norm": "3.042e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.557e+00", "anc_loss": "1.694e+00", "dlm_acc": "5.070e-01", "anc_acc": "4.763e-01", "epoch": 0.07012} {"step": 35065, "loss": 0.9138, "grad_norm": "3.717e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.301e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.528e-01", "anc_acc": "5.229e-01", "epoch": 0.07013} {"step": 35070, "loss": 0.958, "grad_norm": "2.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.232e+00", "dlm_acc": "5.410e-01", "anc_acc": "5.167e-01", "epoch": 0.07014} {"step": 35075, "loss": 1.234, "grad_norm": "3.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.622e+00", "anc_loss": "1.797e+00", "dlm_acc": "5.737e-01", "anc_acc": "5.598e-01", "epoch": 0.07015} {"step": 35080, "loss": 1.1934, "grad_norm": "3.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.369e+00", "anc_loss": "1.492e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.193e-01", "epoch": 0.07016} {"step": 35085, "loss": 1.2672, "grad_norm": "4.879e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.270e+00", "dlm_acc": "5.928e-01", "anc_acc": "5.750e-01", "epoch": 0.07017} {"step": 35090, "loss": 1.4384, "grad_norm": "4.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.523e+00", "anc_loss": "1.634e+00", "dlm_acc": "5.121e-01", "anc_acc": "4.871e-01", "epoch": 0.07018} {"step": 35095, "loss": 1.0022, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.169e+00", "anc_loss": "1.237e+00", "dlm_acc": "4.745e-01", "anc_acc": "4.566e-01", "epoch": 0.07019} {"step": 35100, "loss": 1.071, "grad_norm": "2.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.965e-01", "anc_loss": "1.089e+00", "dlm_acc": "6.198e-01", "anc_acc": "5.959e-01", "epoch": 0.0702} {"step": 35105, "loss": 0.6027, "grad_norm": "1.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.324e-01", "anc_loss": "3.600e-01", "dlm_acc": "7.831e-01", "anc_acc": "7.739e-01", "epoch": 0.07021} {"step": 35110, "loss": 1.0889, "grad_norm": "3.650e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.292e-01", "epoch": 0.07022} {"step": 35115, "loss": 0.9581, "grad_norm": "2.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.539e-01", "anc_loss": "9.789e-01", "dlm_acc": "4.052e-01", "anc_acc": "3.981e-01", "epoch": 0.07023} {"step": 35120, "loss": 1.3353, "grad_norm": "3.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.535e+00", "dlm_acc": "5.104e-01", "anc_acc": "4.859e-01", "epoch": 0.07024} {"step": 35125, "loss": 2.112, "grad_norm": "6.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.806e+00", "anc_loss": "1.969e+00", "dlm_acc": "5.079e-01", "anc_acc": "4.769e-01", "epoch": 0.07025} {"step": 35130, "loss": 1.5915, "grad_norm": "2.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.614e+00", "anc_loss": "1.742e+00", "dlm_acc": "4.951e-01", "anc_acc": "4.677e-01", "epoch": 0.07026} {"step": 35135, "loss": 1.0944, "grad_norm": "2.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.273e-01", "anc_loss": "1.021e+00", "dlm_acc": "5.896e-01", "anc_acc": "5.646e-01", "epoch": 0.07027} {"step": 35140, "loss": 1.3062, "grad_norm": "5.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.276e+00", "anc_loss": "1.383e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.349e-01", "epoch": 0.07028} {"step": 35145, "loss": 1.2775, "grad_norm": "3.353e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.889e-01", "anc_loss": "8.973e-01", "dlm_acc": "6.557e-01", "anc_acc": "6.224e-01", "epoch": 0.07029} {"step": 35150, "loss": 1.577, "grad_norm": "2.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.654e-01", "anc_acc": "5.416e-01", "epoch": 0.0703} {"step": 35155, "loss": 1.3173, "grad_norm": "5.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.788e+00", "anc_loss": "1.886e+00", "dlm_acc": "3.840e-01", "anc_acc": "3.633e-01", "epoch": 0.07031} {"step": 35160, "loss": 1.29, "grad_norm": "4.955e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.724e-01", "anc_acc": "5.351e-01", "epoch": 0.07032} {"step": 35165, "loss": 1.1277, "grad_norm": "4.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.931e-01", "anc_acc": "5.514e-01", "epoch": 0.07033} {"step": 35170, "loss": 1.0688, "grad_norm": "2.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.041e+00", "anc_loss": "1.158e+00", "dlm_acc": "5.949e-01", "anc_acc": "5.645e-01", "epoch": 0.07034} {"step": 35175, "loss": 1.06, "grad_norm": "2.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.246e+00", "dlm_acc": "5.227e-01", "anc_acc": "4.851e-01", "epoch": 0.07035} {"step": 35180, "loss": 1.0505, "grad_norm": "2.673e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.832e-01", "anc_loss": "9.770e-01", "dlm_acc": "6.487e-01", "anc_acc": "6.229e-01", "epoch": 0.07036} {"step": 35185, "loss": 1.0584, "grad_norm": "3.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.117e-01", "anc_loss": "5.352e-01", "dlm_acc": "6.196e-01", "anc_acc": "6.050e-01", "epoch": 0.07037} {"step": 35190, "loss": 0.5692, "grad_norm": "3.604e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.270e-01", "anc_loss": "5.527e-01", "dlm_acc": "6.451e-01", "anc_acc": "6.344e-01", "epoch": 0.07038} {"step": 35195, "loss": 1.1556, "grad_norm": "2.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.199e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.357e-01", "anc_acc": "5.142e-01", "epoch": 0.07039} {"step": 35200, "loss": 1.3983, "grad_norm": "2.667e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.664e+00", "dlm_acc": "4.335e-01", "anc_acc": "4.052e-01", "epoch": 0.0704} {"step": 35205, "loss": 1.2319, "grad_norm": "3.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.797e+00", "anc_loss": "1.887e+00", "dlm_acc": "3.596e-01", "anc_acc": "3.349e-01", "epoch": 0.07041} {"step": 35210, "loss": 0.8116, "grad_norm": "2.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.488e-01", "anc_loss": "8.449e-01", "dlm_acc": "6.807e-01", "anc_acc": "6.521e-01", "epoch": 0.07042} {"step": 35215, "loss": 1.1524, "grad_norm": "3.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.190e+00", "dlm_acc": "6.368e-01", "anc_acc": "6.161e-01", "epoch": 0.07043} {"step": 35220, "loss": 1.0336, "grad_norm": "5.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.688e-01", "anc_loss": "9.371e-01", "dlm_acc": "7.106e-01", "anc_acc": "6.595e-01", "epoch": 0.07044} {"step": 35225, "loss": 1.2435, "grad_norm": "2.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.375e+00", "dlm_acc": "5.386e-01", "anc_acc": "5.154e-01", "epoch": 0.07045} {"step": 35230, "loss": 1.3417, "grad_norm": "3.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.280e+00", "dlm_acc": "6.032e-01", "anc_acc": "5.772e-01", "epoch": 0.07046} {"step": 35235, "loss": 1.4767, "grad_norm": "3.174e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.621e+00", "anc_loss": "1.698e+00", "dlm_acc": "4.951e-01", "anc_acc": "4.707e-01", "epoch": 0.07047} {"step": 35240, "loss": 0.8438, "grad_norm": "1.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.063e+00", "anc_loss": "1.163e+00", "dlm_acc": "6.011e-01", "anc_acc": "5.728e-01", "epoch": 0.07048} {"step": 35245, "loss": 0.9428, "grad_norm": "2.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.213e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.493e-01", "epoch": 0.07049} {"step": 35250, "loss": 1.5358, "grad_norm": "4.491e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.619e+00", "anc_loss": "1.758e+00", "dlm_acc": "5.059e-01", "anc_acc": "4.753e-01", "epoch": 0.0705} {"step": 35255, "loss": 1.4778, "grad_norm": "3.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.434e-01", "anc_acc": "5.015e-01", "epoch": 0.07051} {"step": 35260, "loss": 1.0656, "grad_norm": "3.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.246e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.216e-01", "epoch": 0.07052} {"step": 35265, "loss": 0.9892, "grad_norm": "3.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.268e+00", "dlm_acc": "5.947e-01", "anc_acc": "5.591e-01", "epoch": 0.07053} {"step": 35270, "loss": 0.7876, "grad_norm": "3.434e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.850e-01", "anc_loss": "8.135e-01", "dlm_acc": "6.062e-01", "anc_acc": "5.973e-01", "epoch": 0.07054} {"step": 35275, "loss": 1.1215, "grad_norm": "4.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.490e-01", "anc_loss": "3.799e-01", "dlm_acc": "7.729e-01", "anc_acc": "7.604e-01", "epoch": 0.07055} {"step": 35280, "loss": 0.9413, "grad_norm": "4.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.023e-01", "anc_loss": "3.195e-01", "dlm_acc": "7.732e-01", "anc_acc": "7.657e-01", "epoch": 0.07056} {"step": 35285, "loss": 0.7783, "grad_norm": "2.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.541e-01", "anc_loss": "2.775e-01", "dlm_acc": "8.302e-01", "anc_acc": "8.179e-01", "epoch": 0.07057} {"step": 35290, "loss": 0.8578, "grad_norm": "6.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.343e-01", "anc_loss": "8.806e-01", "dlm_acc": "7.442e-01", "anc_acc": "7.322e-01", "epoch": 0.07058} {"step": 35295, "loss": 1.1176, "grad_norm": "4.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.604e-01", "anc_acc": "5.100e-01", "epoch": 0.07059} {"step": 35300, "loss": 1.2294, "grad_norm": "3.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.076e+00", "anc_loss": "1.183e+00", "dlm_acc": "5.967e-01", "anc_acc": "5.689e-01", "epoch": 0.0706} {"step": 35305, "loss": 1.0139, "grad_norm": "3.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.938e-01", "anc_loss": "1.115e+00", "dlm_acc": "6.235e-01", "anc_acc": "5.888e-01", "epoch": 0.07061} {"step": 35310, "loss": 1.3661, "grad_norm": "3.271e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.372e-01", "anc_acc": "5.048e-01", "epoch": 0.07062} {"step": 35315, "loss": 1.1034, "grad_norm": "3.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.166e+00", "dlm_acc": "6.086e-01", "anc_acc": "5.687e-01", "epoch": 0.07063} {"step": 35320, "loss": 1.2278, "grad_norm": "4.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.533e-01", "anc_acc": "5.074e-01", "epoch": 0.07064} {"step": 35325, "loss": 1.5181, "grad_norm": "4.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.605e+00", "dlm_acc": "5.745e-01", "anc_acc": "5.473e-01", "epoch": 0.07065} {"step": 35330, "loss": 1.3454, "grad_norm": "3.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.404e+00", "dlm_acc": "5.450e-01", "anc_acc": "5.025e-01", "epoch": 0.07066} {"step": 35335, "loss": 1.2063, "grad_norm": "3.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.395e-01", "anc_loss": "1.113e+00", "dlm_acc": "6.281e-01", "anc_acc": "5.679e-01", "epoch": 0.07067} {"step": 35340, "loss": 1.2878, "grad_norm": "3.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.506e+00", "dlm_acc": "5.193e-01", "anc_acc": "4.879e-01", "epoch": 0.07068} {"step": 35345, "loss": 1.3054, "grad_norm": "4.753e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.589e+00", "dlm_acc": "5.097e-01", "anc_acc": "4.830e-01", "epoch": 0.07069} {"step": 35350, "loss": 1.4338, "grad_norm": "5.511e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.089e-01", "anc_acc": "4.873e-01", "epoch": 0.0707} {"step": 35355, "loss": 0.8415, "grad_norm": "1.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.770e-01", "anc_loss": "9.293e-01", "dlm_acc": "6.254e-01", "anc_acc": "6.118e-01", "epoch": 0.07071} {"step": 35360, "loss": 1.2657, "grad_norm": "3.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.453e+00", "anc_loss": "1.536e+00", "dlm_acc": "4.804e-01", "anc_acc": "4.630e-01", "epoch": 0.07072} {"step": 35365, "loss": 1.0085, "grad_norm": "3.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.981e-01", "anc_loss": "1.090e+00", "dlm_acc": "6.438e-01", "anc_acc": "6.187e-01", "epoch": 0.07073} {"step": 35370, "loss": 1.2768, "grad_norm": "4.436e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.663e+00", "anc_loss": "1.778e+00", "dlm_acc": "4.890e-01", "anc_acc": "4.650e-01", "epoch": 0.07074} {"step": 35375, "loss": 1.2282, "grad_norm": "2.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.098e-01", "anc_loss": "6.449e-01", "dlm_acc": "5.992e-01", "anc_acc": "5.866e-01", "epoch": 0.07075} {"step": 35380, "loss": 1.0201, "grad_norm": "3.089e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.355e-01", "anc_loss": "5.484e-01", "dlm_acc": "6.028e-01", "anc_acc": "5.994e-01", "epoch": 0.07076} {"step": 35385, "loss": 1.4115, "grad_norm": "3.352e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.371e-01", "anc_loss": "9.918e-01", "dlm_acc": "5.599e-01", "anc_acc": "5.443e-01", "epoch": 0.07077} {"step": 35390, "loss": 1.3681, "grad_norm": "3.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.646e-01", "anc_acc": "5.395e-01", "epoch": 0.07078} {"step": 35395, "loss": 1.2127, "grad_norm": "3.696e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.957e-01", "anc_loss": "9.898e-01", "dlm_acc": "6.826e-01", "anc_acc": "6.629e-01", "epoch": 0.07079} {"step": 35400, "loss": 1.5711, "grad_norm": "9.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.494e+00", "anc_loss": "1.614e+00", "dlm_acc": "5.084e-01", "anc_acc": "4.840e-01", "epoch": 0.0708} {"step": 35405, "loss": 1.4598, "grad_norm": "6.408e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.539e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.315e-01", "anc_acc": "5.065e-01", "epoch": 0.07081} {"step": 35410, "loss": 1.058, "grad_norm": "3.696e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.157e+00", "dlm_acc": "5.151e-01", "anc_acc": "4.885e-01", "epoch": 0.07082} {"step": 35415, "loss": 1.388, "grad_norm": "2.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.501e+00", "anc_loss": "1.657e+00", "dlm_acc": "5.213e-01", "anc_acc": "4.953e-01", "epoch": 0.07083} {"step": 35420, "loss": 1.4039, "grad_norm": "3.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.587e+00", "anc_loss": "1.698e+00", "dlm_acc": "4.976e-01", "anc_acc": "4.720e-01", "epoch": 0.07084} {"step": 35425, "loss": 1.2591, "grad_norm": "4.174e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.474e-01", "anc_acc": "5.178e-01", "epoch": 0.07085} {"step": 35430, "loss": 1.253, "grad_norm": "4.569e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.229e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.720e-01", "anc_acc": "5.461e-01", "epoch": 0.07086} {"step": 35435, "loss": 1.7971, "grad_norm": "2.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.695e+00", "anc_loss": "1.801e+00", "dlm_acc": "4.336e-01", "anc_acc": "4.125e-01", "epoch": 0.07087} {"step": 35440, "loss": 1.6566, "grad_norm": "3.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.563e-01", "anc_loss": "1.059e+00", "dlm_acc": "6.608e-01", "anc_acc": "6.340e-01", "epoch": 0.07088} {"step": 35445, "loss": 1.0122, "grad_norm": "4.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.199e+00", "anc_loss": "1.323e+00", "dlm_acc": "5.935e-01", "anc_acc": "5.632e-01", "epoch": 0.07089} {"step": 35450, "loss": 1.2046, "grad_norm": "3.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.638e+00", "dlm_acc": "5.366e-01", "anc_acc": "5.065e-01", "epoch": 0.0709} {"step": 35455, "loss": 0.9352, "grad_norm": "2.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.929e-01", "anc_acc": "5.651e-01", "epoch": 0.07091} {"step": 35460, "loss": 1.2504, "grad_norm": "3.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.394e-01", "epoch": 0.07092} {"step": 35465, "loss": 1.3651, "grad_norm": "2.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.541e+00", "anc_loss": "1.639e+00", "dlm_acc": "4.688e-01", "anc_acc": "4.480e-01", "epoch": 0.07093} {"step": 35470, "loss": 1.4164, "grad_norm": "5.085e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.531e+00", "anc_loss": "1.654e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.311e-01", "epoch": 0.07094} {"step": 35475, "loss": 1.4326, "grad_norm": "6.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.582e+00", "dlm_acc": "5.182e-01", "anc_acc": "4.926e-01", "epoch": 0.07095} {"step": 35480, "loss": 1.0369, "grad_norm": "1.986e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.231e+00", "anc_loss": "1.381e+00", "dlm_acc": "6.011e-01", "anc_acc": "5.696e-01", "epoch": 0.07096} {"step": 35485, "loss": 1.1982, "grad_norm": "2.436e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.684e+00", "anc_loss": "1.920e+00", "dlm_acc": "4.665e-01", "anc_acc": "4.418e-01", "epoch": 0.07097} {"step": 35490, "loss": 1.3285, "grad_norm": "2.945e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.884e+00", "anc_loss": "2.000e+00", "dlm_acc": "4.117e-01", "anc_acc": "3.867e-01", "epoch": 0.07098} {"step": 35495, "loss": 1.1571, "grad_norm": "3.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.146e-01", "anc_acc": "4.907e-01", "epoch": 0.07099} {"step": 35500, "loss": 1.1448, "grad_norm": "2.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.286e+00", "dlm_acc": "5.890e-01", "anc_acc": "5.595e-01", "epoch": 0.071} {"step": 35505, "loss": 1.1594, "grad_norm": "2.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.223e+00", "dlm_acc": "4.317e-01", "anc_acc": "4.220e-01", "epoch": 0.07101} {"step": 35510, "loss": 1.7035, "grad_norm": "5.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.048e-01", "anc_acc": "4.870e-01", "epoch": 0.07102} {"step": 35515, "loss": 1.2371, "grad_norm": "3.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.090e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.254e-01", "epoch": 0.07103} {"step": 35520, "loss": 1.2477, "grad_norm": "3.231e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.160e+00", "dlm_acc": "5.886e-01", "anc_acc": "5.514e-01", "epoch": 0.07104} {"step": 35525, "loss": 1.5246, "grad_norm": "5.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.124e-01", "anc_acc": "4.708e-01", "epoch": 0.07105} {"step": 35530, "loss": 1.2107, "grad_norm": "3.629e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.195e-01", "anc_loss": "1.025e+00", "dlm_acc": "6.878e-01", "anc_acc": "6.646e-01", "epoch": 0.07106} {"step": 35535, "loss": 1.111, "grad_norm": "1.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.282e-01", "anc_acc": "4.998e-01", "epoch": 0.07107} {"step": 35540, "loss": 1.3856, "grad_norm": "5.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.375e+00", "dlm_acc": "5.733e-01", "anc_acc": "5.405e-01", "epoch": 0.07108} {"step": 35545, "loss": 1.1789, "grad_norm": "4.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.777e+00", "anc_loss": "1.884e+00", "dlm_acc": "3.500e-01", "anc_acc": "3.222e-01", "epoch": 0.07109} {"step": 35550, "loss": 1.4687, "grad_norm": "2.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.332e+00", "anc_loss": "1.432e+00", "dlm_acc": "5.274e-01", "anc_acc": "5.039e-01", "epoch": 0.0711} {"step": 35555, "loss": 1.1183, "grad_norm": "3.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.370e+00", "anc_loss": "1.497e+00", "dlm_acc": "5.325e-01", "anc_acc": "4.981e-01", "epoch": 0.07111} {"step": 35560, "loss": 1.4645, "grad_norm": "3.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.294e-01", "anc_acc": "4.930e-01", "epoch": 0.07112} {"step": 35565, "loss": 1.3687, "grad_norm": "2.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.179e+00", "dlm_acc": "6.476e-01", "anc_acc": "6.076e-01", "epoch": 0.07113} {"step": 35570, "loss": 1.2173, "grad_norm": "6.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.419e+00", "dlm_acc": "5.492e-01", "anc_acc": "5.269e-01", "epoch": 0.07114} {"step": 35575, "loss": 1.104, "grad_norm": "5.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.344e-01", "anc_loss": "7.953e-01", "dlm_acc": "5.841e-01", "anc_acc": "5.662e-01", "epoch": 0.07115} {"step": 35580, "loss": 1.0053, "grad_norm": "3.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.164e-01", "anc_loss": "6.953e-01", "dlm_acc": "6.563e-01", "anc_acc": "6.321e-01", "epoch": 0.07116} {"step": 35585, "loss": 0.7626, "grad_norm": "1.456e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.188e-01", "anc_loss": "7.016e-01", "dlm_acc": "6.428e-01", "anc_acc": "6.105e-01", "epoch": 0.07117} {"step": 35590, "loss": 0.985, "grad_norm": "1.139e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.789e-01", "anc_loss": "9.047e-01", "dlm_acc": "4.213e-01", "anc_acc": "4.111e-01", "epoch": 0.07118} {"step": 35595, "loss": 0.6329, "grad_norm": "4.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.350e-01", "anc_loss": "3.699e-01", "dlm_acc": "7.408e-01", "anc_acc": "7.198e-01", "epoch": 0.07119} {"step": 35600, "loss": 0.7943, "grad_norm": "3.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.018e-01", "anc_loss": "2.488e-01", "dlm_acc": "8.560e-01", "anc_acc": "8.234e-01", "epoch": 0.0712} {"step": 35605, "loss": 1.081, "grad_norm": "3.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.641e-01", "anc_loss": "4.926e-01", "dlm_acc": "6.202e-01", "anc_acc": "6.008e-01", "epoch": 0.07121} {"step": 35610, "loss": 1.6735, "grad_norm": "2.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.172e+00", "anc_loss": "1.229e+00", "dlm_acc": "4.340e-01", "anc_acc": "4.139e-01", "epoch": 0.07122} {"step": 35615, "loss": 1.342, "grad_norm": "3.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.609e-01", "anc_loss": "1.116e+00", "dlm_acc": "6.117e-01", "anc_acc": "5.704e-01", "epoch": 0.07123} {"step": 35620, "loss": 1.0535, "grad_norm": "4.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.417e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.459e-01", "anc_acc": "5.162e-01", "epoch": 0.07124} {"step": 35625, "loss": 0.7264, "grad_norm": "1.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.728e-01", "anc_loss": "1.813e-01", "dlm_acc": "8.712e-01", "anc_acc": "8.673e-01", "epoch": 0.07125} {"step": 35630, "loss": 1.318, "grad_norm": "4.444e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.541e+00", "dlm_acc": "4.370e-01", "anc_acc": "4.273e-01", "epoch": 0.07126} {"step": 35635, "loss": 1.7172, "grad_norm": "3.753e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.492e-01", "anc_loss": "9.641e-01", "dlm_acc": "6.213e-01", "anc_acc": "5.938e-01", "epoch": 0.07127} {"step": 35640, "loss": 1.3222, "grad_norm": "5.764e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.674e+00", "anc_loss": "1.772e+00", "dlm_acc": "5.172e-01", "anc_acc": "4.954e-01", "epoch": 0.07128} {"step": 35645, "loss": 1.3179, "grad_norm": "4.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.607e-01", "anc_loss": "7.793e-01", "dlm_acc": "7.517e-01", "anc_acc": "7.139e-01", "epoch": 0.07129} {"step": 35650, "loss": 1.4522, "grad_norm": "7.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.694e-01", "anc_acc": "5.348e-01", "epoch": 0.0713} {"step": 35655, "loss": 1.4508, "grad_norm": "3.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.237e-01", "anc_acc": "4.988e-01", "epoch": 0.07131} {"step": 35660, "loss": 1.462, "grad_norm": "3.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.715e-01", "anc_loss": "8.113e-01", "dlm_acc": "5.254e-01", "anc_acc": "5.126e-01", "epoch": 0.07132} {"step": 35665, "loss": 1.5847, "grad_norm": "2.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.258e-01", "anc_loss": "7.273e-01", "dlm_acc": "5.721e-01", "anc_acc": "5.316e-01", "epoch": 0.07133} {"step": 35670, "loss": 1.3492, "grad_norm": "2.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.785e-01", "anc_loss": "5.961e-01", "dlm_acc": "5.735e-01", "anc_acc": "5.632e-01", "epoch": 0.07134} {"step": 35675, "loss": 0.8659, "grad_norm": "2.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.113e-01", "anc_loss": "4.371e-01", "dlm_acc": "6.870e-01", "anc_acc": "6.691e-01", "epoch": 0.07135} {"step": 35680, "loss": 0.8029, "grad_norm": "2.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.398e-01", "anc_loss": "4.699e-01", "dlm_acc": "6.515e-01", "anc_acc": "6.351e-01", "epoch": 0.07136} {"step": 35685, "loss": 0.9088, "grad_norm": "3.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.699e-01", "anc_loss": "4.824e-01", "dlm_acc": "6.131e-01", "anc_acc": "6.054e-01", "epoch": 0.07137} {"step": 35690, "loss": 1.3572, "grad_norm": "4.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.945e-01", "anc_loss": "1.040e+00", "dlm_acc": "5.155e-01", "anc_acc": "5.035e-01", "epoch": 0.07138} {"step": 35695, "loss": 1.1033, "grad_norm": "1.065e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.766e-01", "anc_loss": "9.680e-01", "dlm_acc": "5.797e-01", "anc_acc": "5.546e-01", "epoch": 0.07139} {"step": 35700, "loss": 1.2421, "grad_norm": "2.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.208e+00", "dlm_acc": "5.569e-01", "anc_acc": "5.305e-01", "epoch": 0.0714} {"step": 35705, "loss": 1.4461, "grad_norm": "4.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.002e-01", "anc_acc": "4.719e-01", "epoch": 0.07141} {"step": 35710, "loss": 1.3867, "grad_norm": "3.717e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.511e+00", "anc_loss": "1.685e+00", "dlm_acc": "4.500e-01", "anc_acc": "4.150e-01", "epoch": 0.07142} {"step": 35715, "loss": 1.4815, "grad_norm": "7.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.265e+00", "dlm_acc": "6.085e-01", "anc_acc": "5.580e-01", "epoch": 0.07143} {"step": 35720, "loss": 1.6857, "grad_norm": "4.377e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.426e+00", "anc_loss": "1.556e+00", "dlm_acc": "5.070e-01", "anc_acc": "4.712e-01", "epoch": 0.07144} {"step": 35725, "loss": 1.5471, "grad_norm": "4.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.381e+00", "anc_loss": "1.558e+00", "dlm_acc": "5.574e-01", "anc_acc": "5.165e-01", "epoch": 0.07145} {"step": 35730, "loss": 1.4465, "grad_norm": "9.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.393e-01", "anc_loss": "8.445e-01", "dlm_acc": "7.253e-01", "anc_acc": "7.031e-01", "epoch": 0.07146} {"step": 35735, "loss": 1.0429, "grad_norm": "4.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.181e+00", "dlm_acc": "5.297e-01", "anc_acc": "5.067e-01", "epoch": 0.07147} {"step": 35740, "loss": 1.2858, "grad_norm": "4.491e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.348e-01", "anc_acc": "5.105e-01", "epoch": 0.07148} {"step": 35745, "loss": 1.3521, "grad_norm": "3.330e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.514e+00", "anc_loss": "1.616e+00", "dlm_acc": "4.720e-01", "anc_acc": "4.482e-01", "epoch": 0.07149} {"step": 35750, "loss": 1.1329, "grad_norm": "3.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.184e+00", "dlm_acc": "6.063e-01", "anc_acc": "5.768e-01", "epoch": 0.0715} {"step": 35755, "loss": 1.4325, "grad_norm": "3.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.396e+00", "dlm_acc": "5.548e-01", "anc_acc": "5.305e-01", "epoch": 0.07151} {"step": 35760, "loss": 1.2521, "grad_norm": "2.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.310e+00", "dlm_acc": "5.733e-01", "anc_acc": "5.461e-01", "epoch": 0.07152} {"step": 35765, "loss": 0.9767, "grad_norm": "4.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.187e+00", "dlm_acc": "6.070e-01", "anc_acc": "5.744e-01", "epoch": 0.07153} {"step": 35770, "loss": 0.9727, "grad_norm": "4.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.666e-01", "anc_loss": "8.641e-01", "dlm_acc": "7.221e-01", "anc_acc": "6.958e-01", "epoch": 0.07154} {"step": 35775, "loss": 1.2059, "grad_norm": "2.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.134e+00", "dlm_acc": "6.519e-01", "anc_acc": "6.180e-01", "epoch": 0.07155} {"step": 35780, "loss": 1.2765, "grad_norm": "2.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.896e-01", "anc_acc": "5.699e-01", "epoch": 0.07156} {"step": 35785, "loss": 1.3769, "grad_norm": "2.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.302e+00", "anc_loss": "1.415e+00", "dlm_acc": "5.492e-01", "anc_acc": "5.215e-01", "epoch": 0.07157} {"step": 35790, "loss": 1.1783, "grad_norm": "5.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.812e-01", "anc_acc": "5.548e-01", "epoch": 0.07158} {"step": 35795, "loss": 1.1123, "grad_norm": "2.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.174e+00", "dlm_acc": "6.095e-01", "anc_acc": "5.745e-01", "epoch": 0.07159} {"step": 35800, "loss": 1.4714, "grad_norm": "5.405e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.561e+00", "anc_loss": "1.691e+00", "dlm_acc": "5.054e-01", "anc_acc": "4.774e-01", "epoch": 0.0716} {"step": 35805, "loss": 1.1357, "grad_norm": "2.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.273e+00", "dlm_acc": "5.799e-01", "anc_acc": "5.561e-01", "epoch": 0.07161} {"step": 35810, "loss": 1.0872, "grad_norm": "3.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.224e+00", "dlm_acc": "5.691e-01", "anc_acc": "5.406e-01", "epoch": 0.07162} {"step": 35815, "loss": 1.1934, "grad_norm": "3.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.235e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.858e-01", "anc_acc": "5.515e-01", "epoch": 0.07163} {"step": 35820, "loss": 1.3447, "grad_norm": "3.678e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.335e+00", "dlm_acc": "6.027e-01", "anc_acc": "5.736e-01", "epoch": 0.07164} {"step": 35825, "loss": 1.8207, "grad_norm": "4.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.683e+00", "anc_loss": "1.792e+00", "dlm_acc": "5.064e-01", "anc_acc": "4.835e-01", "epoch": 0.07165} {"step": 35830, "loss": 1.4532, "grad_norm": "6.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.605e+00", "dlm_acc": "5.512e-01", "anc_acc": "5.270e-01", "epoch": 0.07166} {"step": 35835, "loss": 0.9639, "grad_norm": "3.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.111e+00", "dlm_acc": "6.060e-01", "anc_acc": "5.766e-01", "epoch": 0.07167} {"step": 35840, "loss": 1.4619, "grad_norm": "4.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.577e+00", "anc_loss": "1.688e+00", "dlm_acc": "5.030e-01", "anc_acc": "4.788e-01", "epoch": 0.07168} {"step": 35845, "loss": 1.2013, "grad_norm": "2.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.223e+00", "dlm_acc": "6.399e-01", "anc_acc": "6.150e-01", "epoch": 0.07169} {"step": 35850, "loss": 1.2206, "grad_norm": "4.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.251e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.771e-01", "epoch": 0.0717} {"step": 35855, "loss": 1.8632, "grad_norm": "4.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.844e+00", "anc_loss": "1.997e+00", "dlm_acc": "4.972e-01", "anc_acc": "4.652e-01", "epoch": 0.07171} {"step": 35860, "loss": 0.9378, "grad_norm": "4.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.275e-01", "epoch": 0.07172} {"step": 35865, "loss": 1.1814, "grad_norm": "3.119e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.519e+00", "anc_loss": "1.650e+00", "dlm_acc": "5.339e-01", "anc_acc": "5.032e-01", "epoch": 0.07173} {"step": 35870, "loss": 1.4716, "grad_norm": "4.731e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.073e+00", "anc_loss": "2.191e+00", "dlm_acc": "4.464e-01", "anc_acc": "4.233e-01", "epoch": 0.07174} {"step": 35875, "loss": 0.7412, "grad_norm": "2.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.586e-01", "anc_loss": "1.052e+00", "dlm_acc": "6.318e-01", "anc_acc": "6.045e-01", "epoch": 0.07175} {"step": 35880, "loss": 1.2189, "grad_norm": "3.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.500e-01", "epoch": 0.07176} {"step": 35885, "loss": 1.0173, "grad_norm": "2.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.207e-01", "anc_loss": "7.730e-01", "dlm_acc": "6.984e-01", "anc_acc": "6.850e-01", "epoch": 0.07177} {"step": 35890, "loss": 0.9813, "grad_norm": "3.837e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.519e-01", "anc_loss": "5.062e-01", "dlm_acc": "8.110e-01", "anc_acc": "7.910e-01", "epoch": 0.07178} {"step": 35895, "loss": 1.3169, "grad_norm": "4.830e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.321e+00", "dlm_acc": "5.857e-01", "anc_acc": "5.612e-01", "epoch": 0.07179} {"step": 35900, "loss": 0.9988, "grad_norm": "4.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.865e-01", "anc_loss": "6.227e-01", "dlm_acc": "5.692e-01", "anc_acc": "5.508e-01", "epoch": 0.0718} {"step": 35905, "loss": 0.9278, "grad_norm": "4.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.430e-01", "anc_loss": "8.285e-01", "dlm_acc": "7.152e-01", "anc_acc": "6.980e-01", "epoch": 0.07181} {"step": 35910, "loss": 0.8992, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.969e-01", "anc_loss": "4.891e-01", "dlm_acc": "8.339e-01", "anc_acc": "8.105e-01", "epoch": 0.07182} {"step": 35915, "loss": 0.936, "grad_norm": "2.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.570e-01", "anc_loss": "6.480e-01", "dlm_acc": "7.642e-01", "anc_acc": "7.400e-01", "epoch": 0.07183} {"step": 35920, "loss": 1.1875, "grad_norm": "1.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.731e-01", "anc_loss": "3.904e-01", "dlm_acc": "7.679e-01", "anc_acc": "7.605e-01", "epoch": 0.07184} {"step": 35925, "loss": 0.9559, "grad_norm": "2.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.592e-01", "anc_loss": "4.953e-01", "dlm_acc": "6.866e-01", "anc_acc": "6.753e-01", "epoch": 0.07185} {"step": 35930, "loss": 0.8526, "grad_norm": "3.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.049e-01", "anc_loss": "3.375e-01", "dlm_acc": "7.458e-01", "anc_acc": "7.254e-01", "epoch": 0.07186} {"step": 35935, "loss": 1.0419, "grad_norm": "2.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.590e-01", "anc_loss": "3.836e-01", "dlm_acc": "7.213e-01", "anc_acc": "7.074e-01", "epoch": 0.07187} {"step": 35940, "loss": 1.2202, "grad_norm": "2.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.672e-01", "anc_loss": "4.020e-01", "dlm_acc": "7.292e-01", "anc_acc": "7.068e-01", "epoch": 0.07188} {"step": 35945, "loss": 0.8373, "grad_norm": "2.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.588e-01", "anc_loss": "3.871e-01", "dlm_acc": "7.174e-01", "anc_acc": "7.002e-01", "epoch": 0.07189} {"step": 35950, "loss": 0.5428, "grad_norm": "2.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.088e-01", "anc_loss": "4.400e-01", "dlm_acc": "7.197e-01", "anc_acc": "6.990e-01", "epoch": 0.0719} {"step": 35955, "loss": 1.287, "grad_norm": "4.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.770e-01", "anc_loss": "4.082e-01", "dlm_acc": "7.847e-01", "anc_acc": "7.636e-01", "epoch": 0.07191} {"step": 35960, "loss": 1.4121, "grad_norm": "6.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.477e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.676e-01", "anc_acc": "6.485e-01", "epoch": 0.07192} {"step": 35965, "loss": 1.1915, "grad_norm": "3.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.133e+00", "dlm_acc": "6.401e-01", "anc_acc": "6.122e-01", "epoch": 0.07193} {"step": 35970, "loss": 1.2406, "grad_norm": "3.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.152e+00", "dlm_acc": "6.589e-01", "anc_acc": "6.202e-01", "epoch": 0.07194} {"step": 35975, "loss": 1.1028, "grad_norm": "4.511e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.717e-01", "anc_loss": "6.887e-01", "dlm_acc": "8.225e-01", "anc_acc": "7.974e-01", "epoch": 0.07195} {"step": 35980, "loss": 0.7247, "grad_norm": "2.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e-01", "anc_loss": "2.255e-01", "dlm_acc": "9.498e-01", "anc_acc": "9.291e-01", "epoch": 0.07196} {"step": 35985, "loss": 0.9043, "grad_norm": "2.976e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.875e-01", "anc_loss": "9.992e-01", "dlm_acc": "6.876e-01", "anc_acc": "6.605e-01", "epoch": 0.07197} {"step": 35990, "loss": 0.7861, "grad_norm": "3.878e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.069e+00", "anc_loss": "1.175e+00", "dlm_acc": "6.389e-01", "anc_acc": "6.125e-01", "epoch": 0.07198} {"step": 35995, "loss": 0.7851, "grad_norm": "3.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.656e-01", "anc_loss": "7.371e-01", "dlm_acc": "6.147e-01", "anc_acc": "5.849e-01", "epoch": 0.07199} {"step": 36000, "loss": 1.0862, "grad_norm": "5.011e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.398e-01", "anc_loss": "7.937e-01", "dlm_acc": "4.905e-01", "anc_acc": "4.627e-01", "epoch": 0.072} {"step": 36005, "loss": 1.1828, "grad_norm": "3.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.680e-01", "anc_loss": "7.242e-01", "dlm_acc": "4.976e-01", "anc_acc": "4.665e-01", "epoch": 0.07201} {"step": 36010, "loss": 1.8793, "grad_norm": "2.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.584e-01", "anc_loss": "1.013e+00", "dlm_acc": "6.666e-01", "anc_acc": "6.516e-01", "epoch": 0.07202} {"step": 36015, "loss": 0.8666, "grad_norm": "2.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.441e-01", "anc_loss": "5.984e-01", "dlm_acc": "8.079e-01", "anc_acc": "7.951e-01", "epoch": 0.07203} {"step": 36020, "loss": 1.0289, "grad_norm": "3.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.332e-01", "anc_loss": "3.755e-01", "dlm_acc": "8.342e-01", "anc_acc": "8.164e-01", "epoch": 0.07204} {"step": 36025, "loss": 1.2423, "grad_norm": "4.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.189e+00", "dlm_acc": "6.450e-01", "anc_acc": "6.180e-01", "epoch": 0.07205} {"step": 36030, "loss": 0.9768, "grad_norm": "2.666e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.129e-01", "anc_loss": "8.992e-01", "dlm_acc": "6.818e-01", "anc_acc": "6.571e-01", "epoch": 0.07206} {"step": 36035, "loss": 1.6841, "grad_norm": "5.626e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.507e+00", "anc_loss": "1.605e+00", "dlm_acc": "5.296e-01", "anc_acc": "5.087e-01", "epoch": 0.07207} {"step": 36040, "loss": 1.2285, "grad_norm": "4.547e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.047e-01", "anc_loss": "5.328e-01", "dlm_acc": "6.825e-01", "anc_acc": "6.677e-01", "epoch": 0.07208} {"step": 36045, "loss": 1.2356, "grad_norm": "5.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.293e-01", "anc_loss": "4.602e-01", "dlm_acc": "7.433e-01", "anc_acc": "7.323e-01", "epoch": 0.07209} {"step": 36050, "loss": 1.1371, "grad_norm": "3.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.297e-01", "anc_loss": "4.668e-01", "dlm_acc": "7.449e-01", "anc_acc": "7.314e-01", "epoch": 0.0721} {"step": 36055, "loss": 1.0845, "grad_norm": "2.389e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.430e-01", "anc_loss": "4.723e-01", "dlm_acc": "7.199e-01", "anc_acc": "7.072e-01", "epoch": 0.07211} {"step": 36060, "loss": 1.4115, "grad_norm": "6.019e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.199e+00", "dlm_acc": "6.324e-01", "anc_acc": "6.092e-01", "epoch": 0.07212} {"step": 36065, "loss": 1.3625, "grad_norm": "5.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.840e-01", "anc_loss": "1.051e+00", "dlm_acc": "5.309e-01", "anc_acc": "5.093e-01", "epoch": 0.07213} {"step": 36070, "loss": 1.5777, "grad_norm": "5.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.998e-01", "anc_loss": "1.073e+00", "dlm_acc": "6.532e-01", "anc_acc": "6.339e-01", "epoch": 0.07214} {"step": 36075, "loss": 1.2932, "grad_norm": "3.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.711e-01", "anc_loss": "8.686e-01", "dlm_acc": "7.198e-01", "anc_acc": "6.950e-01", "epoch": 0.07215} {"step": 36080, "loss": 1.3844, "grad_norm": "7.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.482e+00", "dlm_acc": "6.026e-01", "anc_acc": "5.801e-01", "epoch": 0.07216} {"step": 36085, "loss": 1.4321, "grad_norm": "4.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.289e+00", "dlm_acc": "6.234e-01", "anc_acc": "6.010e-01", "epoch": 0.07217} {"step": 36090, "loss": 1.4673, "grad_norm": "4.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.111e+00", "dlm_acc": "6.677e-01", "anc_acc": "6.445e-01", "epoch": 0.07218} {"step": 36095, "loss": 1.1764, "grad_norm": "2.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.418e+00", "dlm_acc": "5.808e-01", "anc_acc": "5.526e-01", "epoch": 0.07219} {"step": 36100, "loss": 0.9664, "grad_norm": "4.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.191e-01", "anc_loss": "4.621e-01", "dlm_acc": "8.354e-01", "anc_acc": "8.231e-01", "epoch": 0.0722} {"step": 36105, "loss": 0.7758, "grad_norm": "2.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e-01", "anc_loss": "1.194e-01", "dlm_acc": "9.364e-01", "anc_acc": "9.302e-01", "epoch": 0.07221} {"step": 36110, "loss": 0.6046, "grad_norm": "2.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.145e-02", "anc_loss": "7.108e-02", "dlm_acc": "9.597e-01", "anc_acc": "9.550e-01", "epoch": 0.07222} {"step": 36115, "loss": 1.0974, "grad_norm": "3.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.783e-01", "anc_loss": "5.503e-01", "dlm_acc": "8.141e-01", "anc_acc": "7.933e-01", "epoch": 0.07223} {"step": 36120, "loss": 0.9578, "grad_norm": "3.424e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.275e-01", "anc_loss": "4.591e-01", "dlm_acc": "8.067e-01", "anc_acc": "7.944e-01", "epoch": 0.07224} {"step": 36125, "loss": 1.6791, "grad_norm": "4.719e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.035e-01", "anc_loss": "9.668e-01", "dlm_acc": "6.432e-01", "anc_acc": "6.254e-01", "epoch": 0.07225} {"step": 36130, "loss": 0.8666, "grad_norm": "2.511e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.457e-01", "anc_loss": "2.688e-01", "dlm_acc": "8.970e-01", "anc_acc": "8.869e-01", "epoch": 0.07226} {"step": 36135, "loss": 0.8334, "grad_norm": "3.370e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.009e-01", "anc_loss": "6.806e-01", "dlm_acc": "7.827e-01", "anc_acc": "7.587e-01", "epoch": 0.07227} {"step": 36140, "loss": 1.2163, "grad_norm": "5.222e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.287e+00", "dlm_acc": "6.274e-01", "anc_acc": "6.068e-01", "epoch": 0.07228} {"step": 36145, "loss": 1.0094, "grad_norm": "4.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.512e-01", "anc_loss": "8.191e-01", "dlm_acc": "6.716e-01", "anc_acc": "6.490e-01", "epoch": 0.07229} {"step": 36150, "loss": 0.7941, "grad_norm": "8.088e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.605e-01", "anc_loss": "2.658e-01", "dlm_acc": "8.472e-01", "anc_acc": "8.448e-01", "epoch": 0.0723} {"step": 36155, "loss": 1.0654, "grad_norm": "3.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.359e-01", "anc_loss": "2.437e-01", "dlm_acc": "8.586e-01", "anc_acc": "8.583e-01", "epoch": 0.07231} {"step": 36160, "loss": 1.336, "grad_norm": "4.762e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.281e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.441e-01", "epoch": 0.07232} {"step": 36165, "loss": 1.0215, "grad_norm": "2.688e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.023e-01", "anc_loss": "9.961e-01", "dlm_acc": "6.572e-01", "anc_acc": "6.323e-01", "epoch": 0.07233} {"step": 36170, "loss": 0.9847, "grad_norm": "4.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.316e-01", "anc_loss": "6.832e-01", "dlm_acc": "7.098e-01", "anc_acc": "6.926e-01", "epoch": 0.07234} {"step": 36175, "loss": 1.2183, "grad_norm": "7.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.425e-01", "anc_acc": "5.211e-01", "epoch": 0.07235} {"step": 36180, "loss": 1.0751, "grad_norm": "2.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.245e+00", "dlm_acc": "5.855e-01", "anc_acc": "5.459e-01", "epoch": 0.07236} {"step": 36185, "loss": 1.3148, "grad_norm": "2.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.637e+00", "anc_loss": "1.742e+00", "dlm_acc": "4.356e-01", "anc_acc": "4.107e-01", "epoch": 0.07237} {"step": 36190, "loss": 1.0057, "grad_norm": "2.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.920e-01", "anc_acc": "5.647e-01", "epoch": 0.07238} {"step": 36195, "loss": 1.0073, "grad_norm": "4.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.750e-01", "anc_loss": "8.742e-01", "dlm_acc": "6.619e-01", "anc_acc": "6.275e-01", "epoch": 0.07239} {"step": 36200, "loss": 1.3404, "grad_norm": "4.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.097e+00", "dlm_acc": "6.191e-01", "anc_acc": "5.934e-01", "epoch": 0.0724} {"step": 36205, "loss": 1.2552, "grad_norm": "3.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.190e+00", "dlm_acc": "6.049e-01", "anc_acc": "5.508e-01", "epoch": 0.07241} {"step": 36210, "loss": 1.1089, "grad_norm": "2.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.375e-01", "anc_loss": "1.113e+00", "dlm_acc": "6.706e-01", "anc_acc": "6.153e-01", "epoch": 0.07242} {"step": 36215, "loss": 0.9731, "grad_norm": "3.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.867e-01", "anc_loss": "9.484e-01", "dlm_acc": "6.981e-01", "anc_acc": "6.542e-01", "epoch": 0.07243} {"step": 36220, "loss": 1.3337, "grad_norm": "2.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.613e+00", "anc_loss": "1.712e+00", "dlm_acc": "4.854e-01", "anc_acc": "4.638e-01", "epoch": 0.07244} {"step": 36225, "loss": 1.1993, "grad_norm": "3.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.106e-01", "anc_acc": "4.673e-01", "epoch": 0.07245} {"step": 36230, "loss": 1.0009, "grad_norm": "4.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.570e-01", "anc_loss": "1.080e+00", "dlm_acc": "6.176e-01", "anc_acc": "5.814e-01", "epoch": 0.07246} {"step": 36235, "loss": 1.0969, "grad_norm": "2.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.276e+00", "anc_loss": "1.389e+00", "dlm_acc": "5.289e-01", "anc_acc": "4.994e-01", "epoch": 0.07247} {"step": 36240, "loss": 0.7998, "grad_norm": "2.508e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.344e-01", "anc_loss": "8.656e-01", "dlm_acc": "7.019e-01", "anc_acc": "6.641e-01", "epoch": 0.07248} {"step": 36245, "loss": 1.1997, "grad_norm": "2.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.894e-01", "anc_acc": "5.490e-01", "epoch": 0.07249} {"step": 36250, "loss": 0.8229, "grad_norm": "1.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.562e-01", "anc_loss": "8.684e-01", "dlm_acc": "6.849e-01", "anc_acc": "6.527e-01", "epoch": 0.0725} {"step": 36255, "loss": 1.4247, "grad_norm": "4.752e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.204e+00", "dlm_acc": "5.919e-01", "anc_acc": "5.473e-01", "epoch": 0.07251} {"step": 36260, "loss": 1.0605, "grad_norm": "2.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.797e-01", "anc_loss": "1.067e+00", "dlm_acc": "6.287e-01", "anc_acc": "5.976e-01", "epoch": 0.07252} {"step": 36265, "loss": 1.1729, "grad_norm": "3.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.625e-01", "anc_loss": "9.391e-01", "dlm_acc": "6.809e-01", "anc_acc": "6.586e-01", "epoch": 0.07253} {"step": 36270, "loss": 1.4283, "grad_norm": "4.370e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.643e+00", "dlm_acc": "4.944e-01", "anc_acc": "4.443e-01", "epoch": 0.07254} {"step": 36275, "loss": 1.2688, "grad_norm": "3.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.438e+00", "anc_loss": "1.616e+00", "dlm_acc": "5.210e-01", "anc_acc": "4.812e-01", "epoch": 0.07255} {"step": 36280, "loss": 0.9798, "grad_norm": "6.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.650e-01", "anc_loss": "1.046e+00", "dlm_acc": "6.038e-01", "anc_acc": "5.808e-01", "epoch": 0.07256} {"step": 36285, "loss": 1.1278, "grad_norm": "4.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.789e-01", "anc_loss": "9.320e-01", "dlm_acc": "6.605e-01", "anc_acc": "6.047e-01", "epoch": 0.07257} {"step": 36290, "loss": 1.3091, "grad_norm": "2.979e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.007e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.204e-01", "anc_acc": "5.875e-01", "epoch": 0.07258} {"step": 36295, "loss": 1.1873, "grad_norm": "3.444e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.170e+00", "dlm_acc": "6.054e-01", "anc_acc": "5.826e-01", "epoch": 0.07259} {"step": 36300, "loss": 1.2101, "grad_norm": "3.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.338e+00", "dlm_acc": "5.619e-01", "anc_acc": "5.144e-01", "epoch": 0.0726} {"step": 36305, "loss": 1.4152, "grad_norm": "4.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.606e+00", "anc_loss": "1.711e+00", "dlm_acc": "4.171e-01", "anc_acc": "3.847e-01", "epoch": 0.07261} {"step": 36310, "loss": 1.3093, "grad_norm": "3.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.491e+00", "dlm_acc": "4.830e-01", "anc_acc": "4.635e-01", "epoch": 0.07262} {"step": 36315, "loss": 1.7849, "grad_norm": "3.422e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.268e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.241e-01", "epoch": 0.07263} {"step": 36320, "loss": 1.898, "grad_norm": "3.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.708e-01", "anc_acc": "5.335e-01", "epoch": 0.07264} {"step": 36325, "loss": 2.0684, "grad_norm": "3.003e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.881e+00", "anc_loss": "1.999e+00", "dlm_acc": "4.437e-01", "anc_acc": "4.169e-01", "epoch": 0.07265} {"step": 36330, "loss": 1.6136, "grad_norm": "4.957e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.343e+00", "dlm_acc": "5.675e-01", "anc_acc": "5.432e-01", "epoch": 0.07266} {"step": 36335, "loss": 1.585, "grad_norm": "4.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.383e+00", "anc_loss": "1.554e+00", "dlm_acc": "5.596e-01", "anc_acc": "5.205e-01", "epoch": 0.07267} {"step": 36340, "loss": 1.2462, "grad_norm": "3.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.461e-01", "anc_acc": "5.168e-01", "epoch": 0.07268} {"step": 36345, "loss": 1.2654, "grad_norm": "3.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.072e+00", "anc_loss": "2.216e+00", "dlm_acc": "3.095e-01", "anc_acc": "2.779e-01", "epoch": 0.07269} {"step": 36350, "loss": 0.8292, "grad_norm": "4.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.185e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.728e-01", "anc_acc": "5.286e-01", "epoch": 0.0727} {"step": 36355, "loss": 1.0816, "grad_norm": "5.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.771e-01", "anc_acc": "5.159e-01", "epoch": 0.07271} {"step": 36360, "loss": 1.435, "grad_norm": "1.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.673e+00", "anc_loss": "1.731e+00", "dlm_acc": "4.500e-01", "anc_acc": "4.359e-01", "epoch": 0.07272} {"step": 36365, "loss": 1.1292, "grad_norm": "2.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e-01", "anc_loss": "1.689e-01", "dlm_acc": "9.161e-01", "anc_acc": "9.031e-01", "epoch": 0.07273} {"step": 36370, "loss": 1.3427, "grad_norm": "4.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.891e-01", "anc_loss": "8.574e-01", "dlm_acc": "6.901e-01", "anc_acc": "6.674e-01", "epoch": 0.07274} {"step": 36375, "loss": 1.3213, "grad_norm": "2.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.137e-01", "anc_loss": "5.596e-01", "dlm_acc": "6.954e-01", "anc_acc": "6.691e-01", "epoch": 0.07275} {"step": 36380, "loss": 0.872, "grad_norm": "4.869e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.271e-01", "anc_loss": "7.016e-01", "dlm_acc": "7.555e-01", "anc_acc": "7.234e-01", "epoch": 0.07276} {"step": 36385, "loss": 1.1456, "grad_norm": "2.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.793e-01", "anc_loss": "9.742e-01", "dlm_acc": "6.414e-01", "anc_acc": "6.100e-01", "epoch": 0.07277} {"step": 36390, "loss": 1.1675, "grad_norm": "3.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.464e+00", "anc_loss": "1.592e+00", "dlm_acc": "5.283e-01", "anc_acc": "4.990e-01", "epoch": 0.07278} {"step": 36395, "loss": 1.0118, "grad_norm": "3.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.289e+00", "dlm_acc": "5.104e-01", "anc_acc": "4.924e-01", "epoch": 0.07279} {"step": 36400, "loss": 0.7915, "grad_norm": "4.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.871e-01", "anc_loss": "7.590e-01", "dlm_acc": "7.082e-01", "anc_acc": "6.850e-01", "epoch": 0.0728} {"step": 36405, "loss": 1.1316, "grad_norm": "3.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.387e-01", "anc_loss": "7.273e-01", "dlm_acc": "6.748e-01", "anc_acc": "6.468e-01", "epoch": 0.07281} {"step": 36410, "loss": 0.8575, "grad_norm": "2.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.180e-01", "anc_loss": "4.887e-01", "dlm_acc": "7.648e-01", "anc_acc": "7.395e-01", "epoch": 0.07282} {"step": 36415, "loss": 1.4637, "grad_norm": "7.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.308e-01", "anc_acc": "5.062e-01", "epoch": 0.07283} {"step": 36420, "loss": 1.6596, "grad_norm": "4.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.927e+00", "anc_loss": "2.030e+00", "dlm_acc": "4.049e-01", "anc_acc": "3.855e-01", "epoch": 0.07284} {"step": 36425, "loss": 1.0849, "grad_norm": "2.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.191e-01", "anc_loss": "9.617e-01", "dlm_acc": "6.412e-01", "anc_acc": "5.975e-01", "epoch": 0.07285} {"step": 36430, "loss": 1.2581, "grad_norm": "6.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.803e-01", "anc_acc": "5.439e-01", "epoch": 0.07286} {"step": 36435, "loss": 1.0903, "grad_norm": "3.146e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.906e-01", "anc_loss": "1.153e+00", "dlm_acc": "6.121e-01", "anc_acc": "5.701e-01", "epoch": 0.07287} {"step": 36440, "loss": 1.9623, "grad_norm": "6.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.569e+00", "dlm_acc": "5.450e-01", "anc_acc": "5.146e-01", "epoch": 0.07288} {"step": 36445, "loss": 1.2628, "grad_norm": "5.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.511e+00", "dlm_acc": "4.825e-01", "anc_acc": "4.603e-01", "epoch": 0.07289} {"step": 36450, "loss": 1.3447, "grad_norm": "4.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.626e+00", "anc_loss": "1.713e+00", "dlm_acc": "4.615e-01", "anc_acc": "4.402e-01", "epoch": 0.0729} {"step": 36455, "loss": 1.494, "grad_norm": "4.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.245e+00", "dlm_acc": "6.225e-01", "anc_acc": "5.881e-01", "epoch": 0.07291} {"step": 36460, "loss": 1.2158, "grad_norm": "2.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.382e-01", "anc_acc": "5.005e-01", "epoch": 0.07292} {"step": 36465, "loss": 1.0371, "grad_norm": "2.837e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.711e-01", "anc_loss": "8.443e-01", "dlm_acc": "5.831e-01", "anc_acc": "5.608e-01", "epoch": 0.07293} {"step": 36470, "loss": 1.2263, "grad_norm": "3.306e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.205e+00", "dlm_acc": "6.032e-01", "anc_acc": "5.738e-01", "epoch": 0.07294} {"step": 36475, "loss": 1.2742, "grad_norm": "5.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.819e-01", "anc_loss": "1.097e+00", "dlm_acc": "6.719e-01", "anc_acc": "6.444e-01", "epoch": 0.07295} {"step": 36480, "loss": 1.2127, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.506e-01", "anc_acc": "5.169e-01", "epoch": 0.07296} {"step": 36485, "loss": 1.2701, "grad_norm": "2.747e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.472e-01", "anc_acc": "4.936e-01", "epoch": 0.07297} {"step": 36490, "loss": 0.9533, "grad_norm": "2.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.344e-01", "anc_loss": "9.160e-01", "dlm_acc": "6.017e-01", "anc_acc": "5.774e-01", "epoch": 0.07298} {"step": 36495, "loss": 1.1765, "grad_norm": "4.122e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.061e+00", "anc_loss": "1.139e+00", "dlm_acc": "5.777e-01", "anc_acc": "5.529e-01", "epoch": 0.07299} {"step": 36500, "loss": 1.094, "grad_norm": "3.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.486e+00", "dlm_acc": "5.540e-01", "anc_acc": "5.060e-01", "epoch": 0.073} {"step": 36505, "loss": 0.8903, "grad_norm": "3.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.934e-01", "anc_loss": "1.079e+00", "dlm_acc": "6.014e-01", "anc_acc": "5.815e-01", "epoch": 0.07301} {"step": 36510, "loss": 1.1843, "grad_norm": "4.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.064e+00", "anc_loss": "1.156e+00", "dlm_acc": "5.446e-01", "anc_acc": "5.145e-01", "epoch": 0.07302} {"step": 36515, "loss": 1.1493, "grad_norm": "6.943e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.282e+00", "dlm_acc": "5.390e-01", "anc_acc": "5.086e-01", "epoch": 0.07303} {"step": 36520, "loss": 1.2579, "grad_norm": "7.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.191e+00", "dlm_acc": "5.905e-01", "anc_acc": "5.745e-01", "epoch": 0.07304} {"step": 36525, "loss": 1.1387, "grad_norm": "3.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.770e-01", "anc_loss": "9.703e-01", "dlm_acc": "6.708e-01", "anc_acc": "6.455e-01", "epoch": 0.07305} {"step": 36530, "loss": 1.3704, "grad_norm": "4.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.961e-01", "anc_loss": "7.680e-01", "dlm_acc": "6.106e-01", "anc_acc": "5.883e-01", "epoch": 0.07306} {"step": 36535, "loss": 1.137, "grad_norm": "7.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.570e-01", "anc_loss": "6.012e-01", "dlm_acc": "6.375e-01", "anc_acc": "6.276e-01", "epoch": 0.07307} {"step": 36540, "loss": 0.9036, "grad_norm": "2.438e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.707e-01", "anc_loss": "8.703e-01", "dlm_acc": "6.897e-01", "anc_acc": "6.592e-01", "epoch": 0.07308} {"step": 36545, "loss": 1.1966, "grad_norm": "5.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.114e+00", "dlm_acc": "5.064e-01", "anc_acc": "4.882e-01", "epoch": 0.07309} {"step": 36550, "loss": 1.1749, "grad_norm": "3.170e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.082e+00", "anc_loss": "1.197e+00", "dlm_acc": "6.340e-01", "anc_acc": "6.072e-01", "epoch": 0.0731} {"step": 36555, "loss": 1.0173, "grad_norm": "2.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.422e-01", "anc_loss": "7.094e-01", "dlm_acc": "6.337e-01", "anc_acc": "6.033e-01", "epoch": 0.07311} {"step": 36560, "loss": 1.5728, "grad_norm": "3.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.590e+00", "dlm_acc": "5.490e-01", "anc_acc": "5.212e-01", "epoch": 0.07312} {"step": 36565, "loss": 0.8847, "grad_norm": "3.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.124e+00", "anc_loss": "1.213e+00", "dlm_acc": "5.640e-01", "anc_acc": "5.383e-01", "epoch": 0.07313} {"step": 36570, "loss": 0.8694, "grad_norm": "2.131e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.620e-01", "anc_acc": "5.336e-01", "epoch": 0.07314} {"step": 36575, "loss": 0.9311, "grad_norm": "4.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.875e-01", "anc_loss": "1.000e+00", "dlm_acc": "6.104e-01", "anc_acc": "5.784e-01", "epoch": 0.07315} {"step": 36580, "loss": 0.8799, "grad_norm": "2.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.465e-01", "anc_loss": "8.206e-01", "dlm_acc": "6.866e-01", "anc_acc": "6.655e-01", "epoch": 0.07316} {"step": 36585, "loss": 0.7347, "grad_norm": "4.053e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.191e-01", "anc_loss": "3.739e-01", "dlm_acc": "8.028e-01", "anc_acc": "7.759e-01", "epoch": 0.07317} {"step": 36590, "loss": 1.1352, "grad_norm": "2.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.072e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.424e-01", "anc_acc": "5.139e-01", "epoch": 0.07318} {"step": 36595, "loss": 1.2324, "grad_norm": "3.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.849e-01", "anc_acc": "5.614e-01", "epoch": 0.07319} {"step": 36600, "loss": 1.3633, "grad_norm": "3.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.172e-01", "anc_loss": "7.523e-01", "dlm_acc": "6.104e-01", "anc_acc": "5.978e-01", "epoch": 0.0732} {"step": 36605, "loss": 0.9269, "grad_norm": "2.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.484e-01", "anc_loss": "7.539e-01", "dlm_acc": "4.159e-01", "anc_acc": "4.122e-01", "epoch": 0.07321} {"step": 36610, "loss": 1.4293, "grad_norm": "4.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.243e+00", "dlm_acc": "5.607e-01", "anc_acc": "5.286e-01", "epoch": 0.07322} {"step": 36615, "loss": 1.522, "grad_norm": "7.997e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.354e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.743e-01", "epoch": 0.07323} {"step": 36620, "loss": 0.9587, "grad_norm": "3.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.641e-01", "anc_loss": "1.002e+00", "dlm_acc": "2.812e-01", "anc_acc": "2.564e-01", "epoch": 0.07324} {"step": 36625, "loss": 0.9362, "grad_norm": "3.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.406e-01", "anc_loss": "9.062e-01", "dlm_acc": "5.372e-01", "anc_acc": "5.155e-01", "epoch": 0.07325} {"step": 36630, "loss": 0.9455, "grad_norm": "1.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.957e-01", "anc_loss": "8.664e-01", "dlm_acc": "6.836e-01", "anc_acc": "6.669e-01", "epoch": 0.07326} {"step": 36635, "loss": 0.8254, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.047e-01", "anc_loss": "5.723e-01", "dlm_acc": "7.535e-01", "anc_acc": "7.244e-01", "epoch": 0.07327} {"step": 36640, "loss": 0.878, "grad_norm": "4.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.246e-01", "anc_loss": "7.676e-01", "dlm_acc": "6.703e-01", "anc_acc": "6.569e-01", "epoch": 0.07328} {"step": 36645, "loss": 0.9565, "grad_norm": "4.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.918e-01", "anc_loss": "6.980e-01", "dlm_acc": "5.520e-01", "anc_acc": "5.494e-01", "epoch": 0.07329} {"step": 36650, "loss": 0.9058, "grad_norm": "2.544e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.055e-01", "anc_loss": "7.109e-01", "dlm_acc": "5.565e-01", "anc_acc": "5.530e-01", "epoch": 0.0733} {"step": 36655, "loss": 0.7062, "grad_norm": "1.879e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.312e-01", "anc_loss": "5.387e-01", "dlm_acc": "6.103e-01", "anc_acc": "6.072e-01", "epoch": 0.07331} {"step": 36660, "loss": 1.1827, "grad_norm": "3.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.820e-01", "anc_loss": "7.863e-01", "dlm_acc": "5.281e-01", "anc_acc": "5.265e-01", "epoch": 0.07332} {"step": 36665, "loss": 1.2044, "grad_norm": "2.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.609e-01", "anc_loss": "1.034e+00", "dlm_acc": "5.751e-01", "anc_acc": "5.548e-01", "epoch": 0.07333} {"step": 36670, "loss": 0.9816, "grad_norm": "2.640e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.094e-01", "anc_loss": "9.883e-01", "dlm_acc": "5.931e-01", "anc_acc": "5.724e-01", "epoch": 0.07334} {"step": 36675, "loss": 0.9884, "grad_norm": "2.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.857e-01", "anc_loss": "6.725e-01", "dlm_acc": "6.872e-01", "anc_acc": "6.536e-01", "epoch": 0.07335} {"step": 36680, "loss": 1.1912, "grad_norm": "4.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.875e-01", "anc_loss": "1.066e+00", "dlm_acc": "5.360e-01", "anc_acc": "5.146e-01", "epoch": 0.07336} {"step": 36685, "loss": 0.8254, "grad_norm": "5.679e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.679e-01", "anc_loss": "6.269e-01", "dlm_acc": "6.996e-01", "anc_acc": "6.778e-01", "epoch": 0.07337} {"step": 36690, "loss": 1.2356, "grad_norm": "3.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.734e-01", "anc_loss": "8.477e-01", "dlm_acc": "5.714e-01", "anc_acc": "5.419e-01", "epoch": 0.07338} {"step": 36695, "loss": 1.1639, "grad_norm": "3.179e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.844e-01", "anc_loss": "6.246e-01", "dlm_acc": "5.669e-01", "anc_acc": "5.378e-01", "epoch": 0.07339} {"step": 36700, "loss": 1.031, "grad_norm": "2.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.531e-01", "anc_loss": "5.852e-01", "dlm_acc": "5.837e-01", "anc_acc": "5.604e-01", "epoch": 0.0734} {"step": 36705, "loss": 1.112, "grad_norm": "3.157e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.508e-01", "anc_loss": "1.036e+00", "dlm_acc": "5.757e-01", "anc_acc": "5.490e-01", "epoch": 0.07341} {"step": 36710, "loss": 0.8786, "grad_norm": "3.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.047e-01", "anc_loss": "8.641e-01", "dlm_acc": "5.656e-01", "anc_acc": "5.415e-01", "epoch": 0.07342} {"step": 36715, "loss": 1.2868, "grad_norm": "6.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.391e-01", "anc_loss": "1.088e+00", "dlm_acc": "6.773e-01", "anc_acc": "6.365e-01", "epoch": 0.07343} {"step": 36720, "loss": 1.008, "grad_norm": "3.059e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.570e-01", "anc_loss": "7.023e-01", "dlm_acc": "6.495e-01", "anc_acc": "6.351e-01", "epoch": 0.07344} {"step": 36725, "loss": 1.1769, "grad_norm": "4.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.609e-01", "anc_loss": "6.660e-01", "dlm_acc": "5.389e-01", "anc_acc": "5.373e-01", "epoch": 0.07345} {"step": 36730, "loss": 0.7396, "grad_norm": "1.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.307e-01", "anc_loss": "5.367e-01", "dlm_acc": "6.273e-01", "anc_acc": "6.234e-01", "epoch": 0.07346} {"step": 36735, "loss": 1.27, "grad_norm": "2.984e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.901e-01", "anc_acc": "5.621e-01", "epoch": 0.07347} {"step": 36740, "loss": 1.1044, "grad_norm": "4.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.418e-01", "anc_loss": "7.035e-01", "dlm_acc": "6.504e-01", "anc_acc": "6.248e-01", "epoch": 0.07348} {"step": 36745, "loss": 1.8514, "grad_norm": "3.366e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.523e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.393e-01", "anc_acc": "5.138e-01", "epoch": 0.07349} {"step": 36750, "loss": 1.131, "grad_norm": "5.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.402e-01", "anc_loss": "8.340e-01", "dlm_acc": "6.895e-01", "anc_acc": "6.584e-01", "epoch": 0.0735} {"step": 36755, "loss": 1.364, "grad_norm": "4.737e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.943e-01", "anc_loss": "1.001e+00", "dlm_acc": "6.933e-01", "anc_acc": "6.647e-01", "epoch": 0.07351} {"step": 36760, "loss": 1.3093, "grad_norm": "5.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.642e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.304e-01", "anc_acc": "6.090e-01", "epoch": 0.07352} {"step": 36765, "loss": 0.7245, "grad_norm": "3.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.559e-01", "anc_loss": "2.022e-01", "dlm_acc": "9.039e-01", "anc_acc": "8.841e-01", "epoch": 0.07353} {"step": 36770, "loss": 1.1852, "grad_norm": "5.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.256e-01", "anc_acc": "4.868e-01", "epoch": 0.07354} {"step": 36775, "loss": 1.0249, "grad_norm": "4.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.469e-01", "anc_loss": "9.617e-01", "dlm_acc": "6.187e-01", "anc_acc": "5.728e-01", "epoch": 0.07355} {"step": 36780, "loss": 1.0934, "grad_norm": "3.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.848e-01", "anc_loss": "8.824e-01", "dlm_acc": "6.583e-01", "anc_acc": "6.259e-01", "epoch": 0.07356} {"step": 36785, "loss": 0.7068, "grad_norm": "2.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.841e-01", "anc_loss": "3.619e-01", "dlm_acc": "8.280e-01", "anc_acc": "7.795e-01", "epoch": 0.07357} {"step": 36790, "loss": 0.6891, "grad_norm": "2.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.594e-01", "anc_loss": "7.631e-01", "dlm_acc": "7.376e-01", "anc_acc": "7.051e-01", "epoch": 0.07358} {"step": 36795, "loss": 1.1132, "grad_norm": "4.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.046e+00", "anc_loss": "1.173e+00", "dlm_acc": "6.370e-01", "anc_acc": "6.032e-01", "epoch": 0.07359} {"step": 36800, "loss": 0.8648, "grad_norm": "2.510e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.767e-01", "anc_acc": "5.477e-01", "epoch": 0.0736} {"step": 36805, "loss": 0.737, "grad_norm": "4.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.781e-01", "anc_loss": "1.069e+00", "dlm_acc": "6.527e-01", "anc_acc": "5.982e-01", "epoch": 0.07361} {"step": 36810, "loss": 1.347, "grad_norm": "4.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.181e+00", "anc_loss": "2.211e+00", "dlm_acc": "2.562e-01", "anc_acc": "2.506e-01", "epoch": 0.07362} {"step": 36815, "loss": 0.7383, "grad_norm": "1.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.137e-01", "anc_loss": "7.684e-01", "dlm_acc": "5.846e-01", "anc_acc": "5.691e-01", "epoch": 0.07363} {"step": 36820, "loss": 0.8119, "grad_norm": "3.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.031e-01", "anc_loss": "5.250e-01", "dlm_acc": "5.796e-01", "anc_acc": "5.666e-01", "epoch": 0.07364} {"step": 36825, "loss": 0.6824, "grad_norm": "2.031e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.617e-01", "anc_loss": "5.781e-01", "dlm_acc": "5.829e-01", "anc_acc": "5.752e-01", "epoch": 0.07365} {"step": 36830, "loss": 0.6649, "grad_norm": "1.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.195e-01", "anc_loss": "5.352e-01", "dlm_acc": "5.838e-01", "anc_acc": "5.778e-01", "epoch": 0.07366} {"step": 36835, "loss": 0.6089, "grad_norm": "2.196e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.391e-01", "anc_loss": "5.559e-01", "dlm_acc": "5.872e-01", "anc_acc": "5.813e-01", "epoch": 0.07367} {"step": 36840, "loss": 0.4981, "grad_norm": "1.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.484e-01", "anc_loss": "4.758e-01", "dlm_acc": "6.592e-01", "anc_acc": "6.457e-01", "epoch": 0.07368} {"step": 36845, "loss": 1.036, "grad_norm": "3.160e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.279e+00", "dlm_acc": "6.051e-01", "anc_acc": "5.806e-01", "epoch": 0.07369} {"step": 36850, "loss": 1.5085, "grad_norm": "5.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.616e+00", "anc_loss": "1.727e+00", "dlm_acc": "5.325e-01", "anc_acc": "5.042e-01", "epoch": 0.0737} {"step": 36855, "loss": 1.0984, "grad_norm": "2.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.092e+00", "dlm_acc": "5.947e-01", "anc_acc": "5.684e-01", "epoch": 0.07371} {"step": 36860, "loss": 1.3319, "grad_norm": "2.085e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.121e+00", "dlm_acc": "6.233e-01", "anc_acc": "5.948e-01", "epoch": 0.07372} {"step": 36865, "loss": 1.1597, "grad_norm": "5.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.726e-01", "anc_acc": "5.337e-01", "epoch": 0.07373} {"step": 36870, "loss": 1.0681, "grad_norm": "3.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.019e+00", "anc_loss": "1.092e+00", "dlm_acc": "5.595e-01", "anc_acc": "5.427e-01", "epoch": 0.07374} {"step": 36875, "loss": 1.2117, "grad_norm": "3.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.620e+00", "dlm_acc": "5.303e-01", "anc_acc": "4.957e-01", "epoch": 0.07375} {"step": 36880, "loss": 1.0115, "grad_norm": "4.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.124e+00", "dlm_acc": "6.365e-01", "anc_acc": "6.123e-01", "epoch": 0.07376} {"step": 36885, "loss": 1.4237, "grad_norm": "4.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.795e+00", "anc_loss": "1.920e+00", "dlm_acc": "4.524e-01", "anc_acc": "4.285e-01", "epoch": 0.07377} {"step": 36890, "loss": 1.1235, "grad_norm": "4.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.378e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.526e-01", "anc_acc": "5.239e-01", "epoch": 0.07378} {"step": 36895, "loss": 1.1795, "grad_norm": "2.119e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.876e-01", "anc_acc": "5.409e-01", "epoch": 0.07379} {"step": 36900, "loss": 1.2769, "grad_norm": "4.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.733e+00", "dlm_acc": "4.760e-01", "anc_acc": "4.458e-01", "epoch": 0.0738} {"step": 36905, "loss": 1.2251, "grad_norm": "3.573e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.746e+00", "anc_loss": "1.859e+00", "dlm_acc": "4.613e-01", "anc_acc": "4.376e-01", "epoch": 0.07381} {"step": 36910, "loss": 1.3745, "grad_norm": "4.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.641e+00", "anc_loss": "1.803e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.752e-01", "epoch": 0.07382} {"step": 36915, "loss": 1.3745, "grad_norm": "8.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.756e+00", "anc_loss": "1.913e+00", "dlm_acc": "4.517e-01", "anc_acc": "4.175e-01", "epoch": 0.07383} {"step": 36920, "loss": 1.0931, "grad_norm": "3.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.297e+00", "dlm_acc": "5.985e-01", "anc_acc": "5.560e-01", "epoch": 0.07384} {"step": 36925, "loss": 1.3004, "grad_norm": "2.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.592e+00", "anc_loss": "1.717e+00", "dlm_acc": "4.943e-01", "anc_acc": "4.682e-01", "epoch": 0.07385} {"step": 36930, "loss": 1.091, "grad_norm": "3.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.284e+00", "dlm_acc": "6.169e-01", "anc_acc": "5.150e-01", "epoch": 0.07386} {"step": 36935, "loss": 1.0729, "grad_norm": "2.485e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.531e-01", "anc_loss": "1.014e+00", "dlm_acc": "6.905e-01", "anc_acc": "6.335e-01", "epoch": 0.07387} {"step": 36940, "loss": 1.0684, "grad_norm": "4.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.723e-01", "anc_loss": "9.125e-01", "dlm_acc": "7.071e-01", "anc_acc": "6.601e-01", "epoch": 0.07388} {"step": 36945, "loss": 0.8496, "grad_norm": "2.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.932e-01", "anc_loss": "9.797e-01", "dlm_acc": "6.612e-01", "anc_acc": "6.410e-01", "epoch": 0.07389} {"step": 36950, "loss": 1.0599, "grad_norm": "3.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.468e+00", "anc_loss": "1.516e+00", "dlm_acc": "4.422e-01", "anc_acc": "4.273e-01", "epoch": 0.0739} {"step": 36955, "loss": 1.529, "grad_norm": "2.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.670e+00", "anc_loss": "2.711e+00", "dlm_acc": "8.700e-02", "anc_acc": "7.823e-02", "epoch": 0.07391} {"step": 36960, "loss": 1.2307, "grad_norm": "3.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.839e+00", "anc_loss": "1.942e+00", "dlm_acc": "4.005e-01", "anc_acc": "3.810e-01", "epoch": 0.07392} {"step": 36965, "loss": 1.0347, "grad_norm": "2.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.453e+00", "dlm_acc": "5.673e-01", "anc_acc": "5.350e-01", "epoch": 0.07393} {"step": 36970, "loss": 1.3496, "grad_norm": "3.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.442e-01", "anc_acc": "5.143e-01", "epoch": 0.07394} {"step": 36975, "loss": 0.9773, "grad_norm": "3.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.062e-01", "anc_loss": "9.883e-01", "dlm_acc": "4.991e-01", "anc_acc": "4.679e-01", "epoch": 0.07395} {"step": 36980, "loss": 0.9439, "grad_norm": "2.963e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.686e-01", "anc_loss": "1.082e+00", "dlm_acc": "6.460e-01", "anc_acc": "6.189e-01", "epoch": 0.07396} {"step": 36985, "loss": 1.1129, "grad_norm": "5.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.201e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.873e-01", "anc_acc": "5.598e-01", "epoch": 0.07397} {"step": 36990, "loss": 1.156, "grad_norm": "2.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.146e+00", "dlm_acc": "6.447e-01", "anc_acc": "6.152e-01", "epoch": 0.07398} {"step": 36995, "loss": 1.2867, "grad_norm": "3.540e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.490e+00", "dlm_acc": "5.467e-01", "anc_acc": "5.217e-01", "epoch": 0.07399} {"step": 37000, "loss": 1.1917, "grad_norm": "3.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.712e+00", "dlm_acc": "5.362e-01", "anc_acc": "5.106e-01", "epoch": 0.074} {"step": 37005, "loss": 1.2975, "grad_norm": "4.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.697e+00", "anc_loss": "1.852e+00", "dlm_acc": "4.729e-01", "anc_acc": "4.383e-01", "epoch": 0.07401} {"step": 37010, "loss": 0.91, "grad_norm": "3.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.306e+00", "dlm_acc": "5.598e-01", "anc_acc": "5.337e-01", "epoch": 0.07402} {"step": 37015, "loss": 0.9534, "grad_norm": "2.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.469e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.144e-01", "epoch": 0.07403} {"step": 37020, "loss": 1.2673, "grad_norm": "5.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.431e+00", "anc_loss": "1.572e+00", "dlm_acc": "5.466e-01", "anc_acc": "5.150e-01", "epoch": 0.07404} {"step": 37025, "loss": 1.2732, "grad_norm": "2.605e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.493e-01", "anc_acc": "5.195e-01", "epoch": 0.07405} {"step": 37030, "loss": 1.3491, "grad_norm": "3.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.449e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.122e-01", "epoch": 0.07406} {"step": 37035, "loss": 1.5121, "grad_norm": "6.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.681e+00", "anc_loss": "1.816e+00", "dlm_acc": "4.909e-01", "anc_acc": "4.649e-01", "epoch": 0.07407} {"step": 37040, "loss": 1.1586, "grad_norm": "4.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.214e+00", "anc_loss": "1.343e+00", "dlm_acc": "5.735e-01", "anc_acc": "5.442e-01", "epoch": 0.07408} {"step": 37045, "loss": 1.2825, "grad_norm": "3.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.370e+00", "anc_loss": "1.501e+00", "dlm_acc": "5.526e-01", "anc_acc": "5.212e-01", "epoch": 0.07409} {"step": 37050, "loss": 1.4361, "grad_norm": "3.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.510e+00", "dlm_acc": "5.177e-01", "anc_acc": "4.898e-01", "epoch": 0.0741} {"step": 37055, "loss": 1.4666, "grad_norm": "3.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.484e+00", "anc_loss": "1.617e+00", "dlm_acc": "5.371e-01", "anc_acc": "5.078e-01", "epoch": 0.07411} {"step": 37060, "loss": 1.2272, "grad_norm": "3.749e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.260e+00", "anc_loss": "1.376e+00", "dlm_acc": "5.794e-01", "anc_acc": "5.538e-01", "epoch": 0.07412} {"step": 37065, "loss": 0.8962, "grad_norm": "3.971e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.500e-01", "anc_loss": "9.492e-01", "dlm_acc": "6.597e-01", "anc_acc": "6.303e-01", "epoch": 0.07413} {"step": 37070, "loss": 1.2568, "grad_norm": "3.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.478e+00", "dlm_acc": "5.279e-01", "anc_acc": "5.060e-01", "epoch": 0.07414} {"step": 37075, "loss": 1.4431, "grad_norm": "3.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.434e+00", "anc_loss": "1.559e+00", "dlm_acc": "5.291e-01", "anc_acc": "5.007e-01", "epoch": 0.07415} {"step": 37080, "loss": 1.6609, "grad_norm": "4.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.680e+00", "anc_loss": "1.783e+00", "dlm_acc": "4.833e-01", "anc_acc": "4.593e-01", "epoch": 0.07416} {"step": 37085, "loss": 1.6406, "grad_norm": "3.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.590e+00", "anc_loss": "1.713e+00", "dlm_acc": "5.135e-01", "anc_acc": "4.872e-01", "epoch": 0.07417} {"step": 37090, "loss": 1.2896, "grad_norm": "2.227e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.295e+00", "dlm_acc": "5.819e-01", "anc_acc": "5.526e-01", "epoch": 0.07418} {"step": 37095, "loss": 1.1734, "grad_norm": "1.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.120e+00", "dlm_acc": "6.415e-01", "anc_acc": "6.106e-01", "epoch": 0.07419} {"step": 37100, "loss": 1.1677, "grad_norm": "1.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.246e+00", "dlm_acc": "5.807e-01", "anc_acc": "5.532e-01", "epoch": 0.0742} {"step": 37105, "loss": 0.9601, "grad_norm": "2.038e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.145e+00", "dlm_acc": "5.857e-01", "anc_acc": "5.552e-01", "epoch": 0.07421} {"step": 37110, "loss": 1.1777, "grad_norm": "3.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.501e-01", "anc_loss": "6.095e-01", "dlm_acc": "8.255e-01", "anc_acc": "8.132e-01", "epoch": 0.07422} {"step": 37115, "loss": 1.126, "grad_norm": "2.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.539e-01", "anc_loss": "9.672e-01", "dlm_acc": "6.833e-01", "anc_acc": "6.552e-01", "epoch": 0.07423} {"step": 37120, "loss": 1.451, "grad_norm": "3.099e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.523e+00", "anc_loss": "1.639e+00", "dlm_acc": "5.177e-01", "anc_acc": "4.911e-01", "epoch": 0.07424} {"step": 37125, "loss": 1.125, "grad_norm": "3.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.238e+00", "dlm_acc": "5.978e-01", "anc_acc": "5.681e-01", "epoch": 0.07425} {"step": 37130, "loss": 0.8745, "grad_norm": "3.085e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.084e+00", "dlm_acc": "3.220e-01", "anc_acc": "3.139e-01", "epoch": 0.07426} {"step": 37135, "loss": 1.5046, "grad_norm": "3.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.422e+00", "anc_loss": "1.553e+00", "dlm_acc": "5.299e-01", "anc_acc": "4.997e-01", "epoch": 0.07427} {"step": 37140, "loss": 1.1893, "grad_norm": "4.327e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.602e+00", "dlm_acc": "5.179e-01", "anc_acc": "4.956e-01", "epoch": 0.07428} {"step": 37145, "loss": 1.2553, "grad_norm": "4.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.400e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.309e-01", "anc_acc": "5.064e-01", "epoch": 0.07429} {"step": 37150, "loss": 0.9241, "grad_norm": "3.462e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.570e-01", "anc_loss": "1.059e+00", "dlm_acc": "6.247e-01", "anc_acc": "5.956e-01", "epoch": 0.0743} {"step": 37155, "loss": 1.0884, "grad_norm": "2.167e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.239e+00", "dlm_acc": "5.703e-01", "anc_acc": "5.403e-01", "epoch": 0.07431} {"step": 37160, "loss": 1.0586, "grad_norm": "2.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.514e+00", "anc_loss": "1.633e+00", "dlm_acc": "4.691e-01", "anc_acc": "4.427e-01", "epoch": 0.07432} {"step": 37165, "loss": 1.2389, "grad_norm": "4.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.343e+00", "dlm_acc": "5.918e-01", "anc_acc": "5.607e-01", "epoch": 0.07433} {"step": 37170, "loss": 1.272, "grad_norm": "5.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.372e-01", "epoch": 0.07434} {"step": 37175, "loss": 0.7934, "grad_norm": "6.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.909e-01", "anc_loss": "6.538e-01", "dlm_acc": "7.331e-01", "anc_acc": "7.137e-01", "epoch": 0.07435} {"step": 37180, "loss": 1.5218, "grad_norm": "4.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.254e+00", "dlm_acc": "6.339e-01", "anc_acc": "6.106e-01", "epoch": 0.07436} {"step": 37185, "loss": 1.1739, "grad_norm": "6.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.719e-01", "anc_acc": "5.419e-01", "epoch": 0.07437} {"step": 37190, "loss": 0.8786, "grad_norm": "4.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.406e-01", "anc_loss": "7.809e-01", "dlm_acc": "5.494e-01", "anc_acc": "5.363e-01", "epoch": 0.07438} {"step": 37195, "loss": 1.2377, "grad_norm": "4.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.148e-01", "anc_loss": "6.328e-01", "dlm_acc": "5.389e-01", "anc_acc": "5.286e-01", "epoch": 0.07439} {"step": 37200, "loss": 1.0574, "grad_norm": "2.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.195e-01", "anc_loss": "6.422e-01", "dlm_acc": "5.193e-01", "anc_acc": "5.093e-01", "epoch": 0.0744} {"step": 37205, "loss": 0.8823, "grad_norm": "4.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.635e-01", "anc_loss": "6.002e-01", "dlm_acc": "6.784e-01", "anc_acc": "6.646e-01", "epoch": 0.07441} {"step": 37210, "loss": 0.9811, "grad_norm": "2.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.220e+00", "dlm_acc": "5.955e-01", "anc_acc": "5.673e-01", "epoch": 0.07442} {"step": 37215, "loss": 1.1893, "grad_norm": "3.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.480e+00", "anc_loss": "1.609e+00", "dlm_acc": "5.256e-01", "anc_acc": "4.989e-01", "epoch": 0.07443} {"step": 37220, "loss": 0.7379, "grad_norm": "2.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.740e-01", "anc_loss": "4.104e-01", "dlm_acc": "8.798e-01", "anc_acc": "8.680e-01", "epoch": 0.07444} {"step": 37225, "loss": 1.1398, "grad_norm": "9.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.285e+00", "dlm_acc": "6.056e-01", "anc_acc": "5.811e-01", "epoch": 0.07445} {"step": 37230, "loss": 0.9956, "grad_norm": "4.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.437e-01", "anc_loss": "6.217e-01", "dlm_acc": "7.947e-01", "anc_acc": "7.667e-01", "epoch": 0.07446} {"step": 37235, "loss": 1.1353, "grad_norm": "6.822e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.106e+00", "dlm_acc": "3.335e-01", "anc_acc": "3.286e-01", "epoch": 0.07447} {"step": 37240, "loss": 0.9732, "grad_norm": "2.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.072e+00", "anc_loss": "1.072e+00", "dlm_acc": "1.002e-01", "anc_acc": "9.884e-02", "epoch": 0.07448} {"step": 37245, "loss": 1.1804, "grad_norm": "5.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.183e+00", "anc_loss": "1.181e+00", "dlm_acc": "1.004e-01", "anc_acc": "1.004e-01", "epoch": 0.07449} {"step": 37250, "loss": 1.1024, "grad_norm": "3.191e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.099e+00", "anc_loss": "1.104e+00", "dlm_acc": "1.511e-01", "anc_acc": "1.451e-01", "epoch": 0.0745} {"step": 37255, "loss": 0.9294, "grad_norm": "2.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.965e-01", "anc_loss": "6.527e-01", "dlm_acc": "6.946e-01", "anc_acc": "6.753e-01", "epoch": 0.07451} {"step": 37260, "loss": 1.0763, "grad_norm": "3.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.633e-01", "anc_loss": "5.251e-01", "dlm_acc": "8.260e-01", "anc_acc": "8.039e-01", "epoch": 0.07452} {"step": 37265, "loss": 1.3983, "grad_norm": "3.566e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.979e-01", "anc_loss": "2.043e-01", "dlm_acc": "8.868e-01", "anc_acc": "8.849e-01", "epoch": 0.07453} {"step": 37270, "loss": 0.8521, "grad_norm": "3.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.129e-01", "anc_loss": "4.268e-01", "dlm_acc": "7.308e-01", "anc_acc": "7.272e-01", "epoch": 0.07454} {"step": 37275, "loss": 1.8299, "grad_norm": "4.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.215e+00", "dlm_acc": "3.912e-01", "anc_acc": "3.830e-01", "epoch": 0.07455} {"step": 37280, "loss": 1.3298, "grad_norm": "3.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.945e-01", "anc_loss": "9.516e-01", "dlm_acc": "5.706e-01", "anc_acc": "5.528e-01", "epoch": 0.07456} {"step": 37285, "loss": 1.2399, "grad_norm": "2.481e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.571e-01", "anc_loss": "7.289e-01", "dlm_acc": "7.433e-01", "anc_acc": "7.169e-01", "epoch": 0.07457} {"step": 37290, "loss": 1.0121, "grad_norm": "3.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.930e-01", "anc_loss": "8.813e-01", "dlm_acc": "7.465e-01", "anc_acc": "7.237e-01", "epoch": 0.07458} {"step": 37295, "loss": 0.8329, "grad_norm": "3.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.223e+00", "dlm_acc": "6.143e-01", "anc_acc": "5.915e-01", "epoch": 0.07459} {"step": 37300, "loss": 1.0386, "grad_norm": "2.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.484e-01", "anc_loss": "6.918e-01", "dlm_acc": "6.559e-01", "anc_acc": "6.424e-01", "epoch": 0.0746} {"step": 37305, "loss": 1.0518, "grad_norm": "2.975e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.023e-01", "anc_loss": "9.898e-01", "dlm_acc": "6.327e-01", "anc_acc": "6.030e-01", "epoch": 0.07461} {"step": 37310, "loss": 1.1216, "grad_norm": "2.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.506e+00", "dlm_acc": "5.626e-01", "anc_acc": "5.348e-01", "epoch": 0.07462} {"step": 37315, "loss": 1.2375, "grad_norm": "2.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.234e+00", "dlm_acc": "6.178e-01", "anc_acc": "5.823e-01", "epoch": 0.07463} {"step": 37320, "loss": 1.0844, "grad_norm": "1.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.296e-01", "anc_loss": "9.082e-01", "dlm_acc": "6.989e-01", "anc_acc": "6.747e-01", "epoch": 0.07464} {"step": 37325, "loss": 1.0067, "grad_norm": "2.156e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.844e-01", "anc_loss": "4.391e-01", "dlm_acc": "8.097e-01", "anc_acc": "7.911e-01", "epoch": 0.07465} {"step": 37330, "loss": 1.4248, "grad_norm": "3.609e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.106e+00", "anc_loss": "1.213e+00", "dlm_acc": "6.073e-01", "anc_acc": "5.819e-01", "epoch": 0.07466} {"step": 37335, "loss": 1.4193, "grad_norm": "3.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.455e-01", "anc_loss": "5.083e-01", "dlm_acc": "8.231e-01", "anc_acc": "8.046e-01", "epoch": 0.07467} {"step": 37340, "loss": 1.1094, "grad_norm": "2.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.938e-01", "anc_loss": "8.628e-01", "dlm_acc": "7.302e-01", "anc_acc": "7.102e-01", "epoch": 0.07468} {"step": 37345, "loss": 1.3625, "grad_norm": "5.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.310e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.328e-01", "anc_acc": "5.023e-01", "epoch": 0.07469} {"step": 37350, "loss": 1.3619, "grad_norm": "5.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.407e+00", "dlm_acc": "4.156e-01", "anc_acc": "4.002e-01", "epoch": 0.0747} {"step": 37355, "loss": 1.4922, "grad_norm": "6.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.535e-01", "anc_loss": "9.332e-01", "dlm_acc": "6.311e-01", "anc_acc": "6.047e-01", "epoch": 0.07471} {"step": 37360, "loss": 1.2126, "grad_norm": "4.438e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.820e-01", "anc_loss": "8.730e-01", "dlm_acc": "6.916e-01", "anc_acc": "6.683e-01", "epoch": 0.07472} {"step": 37365, "loss": 1.2636, "grad_norm": "2.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.073e+00", "dlm_acc": "5.483e-01", "anc_acc": "5.307e-01", "epoch": 0.07473} {"step": 37370, "loss": 1.1433, "grad_norm": "5.191e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.006e-01", "anc_loss": "1.012e+00", "dlm_acc": "6.904e-01", "anc_acc": "6.618e-01", "epoch": 0.07474} {"step": 37375, "loss": 0.8221, "grad_norm": "6.709e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.739e-01", "anc_loss": "5.287e-01", "dlm_acc": "7.926e-01", "anc_acc": "7.750e-01", "epoch": 0.07475} {"step": 37380, "loss": 1.1631, "grad_norm": "3.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.129e-01", "anc_loss": "8.896e-01", "dlm_acc": "7.013e-01", "anc_acc": "6.789e-01", "epoch": 0.07476} {"step": 37385, "loss": 1.0999, "grad_norm": "2.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.375e-01", "anc_loss": "7.594e-01", "dlm_acc": "5.976e-01", "anc_acc": "5.925e-01", "epoch": 0.07477} {"step": 37390, "loss": 0.9996, "grad_norm": "1.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.684e-01", "anc_loss": "7.973e-01", "dlm_acc": "6.036e-01", "anc_acc": "5.944e-01", "epoch": 0.07478} {"step": 37395, "loss": 1.2992, "grad_norm": "2.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.554e+00", "anc_loss": "1.657e+00", "dlm_acc": "4.897e-01", "anc_acc": "4.664e-01", "epoch": 0.07479} {"step": 37400, "loss": 0.6379, "grad_norm": "4.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.984e-01", "anc_loss": "3.256e-01", "dlm_acc": "7.991e-01", "anc_acc": "7.854e-01", "epoch": 0.0748} {"step": 37405, "loss": 1.1061, "grad_norm": "3.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.617e-01", "anc_loss": "7.258e-01", "dlm_acc": "6.591e-01", "anc_acc": "6.371e-01", "epoch": 0.07481} {"step": 37410, "loss": 1.1997, "grad_norm": "3.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.945e-01", "anc_loss": "9.547e-01", "dlm_acc": "5.924e-01", "anc_acc": "5.745e-01", "epoch": 0.07482} {"step": 37415, "loss": 1.0747, "grad_norm": "5.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.418e-01", "anc_loss": "7.410e-01", "dlm_acc": "7.404e-01", "anc_acc": "7.113e-01", "epoch": 0.07483} {"step": 37420, "loss": 1.0279, "grad_norm": "4.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.199e-01", "anc_loss": "8.078e-01", "dlm_acc": "7.733e-01", "anc_acc": "7.208e-01", "epoch": 0.07484} {"step": 37425, "loss": 1.1248, "grad_norm": "3.223e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.227e-01", "anc_loss": "7.541e-01", "dlm_acc": "7.854e-01", "anc_acc": "7.496e-01", "epoch": 0.07485} {"step": 37430, "loss": 1.408, "grad_norm": "2.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.313e+00", "anc_loss": "1.431e+00", "dlm_acc": "5.719e-01", "anc_acc": "5.446e-01", "epoch": 0.07486} {"step": 37435, "loss": 1.3293, "grad_norm": "3.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.261e+00", "dlm_acc": "5.801e-01", "anc_acc": "5.545e-01", "epoch": 0.07487} {"step": 37440, "loss": 1.3127, "grad_norm": "3.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.579e-01", "anc_loss": "8.537e-01", "dlm_acc": "7.230e-01", "anc_acc": "6.939e-01", "epoch": 0.07488} {"step": 37445, "loss": 1.5332, "grad_norm": "5.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.901e-01", "anc_acc": "5.594e-01", "epoch": 0.07489} {"step": 37450, "loss": 1.1481, "grad_norm": "3.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.283e+00", "anc_loss": "1.412e+00", "dlm_acc": "5.990e-01", "anc_acc": "5.690e-01", "epoch": 0.0749} {"step": 37455, "loss": 1.3949, "grad_norm": "7.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.373e+00", "dlm_acc": "6.009e-01", "anc_acc": "5.721e-01", "epoch": 0.07491} {"step": 37460, "loss": 1.2973, "grad_norm": "4.172e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.114e+00", "dlm_acc": "6.248e-01", "anc_acc": "5.943e-01", "epoch": 0.07492} {"step": 37465, "loss": 1.1415, "grad_norm": "2.905e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.230e+00", "dlm_acc": "6.067e-01", "anc_acc": "5.762e-01", "epoch": 0.07493} {"step": 37470, "loss": 1.3567, "grad_norm": "3.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.669e-01", "anc_loss": "1.082e+00", "dlm_acc": "6.558e-01", "anc_acc": "6.249e-01", "epoch": 0.07494} {"step": 37475, "loss": 1.477, "grad_norm": "3.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.531e+00", "anc_loss": "1.672e+00", "dlm_acc": "5.296e-01", "anc_acc": "5.003e-01", "epoch": 0.07495} {"step": 37480, "loss": 1.2392, "grad_norm": "1.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.349e+00", "dlm_acc": "5.818e-01", "anc_acc": "5.534e-01", "epoch": 0.07496} {"step": 37485, "loss": 0.9027, "grad_norm": "1.486e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.648e-01", "anc_acc": "5.352e-01", "epoch": 0.07497} {"step": 37490, "loss": 0.746, "grad_norm": "4.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.676e-01", "anc_loss": "1.056e+00", "dlm_acc": "6.504e-01", "anc_acc": "6.263e-01", "epoch": 0.07498} {"step": 37495, "loss": 1.4241, "grad_norm": "3.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.614e+00", "dlm_acc": "5.324e-01", "anc_acc": "5.095e-01", "epoch": 0.07499} {"step": 37500, "loss": 1.0966, "grad_norm": "4.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.606e+00", "dlm_acc": "5.323e-01", "anc_acc": "5.001e-01", "epoch": 0.075} {"step": 37505, "loss": 1.0041, "grad_norm": "3.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.959e-01", "anc_acc": "5.665e-01", "epoch": 0.07501} {"step": 37510, "loss": 0.9194, "grad_norm": "5.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e+00", "anc_loss": "1.249e+00", "dlm_acc": "5.680e-01", "anc_acc": "5.407e-01", "epoch": 0.07502} {"step": 37515, "loss": 1.2037, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.326e-01", "anc_acc": "5.032e-01", "epoch": 0.07503} {"step": 37520, "loss": 1.6334, "grad_norm": "4.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.249e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.633e-01", "anc_acc": "5.319e-01", "epoch": 0.07504} {"step": 37525, "loss": 1.2769, "grad_norm": "3.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.550e+00", "dlm_acc": "5.505e-01", "anc_acc": "5.058e-01", "epoch": 0.07505} {"step": 37530, "loss": 1.1341, "grad_norm": "4.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.916e-01", "anc_acc": "5.342e-01", "epoch": 0.07506} {"step": 37535, "loss": 1.3865, "grad_norm": "2.869e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.346e+00", "anc_loss": "1.458e+00", "dlm_acc": "5.571e-01", "anc_acc": "5.314e-01", "epoch": 0.07507} {"step": 37540, "loss": 0.9885, "grad_norm": "3.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.305e-01", "anc_loss": "1.030e+00", "dlm_acc": "6.614e-01", "anc_acc": "6.334e-01", "epoch": 0.07508} {"step": 37545, "loss": 0.9758, "grad_norm": "2.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.020e+00", "anc_loss": "1.145e+00", "dlm_acc": "5.997e-01", "anc_acc": "5.627e-01", "epoch": 0.07509} {"step": 37550, "loss": 1.0149, "grad_norm": "2.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.499e-01", "anc_loss": "1.040e+00", "dlm_acc": "6.800e-01", "anc_acc": "6.570e-01", "epoch": 0.0751} {"step": 37555, "loss": 1.0128, "grad_norm": "3.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.010e+00", "anc_loss": "1.144e+00", "dlm_acc": "6.283e-01", "anc_acc": "5.860e-01", "epoch": 0.07511} {"step": 37560, "loss": 0.9035, "grad_norm": "3.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.696e-01", "anc_loss": "7.382e-01", "dlm_acc": "7.693e-01", "anc_acc": "7.508e-01", "epoch": 0.07512} {"step": 37565, "loss": 1.1393, "grad_norm": "4.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.278e-01", "anc_acc": "4.907e-01", "epoch": 0.07513} {"step": 37570, "loss": 1.3019, "grad_norm": "2.741e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.670e+00", "anc_loss": "1.817e+00", "dlm_acc": "3.443e-01", "anc_acc": "3.070e-01", "epoch": 0.07514} {"step": 37575, "loss": 1.6806, "grad_norm": "3.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.934e+00", "anc_loss": "2.034e+00", "dlm_acc": "3.574e-01", "anc_acc": "3.378e-01", "epoch": 0.07515} {"step": 37580, "loss": 1.2612, "grad_norm": "1.531e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.266e-01", "anc_loss": "1.046e+00", "dlm_acc": "6.569e-01", "anc_acc": "6.278e-01", "epoch": 0.07516} {"step": 37585, "loss": 1.379, "grad_norm": "2.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.268e+00", "anc_loss": "1.353e+00", "dlm_acc": "5.385e-01", "anc_acc": "5.189e-01", "epoch": 0.07517} {"step": 37590, "loss": 1.6245, "grad_norm": "4.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.659e+00", "dlm_acc": "4.842e-01", "anc_acc": "4.608e-01", "epoch": 0.07518} {"step": 37595, "loss": 1.6085, "grad_norm": "2.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.755e+00", "anc_loss": "1.837e+00", "dlm_acc": "4.154e-01", "anc_acc": "3.955e-01", "epoch": 0.07519} {"step": 37600, "loss": 1.1844, "grad_norm": "3.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e+00", "anc_loss": "1.235e+00", "dlm_acc": "5.843e-01", "anc_acc": "5.583e-01", "epoch": 0.0752} {"step": 37605, "loss": 0.7958, "grad_norm": "3.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.711e-01", "anc_loss": "9.586e-01", "dlm_acc": "6.675e-01", "anc_acc": "5.990e-01", "epoch": 0.07521} {"step": 37610, "loss": 1.2426, "grad_norm": "3.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.866e+00", "anc_loss": "1.942e+00", "dlm_acc": "3.278e-01", "anc_acc": "3.114e-01", "epoch": 0.07522} {"step": 37615, "loss": 1.3334, "grad_norm": "1.969e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.151e+00", "anc_loss": "1.295e+00", "dlm_acc": "6.121e-01", "anc_acc": "5.768e-01", "epoch": 0.07523} {"step": 37620, "loss": 1.6327, "grad_norm": "6.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.770e+00", "anc_loss": "1.869e+00", "dlm_acc": "4.323e-01", "anc_acc": "4.011e-01", "epoch": 0.07524} {"step": 37625, "loss": 1.5047, "grad_norm": "3.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.417e+00", "anc_loss": "2.442e+00", "dlm_acc": "1.331e-01", "anc_acc": "1.251e-01", "epoch": 0.07525} {"step": 37630, "loss": 1.0316, "grad_norm": "5.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.973e-01", "anc_loss": "4.602e-01", "dlm_acc": "8.064e-01", "anc_acc": "7.967e-01", "epoch": 0.07526} {"step": 37635, "loss": 1.0091, "grad_norm": "1.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.824e-01", "anc_loss": "8.924e-01", "dlm_acc": "6.520e-01", "anc_acc": "6.159e-01", "epoch": 0.07527} {"step": 37640, "loss": 1.3653, "grad_norm": "4.245e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.475e+00", "dlm_acc": "5.352e-01", "anc_acc": "5.018e-01", "epoch": 0.07528} {"step": 37645, "loss": 1.258, "grad_norm": "2.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.438e+00", "anc_loss": "1.560e+00", "dlm_acc": "5.222e-01", "anc_acc": "4.949e-01", "epoch": 0.07529} {"step": 37650, "loss": 0.8182, "grad_norm": "2.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.711e-01", "anc_loss": "1.094e+00", "dlm_acc": "5.857e-01", "anc_acc": "5.502e-01", "epoch": 0.0753} {"step": 37655, "loss": 0.9827, "grad_norm": "2.676e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.196e+00", "dlm_acc": "6.013e-01", "anc_acc": "5.708e-01", "epoch": 0.07531} {"step": 37660, "loss": 1.0726, "grad_norm": "3.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.391e+00", "dlm_acc": "4.892e-01", "anc_acc": "4.636e-01", "epoch": 0.07532} {"step": 37665, "loss": 1.0408, "grad_norm": "3.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.160e+00", "dlm_acc": "5.952e-01", "anc_acc": "5.659e-01", "epoch": 0.07533} {"step": 37670, "loss": 1.032, "grad_norm": "2.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.260e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.616e-01", "anc_acc": "5.365e-01", "epoch": 0.07534} {"step": 37675, "loss": 0.9653, "grad_norm": "2.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.298e-01", "anc_acc": "4.989e-01", "epoch": 0.07535} {"step": 37680, "loss": 1.0449, "grad_norm": "3.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.356e+00", "dlm_acc": "5.679e-01", "anc_acc": "5.396e-01", "epoch": 0.07536} {"step": 37685, "loss": 1.5008, "grad_norm": "5.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.163e+00", "anc_loss": "3.175e+00", "dlm_acc": "2.045e-02", "anc_acc": "2.011e-02", "epoch": 0.07537} {"step": 37690, "loss": 1.7586, "grad_norm": "4.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.994e+00", "anc_loss": "2.997e+00", "dlm_acc": "2.301e-02", "anc_acc": "2.185e-02", "epoch": 0.07538} {"step": 37695, "loss": 1.4193, "grad_norm": "1.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.681e+00", "anc_loss": "2.689e+00", "dlm_acc": "2.269e-02", "anc_acc": "2.271e-02", "epoch": 0.07539} {"step": 37700, "loss": 1.7978, "grad_norm": "2.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.034e+00", "anc_loss": "3.047e+00", "dlm_acc": "2.175e-02", "anc_acc": "2.158e-02", "epoch": 0.0754} {"step": 37705, "loss": 1.5485, "grad_norm": "2.725e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.261e+00", "anc_loss": "2.342e+00", "dlm_acc": "2.821e-01", "anc_acc": "2.671e-01", "epoch": 0.07541} {"step": 37710, "loss": 1.6965, "grad_norm": "3.265e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.894e+00", "anc_loss": "2.005e+00", "dlm_acc": "4.466e-01", "anc_acc": "4.265e-01", "epoch": 0.07542} {"step": 37715, "loss": 1.1283, "grad_norm": "5.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.511e+00", "anc_loss": "1.628e+00", "dlm_acc": "5.252e-01", "anc_acc": "4.986e-01", "epoch": 0.07543} {"step": 37720, "loss": 1.1218, "grad_norm": "9.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.648e+00", "anc_loss": "1.736e+00", "dlm_acc": "4.478e-01", "anc_acc": "4.262e-01", "epoch": 0.07544} {"step": 37725, "loss": 1.3753, "grad_norm": "4.389e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.864e+00", "anc_loss": "1.952e+00", "dlm_acc": "3.891e-01", "anc_acc": "3.722e-01", "epoch": 0.07545} {"step": 37730, "loss": 1.4551, "grad_norm": "3.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.728e+00", "anc_loss": "1.863e+00", "dlm_acc": "4.878e-01", "anc_acc": "4.581e-01", "epoch": 0.07546} {"step": 37735, "loss": 1.6893, "grad_norm": "1.118e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.803e+00", "anc_loss": "1.928e+00", "dlm_acc": "4.584e-01", "anc_acc": "4.334e-01", "epoch": 0.07547} {"step": 37740, "loss": 1.1048, "grad_norm": "2.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.376e+00", "dlm_acc": "5.507e-01", "anc_acc": "5.270e-01", "epoch": 0.07548} {"step": 37745, "loss": 1.0047, "grad_norm": "4.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.339e+00", "anc_loss": "1.486e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.275e-01", "epoch": 0.07549} {"step": 37750, "loss": 1.2189, "grad_norm": "3.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.438e+00", "anc_loss": "1.562e+00", "dlm_acc": "5.241e-01", "anc_acc": "4.948e-01", "epoch": 0.0755} {"step": 37755, "loss": 1.1454, "grad_norm": "2.572e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.500e+00", "anc_loss": "1.619e+00", "dlm_acc": "4.988e-01", "anc_acc": "4.735e-01", "epoch": 0.07551} {"step": 37760, "loss": 1.0229, "grad_norm": "1.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.460e+00", "dlm_acc": "5.261e-01", "anc_acc": "4.994e-01", "epoch": 0.07552} {"step": 37765, "loss": 0.9455, "grad_norm": "4.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.375e+00", "dlm_acc": "4.198e-01", "anc_acc": "4.022e-01", "epoch": 0.07553} {"step": 37770, "loss": 0.7956, "grad_norm": "3.367e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.602e-01", "anc_loss": "8.977e-01", "dlm_acc": "3.697e-01", "anc_acc": "3.574e-01", "epoch": 0.07554} {"step": 37775, "loss": 0.9547, "grad_norm": "2.257e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.883e-01", "anc_loss": "9.258e-01", "dlm_acc": "3.652e-01", "anc_acc": "3.557e-01", "epoch": 0.07555} {"step": 37780, "loss": 1.4119, "grad_norm": "4.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.491e+00", "anc_loss": "1.611e+00", "dlm_acc": "5.194e-01", "anc_acc": "4.941e-01", "epoch": 0.07556} {"step": 37785, "loss": 1.1334, "grad_norm": "4.267e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.658e+00", "anc_loss": "1.698e+00", "dlm_acc": "2.524e-01", "anc_acc": "2.505e-01", "epoch": 0.07557} {"step": 37790, "loss": 1.4689, "grad_norm": "1.085e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.756e+00", "anc_loss": "1.834e+00", "dlm_acc": "3.346e-01", "anc_acc": "3.222e-01", "epoch": 0.07558} {"step": 37795, "loss": 1.4969, "grad_norm": "8.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.196e+00", "anc_loss": "1.341e+00", "dlm_acc": "6.058e-01", "anc_acc": "5.750e-01", "epoch": 0.07559} {"step": 37800, "loss": 1.3585, "grad_norm": "2.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.383e+00", "dlm_acc": "6.016e-01", "anc_acc": "5.702e-01", "epoch": 0.0756} {"step": 37805, "loss": 0.8499, "grad_norm": "3.744e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.133e+00", "dlm_acc": "4.652e-01", "anc_acc": "4.513e-01", "epoch": 0.07561} {"step": 37810, "loss": 1.0944, "grad_norm": "4.685e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.264e+00", "dlm_acc": "4.923e-01", "anc_acc": "4.699e-01", "epoch": 0.07562} {"step": 37815, "loss": 0.894, "grad_norm": "2.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.939e-01", "anc_acc": "5.624e-01", "epoch": 0.07563} {"step": 37820, "loss": 0.917, "grad_norm": "3.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.184e+00", "dlm_acc": "5.466e-01", "anc_acc": "5.215e-01", "epoch": 0.07564} {"step": 37825, "loss": 1.1983, "grad_norm": "3.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.536e+00", "anc_loss": "1.644e+00", "dlm_acc": "4.760e-01", "anc_acc": "4.505e-01", "epoch": 0.07565} {"step": 37830, "loss": 1.1035, "grad_norm": "4.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.472e+00", "dlm_acc": "4.980e-01", "anc_acc": "4.720e-01", "epoch": 0.07566} {"step": 37835, "loss": 1.0401, "grad_norm": "3.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.445e-01", "anc_loss": "9.914e-01", "dlm_acc": "5.019e-01", "anc_acc": "4.843e-01", "epoch": 0.07567} {"step": 37840, "loss": 0.8836, "grad_norm": "6.987e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.922e-01", "anc_loss": "7.195e-01", "dlm_acc": "4.964e-01", "anc_acc": "4.784e-01", "epoch": 0.07568} {"step": 37845, "loss": 0.7145, "grad_norm": "4.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.449e-01", "anc_loss": "6.754e-01", "dlm_acc": "5.208e-01", "anc_acc": "5.002e-01", "epoch": 0.07569} {"step": 37850, "loss": 1.0761, "grad_norm": "7.780e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.133e-01", "anc_loss": "9.844e-01", "dlm_acc": "6.231e-01", "anc_acc": "6.079e-01", "epoch": 0.0757} {"step": 37855, "loss": 0.9393, "grad_norm": "2.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.085e+00", "anc_loss": "1.123e+00", "dlm_acc": "4.057e-01", "anc_acc": "3.944e-01", "epoch": 0.07571} {"step": 37860, "loss": 0.9138, "grad_norm": "3.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.280e+00", "dlm_acc": "3.243e-01", "anc_acc": "3.235e-01", "epoch": 0.07572} {"step": 37865, "loss": 0.9145, "grad_norm": "4.348e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.013e+00", "anc_loss": "1.083e+00", "dlm_acc": "5.057e-01", "anc_acc": "4.873e-01", "epoch": 0.07573} {"step": 37870, "loss": 0.742, "grad_norm": "4.159e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.570e-01", "anc_loss": "7.307e-01", "dlm_acc": "7.207e-01", "anc_acc": "7.034e-01", "epoch": 0.07574} {"step": 37875, "loss": 0.9194, "grad_norm": "3.333e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.273e-01", "anc_loss": "1.016e+00", "dlm_acc": "6.479e-01", "anc_acc": "6.255e-01", "epoch": 0.07575} {"step": 37880, "loss": 1.361, "grad_norm": "6.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.702e+00", "anc_loss": "1.756e+00", "dlm_acc": "2.853e-01", "anc_acc": "2.782e-01", "epoch": 0.07576} {"step": 37885, "loss": 0.9468, "grad_norm": "1.856e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.084e+00", "dlm_acc": "5.915e-01", "anc_acc": "5.718e-01", "epoch": 0.07577} {"step": 37890, "loss": 1.3462, "grad_norm": "2.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.085e+00", "anc_loss": "1.208e+00", "dlm_acc": "6.107e-01", "anc_acc": "5.813e-01", "epoch": 0.07578} {"step": 37895, "loss": 1.1439, "grad_norm": "4.166e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.231e+00", "anc_loss": "1.329e+00", "dlm_acc": "5.833e-01", "anc_acc": "5.589e-01", "epoch": 0.07579} {"step": 37900, "loss": 0.988, "grad_norm": "3.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.258e+00", "dlm_acc": "5.631e-01", "anc_acc": "5.324e-01", "epoch": 0.0758} {"step": 37905, "loss": 1.2146, "grad_norm": "5.908e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.532e+00", "dlm_acc": "5.249e-01", "anc_acc": "4.956e-01", "epoch": 0.07581} {"step": 37910, "loss": 1.0358, "grad_norm": "5.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.458e+00", "dlm_acc": "5.893e-01", "anc_acc": "5.621e-01", "epoch": 0.07582} {"step": 37915, "loss": 1.0955, "grad_norm": "3.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.192e+00", "dlm_acc": "6.045e-01", "anc_acc": "5.782e-01", "epoch": 0.07583} {"step": 37920, "loss": 1.3032, "grad_norm": "3.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.396e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.278e-01", "anc_acc": "4.996e-01", "epoch": 0.07584} {"step": 37925, "loss": 1.1986, "grad_norm": "7.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.448e+00", "dlm_acc": "6.047e-01", "anc_acc": "5.793e-01", "epoch": 0.07585} {"step": 37930, "loss": 0.6576, "grad_norm": "3.306e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.719e-01", "anc_loss": "9.676e-01", "dlm_acc": "6.394e-01", "anc_acc": "6.114e-01", "epoch": 0.07586} {"step": 37935, "loss": 1.0783, "grad_norm": "4.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.118e+00", "anc_loss": "1.216e+00", "dlm_acc": "6.140e-01", "anc_acc": "5.873e-01", "epoch": 0.07587} {"step": 37940, "loss": 1.5185, "grad_norm": "3.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.287e+00", "dlm_acc": "5.466e-01", "anc_acc": "5.259e-01", "epoch": 0.07588} {"step": 37945, "loss": 1.3324, "grad_norm": "4.524e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.119e+00", "anc_loss": "1.238e+00", "dlm_acc": "6.308e-01", "anc_acc": "5.983e-01", "epoch": 0.07589} {"step": 37950, "loss": 0.9213, "grad_norm": "3.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.132e+00", "dlm_acc": "6.481e-01", "anc_acc": "6.139e-01", "epoch": 0.0759} {"step": 37955, "loss": 1.2385, "grad_norm": "2.914e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.656e+00", "dlm_acc": "5.213e-01", "anc_acc": "4.936e-01", "epoch": 0.07591} {"step": 37960, "loss": 1.132, "grad_norm": "1.968e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.551e+00", "anc_loss": "1.672e+00", "dlm_acc": "4.938e-01", "anc_acc": "4.656e-01", "epoch": 0.07592} {"step": 37965, "loss": 1.4683, "grad_norm": "4.166e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.657e+00", "anc_loss": "1.774e+00", "dlm_acc": "5.067e-01", "anc_acc": "4.813e-01", "epoch": 0.07593} {"step": 37970, "loss": 0.8913, "grad_norm": "4.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "1.016e+00", "dlm_acc": "6.249e-01", "anc_acc": "6.005e-01", "epoch": 0.07594} {"step": 37975, "loss": 1.1931, "grad_norm": "4.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.171e-01", "anc_acc": "4.899e-01", "epoch": 0.07595} {"step": 37980, "loss": 1.2394, "grad_norm": "2.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.533e+00", "anc_loss": "1.654e+00", "dlm_acc": "5.203e-01", "anc_acc": "4.907e-01", "epoch": 0.07596} {"step": 37985, "loss": 1.2171, "grad_norm": "2.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.678e+00", "dlm_acc": "4.995e-01", "anc_acc": "4.687e-01", "epoch": 0.07597} {"step": 37990, "loss": 1.2397, "grad_norm": "4.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.961e-01", "anc_acc": "5.680e-01", "epoch": 0.07598} {"step": 37995, "loss": 1.1695, "grad_norm": "1.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.463e+00", "anc_loss": "1.595e+00", "dlm_acc": "5.112e-01", "anc_acc": "4.798e-01", "epoch": 0.07599} {"step": 38000, "loss": 0.7191, "grad_norm": "2.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.547e-01", "anc_loss": "5.079e-01", "dlm_acc": "8.175e-01", "anc_acc": "8.047e-01", "epoch": 0.076} {"step": 38005, "loss": 1.2512, "grad_norm": "3.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.361e+00", "dlm_acc": "6.063e-01", "anc_acc": "5.836e-01", "epoch": 0.07601} {"step": 38010, "loss": 0.9678, "grad_norm": "2.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.018e+00", "anc_loss": "1.137e+00", "dlm_acc": "6.271e-01", "anc_acc": "5.961e-01", "epoch": 0.07602} {"step": 38015, "loss": 0.8451, "grad_norm": "4.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.115e+00", "anc_loss": "1.226e+00", "dlm_acc": "5.439e-01", "anc_acc": "5.174e-01", "epoch": 0.07603} {"step": 38020, "loss": 1.1169, "grad_norm": "4.135e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.792e-01", "anc_acc": "5.502e-01", "epoch": 0.07604} {"step": 38025, "loss": 1.1115, "grad_norm": "4.296e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.706e+00", "anc_loss": "1.845e+00", "dlm_acc": "4.821e-01", "anc_acc": "4.541e-01", "epoch": 0.07605} {"step": 38030, "loss": 1.0561, "grad_norm": "3.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.498e-01", "anc_acc": "5.202e-01", "epoch": 0.07606} {"step": 38035, "loss": 1.0636, "grad_norm": "4.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.884e-01", "anc_acc": "5.583e-01", "epoch": 0.07607} {"step": 38040, "loss": 1.1381, "grad_norm": "3.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.797e-01", "anc_acc": "5.531e-01", "epoch": 0.07608} {"step": 38045, "loss": 1.1704, "grad_norm": "5.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.109e+00", "dlm_acc": "6.391e-01", "anc_acc": "6.133e-01", "epoch": 0.07609} {"step": 38050, "loss": 1.5649, "grad_norm": "1.629e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.630e+00", "anc_loss": "1.766e+00", "dlm_acc": "4.913e-01", "anc_acc": "4.643e-01", "epoch": 0.0761} {"step": 38055, "loss": 1.3235, "grad_norm": "4.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.894e-01", "anc_acc": "5.571e-01", "epoch": 0.07611} {"step": 38060, "loss": 1.3379, "grad_norm": "5.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.498e-01", "anc_loss": "8.373e-01", "dlm_acc": "7.293e-01", "anc_acc": "7.052e-01", "epoch": 0.07612} {"step": 38065, "loss": 1.0555, "grad_norm": "3.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.196e-01", "anc_loss": "9.160e-01", "dlm_acc": "7.126e-01", "anc_acc": "6.927e-01", "epoch": 0.07613} {"step": 38070, "loss": 1.2913, "grad_norm": "3.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.625e-01", "anc_acc": "5.374e-01", "epoch": 0.07614} {"step": 38075, "loss": 1.1784, "grad_norm": "5.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.619e-01", "anc_acc": "5.380e-01", "epoch": 0.07615} {"step": 38080, "loss": 0.9661, "grad_norm": "3.256e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.261e+00", "dlm_acc": "5.761e-01", "anc_acc": "5.487e-01", "epoch": 0.07616} {"step": 38085, "loss": 1.4558, "grad_norm": "2.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.647e+00", "anc_loss": "1.775e+00", "dlm_acc": "4.501e-01", "anc_acc": "4.226e-01", "epoch": 0.07617} {"step": 38090, "loss": 1.2195, "grad_norm": "4.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.697e-01", "anc_acc": "5.448e-01", "epoch": 0.07618} {"step": 38095, "loss": 1.2351, "grad_norm": "3.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.293e+00", "dlm_acc": "5.301e-01", "anc_acc": "5.074e-01", "epoch": 0.07619} {"step": 38100, "loss": 1.1794, "grad_norm": "5.154e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.758e-01", "anc_loss": "9.602e-01", "dlm_acc": "5.781e-01", "anc_acc": "5.540e-01", "epoch": 0.0762} {"step": 38105, "loss": 0.9973, "grad_norm": "8.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.938e-01", "anc_loss": "9.898e-01", "dlm_acc": "6.481e-01", "anc_acc": "6.189e-01", "epoch": 0.07621} {"step": 38110, "loss": 0.7507, "grad_norm": "1.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.281e-01", "anc_loss": "1.042e+00", "dlm_acc": "6.430e-01", "anc_acc": "6.131e-01", "epoch": 0.07622} {"step": 38115, "loss": 1.6502, "grad_norm": "4.312e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.720e+00", "anc_loss": "1.872e+00", "dlm_acc": "4.973e-01", "anc_acc": "4.679e-01", "epoch": 0.07623} {"step": 38120, "loss": 1.5786, "grad_norm": "2.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.634e-01", "anc_acc": "5.350e-01", "epoch": 0.07624} {"step": 38125, "loss": 1.0732, "grad_norm": "2.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.187e+00", "dlm_acc": "6.197e-01", "anc_acc": "5.958e-01", "epoch": 0.07625} {"step": 38130, "loss": 1.056, "grad_norm": "3.249e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.210e+00", "dlm_acc": "6.246e-01", "anc_acc": "5.901e-01", "epoch": 0.07626} {"step": 38135, "loss": 1.3637, "grad_norm": "4.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.418e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.402e-01", "anc_acc": "5.160e-01", "epoch": 0.07627} {"step": 38140, "loss": 1.207, "grad_norm": "2.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.289e-01", "anc_loss": "1.091e+00", "dlm_acc": "6.651e-01", "anc_acc": "6.236e-01", "epoch": 0.07628} {"step": 38145, "loss": 1.0028, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.106e-01", "anc_acc": "4.873e-01", "epoch": 0.07629} {"step": 38150, "loss": 1.2535, "grad_norm": "5.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.637e-01", "anc_loss": "1.067e+00", "dlm_acc": "6.730e-01", "anc_acc": "6.481e-01", "epoch": 0.0763} {"step": 38155, "loss": 1.0249, "grad_norm": "1.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.228e+00", "dlm_acc": "6.015e-01", "anc_acc": "5.698e-01", "epoch": 0.07631} {"step": 38160, "loss": 1.4213, "grad_norm": "3.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.901e-01", "anc_acc": "5.672e-01", "epoch": 0.07632} {"step": 38165, "loss": 0.976, "grad_norm": "3.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.574e-01", "anc_acc": "5.234e-01", "epoch": 0.07633} {"step": 38170, "loss": 1.1079, "grad_norm": "2.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.263e+00", "dlm_acc": "5.904e-01", "anc_acc": "5.627e-01", "epoch": 0.07634} {"step": 38175, "loss": 1.1434, "grad_norm": "5.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.499e-01", "anc_acc": "5.255e-01", "epoch": 0.07635} {"step": 38180, "loss": 1.2466, "grad_norm": "4.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.453e-01", "anc_loss": "1.068e+00", "dlm_acc": "6.664e-01", "anc_acc": "6.364e-01", "epoch": 0.07636} {"step": 38185, "loss": 1.1612, "grad_norm": "4.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.479e+00", "anc_loss": "1.620e+00", "dlm_acc": "5.514e-01", "anc_acc": "5.193e-01", "epoch": 0.07637} {"step": 38190, "loss": 1.072, "grad_norm": "3.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.878e-01", "anc_acc": "5.578e-01", "epoch": 0.07638} {"step": 38195, "loss": 1.2425, "grad_norm": "1.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.314e+00", "dlm_acc": "6.150e-01", "anc_acc": "5.802e-01", "epoch": 0.07639} {"step": 38200, "loss": 1.3016, "grad_norm": "2.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.412e+00", "dlm_acc": "5.788e-01", "anc_acc": "5.479e-01", "epoch": 0.0764} {"step": 38205, "loss": 1.1835, "grad_norm": "2.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.922e-01", "anc_loss": "7.828e-01", "dlm_acc": "7.059e-01", "anc_acc": "6.756e-01", "epoch": 0.07641} {"step": 38210, "loss": 1.2781, "grad_norm": "3.291e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.418e-01", "anc_loss": "1.036e+00", "dlm_acc": "6.724e-01", "anc_acc": "6.437e-01", "epoch": 0.07642} {"step": 38215, "loss": 1.2264, "grad_norm": "3.160e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.324e+00", "dlm_acc": "5.811e-01", "anc_acc": "5.542e-01", "epoch": 0.07643} {"step": 38220, "loss": 1.456, "grad_norm": "3.602e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.384e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.415e-01", "anc_acc": "5.134e-01", "epoch": 0.07644} {"step": 38225, "loss": 1.0667, "grad_norm": "4.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.651e-01", "anc_acc": "5.390e-01", "epoch": 0.07645} {"step": 38230, "loss": 1.0341, "grad_norm": "5.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.653e+00", "anc_loss": "1.770e+00", "dlm_acc": "4.884e-01", "anc_acc": "4.637e-01", "epoch": 0.07646} {"step": 38235, "loss": 1.0821, "grad_norm": "7.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.523e-01", "anc_loss": "1.052e+00", "dlm_acc": "6.616e-01", "anc_acc": "6.341e-01", "epoch": 0.07647} {"step": 38240, "loss": 1.4417, "grad_norm": "3.640e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.335e+00", "anc_loss": "1.464e+00", "dlm_acc": "5.872e-01", "anc_acc": "5.581e-01", "epoch": 0.07648} {"step": 38245, "loss": 0.8683, "grad_norm": "2.362e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.036e+00", "anc_loss": "1.140e+00", "dlm_acc": "6.284e-01", "anc_acc": "6.019e-01", "epoch": 0.07649} {"step": 38250, "loss": 1.1114, "grad_norm": "2.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.467e+00", "anc_loss": "1.569e+00", "dlm_acc": "5.020e-01", "anc_acc": "4.766e-01", "epoch": 0.0765} {"step": 38255, "loss": 1.263, "grad_norm": "2.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.885e-01", "anc_acc": "5.499e-01", "epoch": 0.07651} {"step": 38260, "loss": 1.0513, "grad_norm": "3.401e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.803e-01", "anc_acc": "5.528e-01", "epoch": 0.07652} {"step": 38265, "loss": 1.6365, "grad_norm": "6.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.633e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.194e-01", "epoch": 0.07653} {"step": 38270, "loss": 1.4175, "grad_norm": "3.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.310e+00", "dlm_acc": "5.733e-01", "anc_acc": "5.440e-01", "epoch": 0.07654} {"step": 38275, "loss": 1.2857, "grad_norm": "2.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.590e+00", "dlm_acc": "5.143e-01", "anc_acc": "4.877e-01", "epoch": 0.07655} {"step": 38280, "loss": 1.1566, "grad_norm": "2.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.539e-01", "anc_loss": "9.555e-01", "dlm_acc": "6.748e-01", "anc_acc": "6.471e-01", "epoch": 0.07656} {"step": 38285, "loss": 1.3183, "grad_norm": "1.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.346e+00", "dlm_acc": "6.085e-01", "anc_acc": "5.783e-01", "epoch": 0.07657} {"step": 38290, "loss": 1.2476, "grad_norm": "3.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.801e-01", "anc_acc": "5.487e-01", "epoch": 0.07658} {"step": 38295, "loss": 1.3943, "grad_norm": "2.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.473e-01", "anc_acc": "5.212e-01", "epoch": 0.07659} {"step": 38300, "loss": 0.8902, "grad_norm": "3.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.239e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.754e-01", "epoch": 0.0766} {"step": 38305, "loss": 1.1081, "grad_norm": "4.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.591e+00", "anc_loss": "1.742e+00", "dlm_acc": "5.075e-01", "anc_acc": "4.775e-01", "epoch": 0.07661} {"step": 38310, "loss": 1.0231, "grad_norm": "4.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.525e+00", "anc_loss": "1.674e+00", "dlm_acc": "5.349e-01", "anc_acc": "5.025e-01", "epoch": 0.07662} {"step": 38315, "loss": 1.1669, "grad_norm": "4.472e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.339e+00", "anc_loss": "1.456e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.344e-01", "epoch": 0.07663} {"step": 38320, "loss": 1.5564, "grad_norm": "3.160e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.721e+00", "anc_loss": "1.822e+00", "dlm_acc": "4.439e-01", "anc_acc": "4.220e-01", "epoch": 0.07664} {"step": 38325, "loss": 1.7384, "grad_norm": "2.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.542e+00", "dlm_acc": "5.153e-01", "anc_acc": "4.856e-01", "epoch": 0.07665} {"step": 38330, "loss": 1.4588, "grad_norm": "2.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.639e+00", "dlm_acc": "5.306e-01", "anc_acc": "5.000e-01", "epoch": 0.07666} {"step": 38335, "loss": 1.1157, "grad_norm": "3.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.845e-01", "anc_acc": "5.555e-01", "epoch": 0.07667} {"step": 38340, "loss": 1.4936, "grad_norm": "6.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.453e+00", "dlm_acc": "5.474e-01", "anc_acc": "5.206e-01", "epoch": 0.07668} {"step": 38345, "loss": 1.4256, "grad_norm": "3.728e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.484e+00", "anc_loss": "1.603e+00", "dlm_acc": "5.211e-01", "anc_acc": "4.944e-01", "epoch": 0.07669} {"step": 38350, "loss": 1.4736, "grad_norm": "2.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.433e+00", "anc_loss": "1.549e+00", "dlm_acc": "5.487e-01", "anc_acc": "5.212e-01", "epoch": 0.0767} {"step": 38355, "loss": 1.4817, "grad_norm": "2.733e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.225e+00", "anc_loss": "2.275e+00", "dlm_acc": "2.306e-01", "anc_acc": "2.204e-01", "epoch": 0.07671} {"step": 38360, "loss": 1.109, "grad_norm": "1.358e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.918e-01", "anc_loss": "9.828e-01", "dlm_acc": "6.335e-01", "anc_acc": "6.044e-01", "epoch": 0.07672} {"step": 38365, "loss": 1.3408, "grad_norm": "2.846e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.548e+00", "anc_loss": "1.663e+00", "dlm_acc": "4.696e-01", "anc_acc": "4.442e-01", "epoch": 0.07673} {"step": 38370, "loss": 1.4668, "grad_norm": "3.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.638e+00", "anc_loss": "1.776e+00", "dlm_acc": "5.022e-01", "anc_acc": "4.742e-01", "epoch": 0.07674} {"step": 38375, "loss": 1.0257, "grad_norm": "3.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.180e-01", "anc_loss": "8.316e-01", "dlm_acc": "7.255e-01", "anc_acc": "6.923e-01", "epoch": 0.07675} {"step": 38380, "loss": 1.1265, "grad_norm": "5.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.173e+00", "dlm_acc": "6.191e-01", "anc_acc": "5.874e-01", "epoch": 0.07676} {"step": 38385, "loss": 1.3383, "grad_norm": "2.969e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.609e+00", "anc_loss": "1.739e+00", "dlm_acc": "5.026e-01", "anc_acc": "4.737e-01", "epoch": 0.07677} {"step": 38390, "loss": 0.9896, "grad_norm": "3.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.016e-01", "anc_loss": "6.613e-01", "dlm_acc": "7.959e-01", "anc_acc": "7.569e-01", "epoch": 0.07678} {"step": 38395, "loss": 1.0009, "grad_norm": "2.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.198e-01", "anc_loss": "6.416e-01", "dlm_acc": "7.852e-01", "anc_acc": "7.452e-01", "epoch": 0.07679} {"step": 38400, "loss": 1.4846, "grad_norm": "2.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.874e-01", "anc_acc": "5.571e-01", "epoch": 0.0768} {"step": 38405, "loss": 1.361, "grad_norm": "3.259e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.202e+00", "dlm_acc": "6.470e-01", "anc_acc": "6.107e-01", "epoch": 0.07681} {"step": 38410, "loss": 1.3783, "grad_norm": "3.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.242e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.707e-01", "anc_acc": "5.414e-01", "epoch": 0.07682} {"step": 38415, "loss": 1.0875, "grad_norm": "3.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.000e+00", "anc_loss": "1.106e+00", "dlm_acc": "6.245e-01", "anc_acc": "5.964e-01", "epoch": 0.07683} {"step": 38420, "loss": 1.5, "grad_norm": "5.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.332e+00", "anc_loss": "1.468e+00", "dlm_acc": "5.840e-01", "anc_acc": "5.542e-01", "epoch": 0.07684} {"step": 38425, "loss": 1.3534, "grad_norm": "9.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.325e+00", "anc_loss": "1.444e+00", "dlm_acc": "5.986e-01", "anc_acc": "5.703e-01", "epoch": 0.07685} {"step": 38430, "loss": 1.1432, "grad_norm": "3.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.197e+00", "dlm_acc": "5.930e-01", "anc_acc": "5.640e-01", "epoch": 0.07686} {"step": 38435, "loss": 1.408, "grad_norm": "2.263e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.141e+00", "dlm_acc": "6.649e-01", "anc_acc": "6.293e-01", "epoch": 0.07687} {"step": 38440, "loss": 1.2535, "grad_norm": "5.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.369e+00", "anc_loss": "1.508e+00", "dlm_acc": "5.651e-01", "anc_acc": "5.343e-01", "epoch": 0.07688} {"step": 38445, "loss": 1.0602, "grad_norm": "3.377e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.895e-01", "anc_acc": "5.577e-01", "epoch": 0.07689} {"step": 38450, "loss": 1.1732, "grad_norm": "2.529e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.300e+00", "dlm_acc": "5.780e-01", "anc_acc": "5.468e-01", "epoch": 0.0769} {"step": 38455, "loss": 1.2936, "grad_norm": "9.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.157e+00", "dlm_acc": "6.177e-01", "anc_acc": "5.886e-01", "epoch": 0.07691} {"step": 38460, "loss": 1.0422, "grad_norm": "7.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.758e-01", "anc_loss": "6.672e-01", "dlm_acc": "7.521e-01", "anc_acc": "7.236e-01", "epoch": 0.07692} {"step": 38465, "loss": 1.2053, "grad_norm": "5.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.548e-01", "anc_acc": "5.242e-01", "epoch": 0.07693} {"step": 38470, "loss": 1.0213, "grad_norm": "5.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.220e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.781e-01", "anc_acc": "5.496e-01", "epoch": 0.07694} {"step": 38475, "loss": 1.203, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.560e-01", "anc_acc": "5.238e-01", "epoch": 0.07695} {"step": 38480, "loss": 1.2608, "grad_norm": "2.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.128e+00", "anc_loss": "1.244e+00", "dlm_acc": "5.976e-01", "anc_acc": "5.665e-01", "epoch": 0.07696} {"step": 38485, "loss": 1.4555, "grad_norm": "3.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.306e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.877e-01", "anc_acc": "5.565e-01", "epoch": 0.07697} {"step": 38490, "loss": 1.2994, "grad_norm": "3.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.182e+00", "dlm_acc": "6.371e-01", "anc_acc": "6.066e-01", "epoch": 0.07698} {"step": 38495, "loss": 0.9766, "grad_norm": "3.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.074e-01", "anc_loss": "1.028e+00", "dlm_acc": "6.721e-01", "anc_acc": "6.361e-01", "epoch": 0.07699} {"step": 38500, "loss": 1.035, "grad_norm": "2.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.446e+00", "dlm_acc": "5.789e-01", "anc_acc": "5.506e-01", "epoch": 0.077} {"step": 38505, "loss": 1.0011, "grad_norm": "1.351e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.136e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.982e-01", "anc_acc": "5.702e-01", "epoch": 0.07701} {"step": 38510, "loss": 1.2353, "grad_norm": "2.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.485e+00", "dlm_acc": "5.577e-01", "anc_acc": "5.347e-01", "epoch": 0.07702} {"step": 38515, "loss": 1.6904, "grad_norm": "5.174e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.650e+00", "dlm_acc": "5.368e-01", "anc_acc": "5.108e-01", "epoch": 0.07703} {"step": 38520, "loss": 1.4495, "grad_norm": "3.553e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.178e-01", "epoch": 0.07704} {"step": 38525, "loss": 1.3335, "grad_norm": "3.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.362e-01", "anc_acc": "5.061e-01", "epoch": 0.07705} {"step": 38530, "loss": 1.2492, "grad_norm": "2.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.460e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.277e-01", "anc_acc": "5.025e-01", "epoch": 0.07706} {"step": 38535, "loss": 1.5059, "grad_norm": "4.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.521e+00", "anc_loss": "1.641e+00", "dlm_acc": "4.961e-01", "anc_acc": "4.710e-01", "epoch": 0.07707} {"step": 38540, "loss": 1.9076, "grad_norm": "2.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.690e+00", "anc_loss": "1.819e+00", "dlm_acc": "4.941e-01", "anc_acc": "4.678e-01", "epoch": 0.07708} {"step": 38545, "loss": 1.1109, "grad_norm": "2.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.146e+00", "dlm_acc": "6.121e-01", "anc_acc": "5.838e-01", "epoch": 0.07709} {"step": 38550, "loss": 1.3801, "grad_norm": "8.773e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.454e+00", "anc_loss": "1.579e+00", "dlm_acc": "5.354e-01", "anc_acc": "5.070e-01", "epoch": 0.0771} {"step": 38555, "loss": 1.0694, "grad_norm": "4.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.209e+00", "dlm_acc": "5.478e-01", "anc_acc": "5.208e-01", "epoch": 0.07711} {"step": 38560, "loss": 1.6043, "grad_norm": "5.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.590e+00", "anc_loss": "1.672e+00", "dlm_acc": "4.775e-01", "anc_acc": "4.568e-01", "epoch": 0.07712} {"step": 38565, "loss": 0.9649, "grad_norm": "4.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.445e-01", "anc_loss": "4.582e-01", "dlm_acc": "6.775e-01", "anc_acc": "6.733e-01", "epoch": 0.07713} {"step": 38570, "loss": 1.0383, "grad_norm": "3.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.074e-01", "anc_loss": "5.398e-01", "dlm_acc": "6.802e-01", "anc_acc": "6.728e-01", "epoch": 0.07714} {"step": 38575, "loss": 1.522, "grad_norm": "5.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.402e-01", "anc_loss": "1.036e+00", "dlm_acc": "6.677e-01", "anc_acc": "6.422e-01", "epoch": 0.07715} {"step": 38580, "loss": 1.1739, "grad_norm": "3.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.202e+00", "dlm_acc": "6.106e-01", "anc_acc": "5.820e-01", "epoch": 0.07716} {"step": 38585, "loss": 1.4143, "grad_norm": "4.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.631e-01", "anc_acc": "5.322e-01", "epoch": 0.07717} {"step": 38590, "loss": 1.602, "grad_norm": "3.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.586e+00", "anc_loss": "1.684e+00", "dlm_acc": "4.968e-01", "anc_acc": "4.757e-01", "epoch": 0.07718} {"step": 38595, "loss": 1.2406, "grad_norm": "2.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.671e+00", "dlm_acc": "5.170e-01", "anc_acc": "4.750e-01", "epoch": 0.07719} {"step": 38600, "loss": 1.3466, "grad_norm": "3.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.228e+00", "dlm_acc": "6.282e-01", "anc_acc": "6.004e-01", "epoch": 0.0772} {"step": 38605, "loss": 1.2043, "grad_norm": "1.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.303e+00", "dlm_acc": "5.779e-01", "anc_acc": "5.446e-01", "epoch": 0.07721} {"step": 38610, "loss": 1.4872, "grad_norm": "8.141e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.515e+00", "dlm_acc": "5.859e-01", "anc_acc": "5.599e-01", "epoch": 0.07722} {"step": 38615, "loss": 0.8291, "grad_norm": "1.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.728e-02", "anc_loss": "7.535e-02", "dlm_acc": "9.389e-01", "anc_acc": "9.321e-01", "epoch": 0.07723} {"step": 38620, "loss": 0.8849, "grad_norm": "4.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.805e-02", "anc_loss": "5.232e-02", "dlm_acc": "9.671e-01", "anc_acc": "9.578e-01", "epoch": 0.07724} {"step": 38625, "loss": 1.0198, "grad_norm": "2.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.770e-01", "anc_loss": "5.148e-01", "dlm_acc": "8.618e-01", "anc_acc": "8.232e-01", "epoch": 0.07725} {"step": 38630, "loss": 0.9819, "grad_norm": "2.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.226e+00", "dlm_acc": "6.028e-01", "anc_acc": "5.767e-01", "epoch": 0.07726} {"step": 38635, "loss": 1.1278, "grad_norm": "1.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.229e+00", "anc_loss": "1.326e+00", "dlm_acc": "5.683e-01", "anc_acc": "5.377e-01", "epoch": 0.07727} {"step": 38640, "loss": 1.5034, "grad_norm": "5.837e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.778e-01", "anc_acc": "5.522e-01", "epoch": 0.07728} {"step": 38645, "loss": 1.3642, "grad_norm": "3.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.548e+00", "dlm_acc": "5.438e-01", "anc_acc": "5.158e-01", "epoch": 0.07729} {"step": 38650, "loss": 1.2178, "grad_norm": "2.348e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.285e+00", "dlm_acc": "3.334e-01", "anc_acc": "3.222e-01", "epoch": 0.0773} {"step": 38655, "loss": 1.3194, "grad_norm": "2.820e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.199e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.822e-01", "anc_acc": "5.538e-01", "epoch": 0.07731} {"step": 38660, "loss": 1.302, "grad_norm": "9.672e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.486e+00", "anc_loss": "1.627e+00", "dlm_acc": "5.405e-01", "anc_acc": "5.069e-01", "epoch": 0.07732} {"step": 38665, "loss": 0.9108, "grad_norm": "3.338e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.443e+00", "dlm_acc": "5.410e-01", "anc_acc": "5.119e-01", "epoch": 0.07733} {"step": 38670, "loss": 1.1548, "grad_norm": "3.506e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.448e+00", "anc_loss": "1.553e+00", "dlm_acc": "4.943e-01", "anc_acc": "4.681e-01", "epoch": 0.07734} {"step": 38675, "loss": 1.3929, "grad_norm": "4.179e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.595e+00", "anc_loss": "1.663e+00", "dlm_acc": "4.015e-01", "anc_acc": "3.978e-01", "epoch": 0.07735} {"step": 38680, "loss": 0.9263, "grad_norm": "1.231e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.147e+00", "anc_loss": "1.235e+00", "dlm_acc": "5.632e-01", "anc_acc": "5.404e-01", "epoch": 0.07736} {"step": 38685, "loss": 0.9353, "grad_norm": "3.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.469e+00", "anc_loss": "1.561e+00", "dlm_acc": "4.392e-01", "anc_acc": "4.170e-01", "epoch": 0.07737} {"step": 38690, "loss": 1.1866, "grad_norm": "6.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.301e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.105e-01", "anc_acc": "4.888e-01", "epoch": 0.07738} {"step": 38695, "loss": 1.4695, "grad_norm": "5.234e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.999e-01", "anc_acc": "5.760e-01", "epoch": 0.07739} {"step": 38700, "loss": 1.2384, "grad_norm": "2.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.257e+00", "dlm_acc": "6.081e-01", "anc_acc": "5.750e-01", "epoch": 0.0774} {"step": 38705, "loss": 1.0778, "grad_norm": "2.469e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.308e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.432e-01", "epoch": 0.07741} {"step": 38710, "loss": 1.166, "grad_norm": "4.038e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.456e+00", "anc_loss": "1.566e+00", "dlm_acc": "5.751e-01", "anc_acc": "5.479e-01", "epoch": 0.07742} {"step": 38715, "loss": 1.1359, "grad_norm": "4.898e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.789e-01", "anc_loss": "1.093e+00", "dlm_acc": "6.456e-01", "anc_acc": "6.104e-01", "epoch": 0.07743} {"step": 38720, "loss": 1.2953, "grad_norm": "4.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.551e+00", "dlm_acc": "5.618e-01", "anc_acc": "5.274e-01", "epoch": 0.07744} {"step": 38725, "loss": 1.4238, "grad_norm": "4.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.514e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.367e-01", "epoch": 0.07745} {"step": 38730, "loss": 1.1633, "grad_norm": "2.517e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.313e+00", "dlm_acc": "5.739e-01", "anc_acc": "5.454e-01", "epoch": 0.07746} {"step": 38735, "loss": 0.8956, "grad_norm": "4.719e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.360e-01", "anc_loss": "3.641e-01", "dlm_acc": "9.030e-01", "anc_acc": "8.968e-01", "epoch": 0.07747} {"step": 38740, "loss": 1.0504, "grad_norm": "3.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.165e+00", "anc_loss": "1.274e+00", "dlm_acc": "6.085e-01", "anc_acc": "5.788e-01", "epoch": 0.07748} {"step": 38745, "loss": 1.2453, "grad_norm": "4.088e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.597e+00", "dlm_acc": "5.376e-01", "anc_acc": "5.118e-01", "epoch": 0.07749} {"step": 38750, "loss": 1.037, "grad_norm": "3.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.167e+00", "dlm_acc": "6.038e-01", "anc_acc": "5.705e-01", "epoch": 0.0775} {"step": 38755, "loss": 1.1304, "grad_norm": "4.511e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.878e-01", "anc_acc": "5.567e-01", "epoch": 0.07751} {"step": 38760, "loss": 1.408, "grad_norm": "4.687e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.304e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.895e-01", "anc_acc": "5.555e-01", "epoch": 0.07752} {"step": 38765, "loss": 1.4944, "grad_norm": "3.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.584e+00", "anc_loss": "1.702e+00", "dlm_acc": "4.811e-01", "anc_acc": "4.554e-01", "epoch": 0.07753} {"step": 38770, "loss": 1.5696, "grad_norm": "1.358e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.697e+00", "dlm_acc": "5.137e-01", "anc_acc": "4.896e-01", "epoch": 0.07754} {"step": 38775, "loss": 1.5125, "grad_norm": "3.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.455e+00", "anc_loss": "2.502e+00", "dlm_acc": "2.011e-01", "anc_acc": "1.903e-01", "epoch": 0.07755} {"step": 38780, "loss": 1.0402, "grad_norm": "4.338e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.711e-01", "anc_loss": "1.079e+00", "dlm_acc": "6.600e-01", "anc_acc": "6.356e-01", "epoch": 0.07756} {"step": 38785, "loss": 1.3304, "grad_norm": "3.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.627e+00", "anc_loss": "1.759e+00", "dlm_acc": "5.176e-01", "anc_acc": "4.888e-01", "epoch": 0.07757} {"step": 38790, "loss": 0.8191, "grad_norm": "4.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.294e+00", "anc_loss": "1.403e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.305e-01", "epoch": 0.07758} {"step": 38795, "loss": 1.05, "grad_norm": "6.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.532e+00", "dlm_acc": "4.775e-01", "anc_acc": "4.555e-01", "epoch": 0.07759} {"step": 38800, "loss": 1.1836, "grad_norm": "2.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.398e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.102e-01", "anc_acc": "4.843e-01", "epoch": 0.0776} {"step": 38805, "loss": 0.8013, "grad_norm": "5.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.846e-01", "anc_loss": "5.159e-01", "dlm_acc": "7.569e-01", "anc_acc": "7.459e-01", "epoch": 0.07761} {"step": 38810, "loss": 0.859, "grad_norm": "3.400e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.218e+00", "dlm_acc": "6.156e-01", "anc_acc": "5.864e-01", "epoch": 0.07762} {"step": 38815, "loss": 1.2906, "grad_norm": "2.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.595e+00", "dlm_acc": "5.221e-01", "anc_acc": "4.918e-01", "epoch": 0.07763} {"step": 38820, "loss": 1.1478, "grad_norm": "2.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.294e-01", "anc_acc": "4.972e-01", "epoch": 0.07764} {"step": 38825, "loss": 1.2399, "grad_norm": "2.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.276e+00", "anc_loss": "1.391e+00", "dlm_acc": "6.207e-01", "anc_acc": "5.946e-01", "epoch": 0.07765} {"step": 38830, "loss": 1.2271, "grad_norm": "2.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.316e-01", "anc_acc": "5.010e-01", "epoch": 0.07766} {"step": 38835, "loss": 1.2614, "grad_norm": "1.207e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.239e+00", "dlm_acc": "4.186e-01", "anc_acc": "4.250e-01", "epoch": 0.07767} {"step": 38840, "loss": 1.2666, "grad_norm": "5.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.237e+00", "dlm_acc": "3.428e-01", "anc_acc": "3.429e-01", "epoch": 0.07768} {"step": 38845, "loss": 1.6388, "grad_norm": "3.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.337e+00", "dlm_acc": "3.323e-01", "anc_acc": "3.308e-01", "epoch": 0.07769} {"step": 38850, "loss": 1.1878, "grad_norm": "4.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.111e+00", "dlm_acc": "5.413e-01", "anc_acc": "5.207e-01", "epoch": 0.0777} {"step": 38855, "loss": 1.5506, "grad_norm": "2.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.628e+00", "anc_loss": "1.769e+00", "dlm_acc": "4.658e-01", "anc_acc": "4.358e-01", "epoch": 0.07771} {"step": 38860, "loss": 1.7345, "grad_norm": "4.321e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.447e+00", "anc_loss": "1.589e+00", "dlm_acc": "5.361e-01", "anc_acc": "5.052e-01", "epoch": 0.07772} {"step": 38865, "loss": 1.3185, "grad_norm": "2.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.089e+00", "anc_loss": "1.195e+00", "dlm_acc": "6.040e-01", "anc_acc": "5.752e-01", "epoch": 0.07773} {"step": 38870, "loss": 0.9777, "grad_norm": "4.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.267e+00", "dlm_acc": "5.364e-01", "anc_acc": "5.135e-01", "epoch": 0.07774} {"step": 38875, "loss": 1.4514, "grad_norm": "3.351e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.505e+00", "dlm_acc": "5.291e-01", "anc_acc": "5.012e-01", "epoch": 0.07775} {"step": 38880, "loss": 1.3717, "grad_norm": "4.762e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.382e+00", "anc_loss": "1.502e+00", "dlm_acc": "5.555e-01", "anc_acc": "5.292e-01", "epoch": 0.07776} {"step": 38885, "loss": 0.9567, "grad_norm": "1.294e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.019e+00", "anc_loss": "1.101e+00", "dlm_acc": "6.356e-01", "anc_acc": "6.159e-01", "epoch": 0.07777} {"step": 38890, "loss": 1.2013, "grad_norm": "2.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.752e-01", "anc_acc": "5.460e-01", "epoch": 0.07778} {"step": 38895, "loss": 1.4195, "grad_norm": "5.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.688e+00", "anc_loss": "1.802e+00", "dlm_acc": "5.052e-01", "anc_acc": "4.790e-01", "epoch": 0.07779} {"step": 38900, "loss": 1.1774, "grad_norm": "3.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.486e+00", "dlm_acc": "5.443e-01", "anc_acc": "5.137e-01", "epoch": 0.0778} {"step": 38905, "loss": 1.363, "grad_norm": "4.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.566e-01", "anc_acc": "5.242e-01", "epoch": 0.07781} {"step": 38910, "loss": 1.0789, "grad_norm": "2.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.166e+00", "dlm_acc": "6.072e-01", "anc_acc": "5.792e-01", "epoch": 0.07782} {"step": 38915, "loss": 1.2787, "grad_norm": "2.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.567e+00", "anc_loss": "1.705e+00", "dlm_acc": "5.350e-01", "anc_acc": "5.049e-01", "epoch": 0.07783} {"step": 38920, "loss": 1.0753, "grad_norm": "3.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.625e-01", "anc_acc": "5.356e-01", "epoch": 0.07784} {"step": 38925, "loss": 1.668, "grad_norm": "4.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.663e+00", "anc_loss": "1.798e+00", "dlm_acc": "5.122e-01", "anc_acc": "4.843e-01", "epoch": 0.07785} {"step": 38930, "loss": 1.3837, "grad_norm": "4.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.482e+00", "anc_loss": "1.596e+00", "dlm_acc": "5.259e-01", "anc_acc": "5.015e-01", "epoch": 0.07786} {"step": 38935, "loss": 1.1424, "grad_norm": "2.714e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.079e+00", "anc_loss": "1.196e+00", "dlm_acc": "5.835e-01", "anc_acc": "5.549e-01", "epoch": 0.07787} {"step": 38940, "loss": 1.0907, "grad_norm": "2.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.581e+00", "anc_loss": "1.745e+00", "dlm_acc": "5.092e-01", "anc_acc": "4.789e-01", "epoch": 0.07788} {"step": 38945, "loss": 1.7155, "grad_norm": "9.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.563e+00", "anc_loss": "1.680e+00", "dlm_acc": "4.671e-01", "anc_acc": "4.465e-01", "epoch": 0.07789} {"step": 38950, "loss": 1.1616, "grad_norm": "3.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.072e+00", "anc_loss": "1.195e+00", "dlm_acc": "5.849e-01", "anc_acc": "5.416e-01", "epoch": 0.0779} {"step": 38955, "loss": 1.2646, "grad_norm": "3.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.766e-01", "anc_loss": "8.844e-01", "dlm_acc": "6.944e-01", "anc_acc": "6.674e-01", "epoch": 0.07791} {"step": 38960, "loss": 1.1757, "grad_norm": "2.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.928e-01", "anc_loss": "1.095e+00", "dlm_acc": "5.999e-01", "anc_acc": "5.633e-01", "epoch": 0.07792} {"step": 38965, "loss": 1.1964, "grad_norm": "2.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.037e+00", "anc_loss": "1.163e+00", "dlm_acc": "6.087e-01", "anc_acc": "5.732e-01", "epoch": 0.07793} {"step": 38970, "loss": 1.527, "grad_norm": "4.050e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.395e+00", "anc_loss": "1.543e+00", "dlm_acc": "5.533e-01", "anc_acc": "5.210e-01", "epoch": 0.07794} {"step": 38975, "loss": 1.3008, "grad_norm": "4.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.165e+00", "anc_loss": "1.410e+00", "dlm_acc": "6.134e-01", "anc_acc": "5.531e-01", "epoch": 0.07795} {"step": 38980, "loss": 1.3808, "grad_norm": "4.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.645e-01", "anc_acc": "5.371e-01", "epoch": 0.07796} {"step": 38985, "loss": 1.3804, "grad_norm": "3.156e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.622e+00", "anc_loss": "1.750e+00", "dlm_acc": "4.731e-01", "anc_acc": "4.454e-01", "epoch": 0.07797} {"step": 38990, "loss": 1.3598, "grad_norm": "3.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.276e+00", "dlm_acc": "5.897e-01", "anc_acc": "5.541e-01", "epoch": 0.07798} {"step": 38995, "loss": 1.4941, "grad_norm": "3.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.216e+00", "dlm_acc": "5.767e-01", "anc_acc": "5.594e-01", "epoch": 0.07799} {"step": 39000, "loss": 1.4352, "grad_norm": "4.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.514e-01", "anc_acc": "5.196e-01", "epoch": 0.078} {"step": 39005, "loss": 1.5517, "grad_norm": "3.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.133e+00", "dlm_acc": "6.794e-01", "anc_acc": "6.503e-01", "epoch": 0.07801} {"step": 39010, "loss": 1.3245, "grad_norm": "1.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.875e-01", "anc_loss": "9.180e-01", "dlm_acc": "6.575e-01", "anc_acc": "6.128e-01", "epoch": 0.07802} {"step": 39015, "loss": 1.4392, "grad_norm": "1.773e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.135e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.408e-01", "epoch": 0.07803} {"step": 39020, "loss": 1.4286, "grad_norm": "2.757e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.462e+00", "dlm_acc": "4.533e-01", "anc_acc": "4.180e-01", "epoch": 0.07804} {"step": 39025, "loss": 1.7474, "grad_norm": "3.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.369e+00", "dlm_acc": "6.096e-01", "anc_acc": "5.589e-01", "epoch": 0.07805} {"step": 39030, "loss": 1.2513, "grad_norm": "2.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.032e+00", "anc_loss": "2.122e+00", "dlm_acc": "3.137e-01", "anc_acc": "2.936e-01", "epoch": 0.07806} {"step": 39035, "loss": 1.0508, "grad_norm": "2.572e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.060e+00", "anc_loss": "1.204e+00", "dlm_acc": "5.786e-01", "anc_acc": "5.321e-01", "epoch": 0.07807} {"step": 39040, "loss": 1.0608, "grad_norm": "2.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.117e-01", "anc_loss": "1.002e+00", "dlm_acc": "5.920e-01", "anc_acc": "5.645e-01", "epoch": 0.07808} {"step": 39045, "loss": 1.2771, "grad_norm": "3.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.215e+00", "dlm_acc": "5.841e-01", "anc_acc": "5.610e-01", "epoch": 0.07809} {"step": 39050, "loss": 1.4405, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.565e-01", "anc_acc": "5.188e-01", "epoch": 0.0781} {"step": 39055, "loss": 1.2126, "grad_norm": "3.174e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.402e+00", "dlm_acc": "4.841e-01", "anc_acc": "4.503e-01", "epoch": 0.07811} {"step": 39060, "loss": 1.1871, "grad_norm": "2.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.043e-01", "anc_loss": "9.859e-01", "dlm_acc": "6.497e-01", "anc_acc": "6.235e-01", "epoch": 0.07812} {"step": 39065, "loss": 1.2012, "grad_norm": "6.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.957e-01", "anc_loss": "1.104e+00", "dlm_acc": "6.271e-01", "anc_acc": "5.948e-01", "epoch": 0.07813} {"step": 39070, "loss": 1.2663, "grad_norm": "3.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.219e-01", "anc_loss": "1.073e+00", "dlm_acc": "6.656e-01", "anc_acc": "6.205e-01", "epoch": 0.07814} {"step": 39075, "loss": 1.2521, "grad_norm": "2.538e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.218e+00", "anc_loss": "1.356e+00", "dlm_acc": "5.780e-01", "anc_acc": "5.379e-01", "epoch": 0.07815} {"step": 39080, "loss": 1.1656, "grad_norm": "2.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.977e-01", "anc_loss": "1.190e+00", "dlm_acc": "6.177e-01", "anc_acc": "5.561e-01", "epoch": 0.07816} {"step": 39085, "loss": 1.0816, "grad_norm": "7.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.797e-01", "anc_loss": "1.915e-01", "dlm_acc": "9.227e-01", "anc_acc": "9.183e-01", "epoch": 0.07817} {"step": 39090, "loss": 0.7837, "grad_norm": "6.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.400e-01", "anc_loss": "5.320e-01", "dlm_acc": "7.701e-01", "anc_acc": "7.285e-01", "epoch": 0.07818} {"step": 39095, "loss": 0.5772, "grad_norm": "2.823e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.260e-01", "anc_loss": "4.045e-01", "dlm_acc": "8.447e-01", "anc_acc": "8.078e-01", "epoch": 0.07819} {"step": 39100, "loss": 0.96, "grad_norm": "1.980e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.136e+00", "dlm_acc": "5.985e-01", "anc_acc": "5.629e-01", "epoch": 0.0782} {"step": 39105, "loss": 1.4427, "grad_norm": "3.605e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.451e+00", "dlm_acc": "5.544e-01", "anc_acc": "5.253e-01", "epoch": 0.07821} {"step": 39110, "loss": 1.0372, "grad_norm": "1.707e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.218e+00", "dlm_acc": "6.042e-01", "anc_acc": "5.720e-01", "epoch": 0.07822} {"step": 39115, "loss": 1.07, "grad_norm": "3.294e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.549e-01", "anc_acc": "5.319e-01", "epoch": 0.07823} {"step": 39120, "loss": 1.216, "grad_norm": "4.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.589e+00", "anc_loss": "1.697e+00", "dlm_acc": "4.742e-01", "anc_acc": "4.486e-01", "epoch": 0.07824} {"step": 39125, "loss": 1.0926, "grad_norm": "3.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.089e+00", "anc_loss": "1.192e+00", "dlm_acc": "6.087e-01", "anc_acc": "5.873e-01", "epoch": 0.07825} {"step": 39130, "loss": 1.0452, "grad_norm": "2.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.429e+00", "dlm_acc": "5.636e-01", "anc_acc": "5.353e-01", "epoch": 0.07826} {"step": 39135, "loss": 1.1865, "grad_norm": "3.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.353e+00", "anc_loss": "1.461e+00", "dlm_acc": "5.221e-01", "anc_acc": "4.954e-01", "epoch": 0.07827} {"step": 39140, "loss": 1.1165, "grad_norm": "2.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.206e+00", "anc_loss": "1.322e+00", "dlm_acc": "5.742e-01", "anc_acc": "5.442e-01", "epoch": 0.07828} {"step": 39145, "loss": 1.5835, "grad_norm": "3.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.621e+00", "anc_loss": "1.764e+00", "dlm_acc": "5.118e-01", "anc_acc": "4.811e-01", "epoch": 0.07829} {"step": 39150, "loss": 1.4078, "grad_norm": "5.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.442e+00", "anc_loss": "1.573e+00", "dlm_acc": "5.567e-01", "anc_acc": "5.261e-01", "epoch": 0.0783} {"step": 39155, "loss": 1.1445, "grad_norm": "8.806e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.201e-01", "anc_loss": "1.012e+00", "dlm_acc": "6.455e-01", "anc_acc": "6.219e-01", "epoch": 0.07831} {"step": 39160, "loss": 1.2144, "grad_norm": "4.749e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.226e-01", "anc_loss": "9.018e-01", "dlm_acc": "6.783e-01", "anc_acc": "6.537e-01", "epoch": 0.07832} {"step": 39165, "loss": 1.4788, "grad_norm": "2.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.475e+00", "dlm_acc": "5.470e-01", "anc_acc": "5.191e-01", "epoch": 0.07833} {"step": 39170, "loss": 1.4377, "grad_norm": "2.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.076e+00", "anc_loss": "1.154e+00", "dlm_acc": "6.447e-01", "anc_acc": "6.284e-01", "epoch": 0.07834} {"step": 39175, "loss": 1.1749, "grad_norm": "3.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.098e-01", "anc_loss": "7.469e-01", "dlm_acc": "6.020e-01", "anc_acc": "5.895e-01", "epoch": 0.07835} {"step": 39180, "loss": 1.3984, "grad_norm": "2.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.408e+00", "anc_loss": "1.534e+00", "dlm_acc": "5.338e-01", "anc_acc": "5.059e-01", "epoch": 0.07836} {"step": 39185, "loss": 1.5192, "grad_norm": "6.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.293e-01", "anc_loss": "1.006e+00", "dlm_acc": "5.271e-01", "anc_acc": "4.987e-01", "epoch": 0.07837} {"step": 39190, "loss": 1.0335, "grad_norm": "3.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.633e-01", "anc_loss": "8.609e-01", "dlm_acc": "6.639e-01", "anc_acc": "6.348e-01", "epoch": 0.07838} {"step": 39195, "loss": 1.1974, "grad_norm": "4.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.391e-01", "anc_loss": "5.871e-01", "dlm_acc": "6.963e-01", "anc_acc": "6.773e-01", "epoch": 0.07839} {"step": 39200, "loss": 1.0096, "grad_norm": "2.252e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.098e-01", "anc_loss": "9.053e-01", "dlm_acc": "6.675e-01", "anc_acc": "6.392e-01", "epoch": 0.0784} {"step": 39205, "loss": 1.3859, "grad_norm": "7.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.289e+00", "dlm_acc": "6.368e-01", "anc_acc": "6.085e-01", "epoch": 0.07841} {"step": 39210, "loss": 1.4083, "grad_norm": "4.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.124e+00", "dlm_acc": "6.413e-01", "anc_acc": "6.132e-01", "epoch": 0.07842} {"step": 39215, "loss": 1.2877, "grad_norm": "2.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.141e-01", "anc_loss": "7.227e-01", "dlm_acc": "6.984e-01", "anc_acc": "6.532e-01", "epoch": 0.07843} {"step": 39220, "loss": 1.2243, "grad_norm": "2.272e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.977e-01", "anc_loss": "1.057e+00", "dlm_acc": "5.096e-01", "anc_acc": "4.907e-01", "epoch": 0.07844} {"step": 39225, "loss": 1.2009, "grad_norm": "4.149e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.050e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.492e-01", "anc_acc": "6.212e-01", "epoch": 0.07845} {"step": 39230, "loss": 1.2297, "grad_norm": "6.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.135e+00", "dlm_acc": "4.917e-01", "anc_acc": "4.748e-01", "epoch": 0.07846} {"step": 39235, "loss": 1.4148, "grad_norm": "5.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.070e-01", "anc_loss": "7.625e-01", "dlm_acc": "5.844e-01", "anc_acc": "5.613e-01", "epoch": 0.07847} {"step": 39240, "loss": 1.095, "grad_norm": "3.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.914e-01", "anc_loss": "1.010e+00", "dlm_acc": "6.277e-01", "anc_acc": "5.898e-01", "epoch": 0.07848} {"step": 39245, "loss": 1.3069, "grad_norm": "2.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.672e-01", "anc_loss": "1.080e+00", "dlm_acc": "6.161e-01", "anc_acc": "5.882e-01", "epoch": 0.07849} {"step": 39250, "loss": 1.3837, "grad_norm": "4.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.428e-01", "anc_acc": "5.183e-01", "epoch": 0.0785} {"step": 39255, "loss": 1.3966, "grad_norm": "2.803e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.004e+00", "anc_loss": "1.087e+00", "dlm_acc": "5.915e-01", "anc_acc": "5.678e-01", "epoch": 0.07851} {"step": 39260, "loss": 1.337, "grad_norm": "3.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.695e-01", "anc_loss": "1.046e+00", "dlm_acc": "5.634e-01", "anc_acc": "5.391e-01", "epoch": 0.07852} {"step": 39265, "loss": 1.2831, "grad_norm": "2.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.867e-01", "anc_loss": "8.367e-01", "dlm_acc": "6.318e-01", "anc_acc": "6.153e-01", "epoch": 0.07853} {"step": 39270, "loss": 1.0522, "grad_norm": "5.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.973e-01", "anc_loss": "5.203e-01", "dlm_acc": "6.533e-01", "anc_acc": "6.446e-01", "epoch": 0.07854} {"step": 39275, "loss": 1.3742, "grad_norm": "3.228e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.926e-01", "anc_loss": "8.469e-01", "dlm_acc": "6.292e-01", "anc_acc": "6.131e-01", "epoch": 0.07855} {"step": 39280, "loss": 1.3172, "grad_norm": "2.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.706e-01", "anc_acc": "5.406e-01", "epoch": 0.07856} {"step": 39285, "loss": 0.9634, "grad_norm": "5.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.213e-01", "anc_loss": "7.979e-01", "dlm_acc": "6.762e-01", "anc_acc": "6.499e-01", "epoch": 0.07857} {"step": 39290, "loss": 1.0944, "grad_norm": "2.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.508e-01", "anc_loss": "1.036e+00", "dlm_acc": "5.724e-01", "anc_acc": "5.489e-01", "epoch": 0.07858} {"step": 39295, "loss": 1.1396, "grad_norm": "3.037e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.446e+00", "dlm_acc": "5.531e-01", "anc_acc": "5.273e-01", "epoch": 0.07859} {"step": 39300, "loss": 1.1312, "grad_norm": "3.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.338e+00", "dlm_acc": "5.149e-01", "anc_acc": "4.938e-01", "epoch": 0.0786} {"step": 39305, "loss": 0.9043, "grad_norm": "2.291e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.224e-01", "anc_loss": "6.916e-01", "dlm_acc": "7.402e-01", "anc_acc": "7.218e-01", "epoch": 0.07861} {"step": 39310, "loss": 1.1407, "grad_norm": "2.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.436e-01", "anc_loss": "8.156e-01", "dlm_acc": "6.362e-01", "anc_acc": "6.148e-01", "epoch": 0.07862} {"step": 39315, "loss": 1.1852, "grad_norm": "2.668e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.060e+00", "anc_loss": "1.106e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.497e-01", "epoch": 0.07863} {"step": 39320, "loss": 0.9926, "grad_norm": "3.300e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.796e-02", "anc_loss": "8.153e-02", "dlm_acc": "9.574e-01", "anc_acc": "9.488e-01", "epoch": 0.07864} {"step": 39325, "loss": 1.0757, "grad_norm": "2.352e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.761e-02", "anc_loss": "1.078e-01", "dlm_acc": "9.355e-01", "anc_acc": "9.296e-01", "epoch": 0.07865} {"step": 39330, "loss": 1.6616, "grad_norm": "2.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.368e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.081e-01", "anc_acc": "4.822e-01", "epoch": 0.07866} {"step": 39335, "loss": 1.3595, "grad_norm": "3.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.122e+00", "anc_loss": "1.200e+00", "dlm_acc": "5.811e-01", "anc_acc": "5.601e-01", "epoch": 0.07867} {"step": 39340, "loss": 1.5538, "grad_norm": "3.141e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.271e+00", "dlm_acc": "5.109e-01", "anc_acc": "4.893e-01", "epoch": 0.07868} {"step": 39345, "loss": 1.2202, "grad_norm": "3.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.949e-01", "anc_loss": "9.043e-01", "dlm_acc": "6.563e-01", "anc_acc": "6.201e-01", "epoch": 0.07869} {"step": 39350, "loss": 1.2608, "grad_norm": "3.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.923e-01", "anc_acc": "5.662e-01", "epoch": 0.0787} {"step": 39355, "loss": 1.4603, "grad_norm": "3.411e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.094e-01", "anc_loss": "1.048e+00", "dlm_acc": "7.486e-01", "anc_acc": "7.107e-01", "epoch": 0.07871} {"step": 39360, "loss": 1.4625, "grad_norm": "3.481e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.499e+00", "anc_loss": "1.623e+00", "dlm_acc": "5.286e-01", "anc_acc": "5.016e-01", "epoch": 0.07872} {"step": 39365, "loss": 1.0398, "grad_norm": "7.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.691e-01", "anc_acc": "5.401e-01", "epoch": 0.07873} {"step": 39370, "loss": 1.4634, "grad_norm": "3.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.745e+00", "anc_loss": "1.873e+00", "dlm_acc": "4.863e-01", "anc_acc": "4.569e-01", "epoch": 0.07874} {"step": 39375, "loss": 1.2784, "grad_norm": "1.930e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.428e+00", "anc_loss": "1.568e+00", "dlm_acc": "5.629e-01", "anc_acc": "5.339e-01", "epoch": 0.07875} {"step": 39380, "loss": 1.0899, "grad_norm": "3.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.939e-01", "anc_acc": "5.642e-01", "epoch": 0.07876} {"step": 39385, "loss": 1.2616, "grad_norm": "2.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.842e-01", "anc_acc": "5.569e-01", "epoch": 0.07877} {"step": 39390, "loss": 1.5301, "grad_norm": "5.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.537e+00", "anc_loss": "1.649e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.387e-01", "epoch": 0.07878} {"step": 39395, "loss": 1.0251, "grad_norm": "3.281e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.278e+00", "dlm_acc": "6.077e-01", "anc_acc": "5.791e-01", "epoch": 0.07879} {"step": 39400, "loss": 0.9571, "grad_norm": "2.880e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.295e+00", "dlm_acc": "6.218e-01", "anc_acc": "5.937e-01", "epoch": 0.0788} {"step": 39405, "loss": 0.8833, "grad_norm": "1.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.217e+00", "dlm_acc": "6.075e-01", "anc_acc": "5.741e-01", "epoch": 0.07881} {"step": 39410, "loss": 0.928, "grad_norm": "2.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.533e+00", "dlm_acc": "5.397e-01", "anc_acc": "5.078e-01", "epoch": 0.07882} {"step": 39415, "loss": 0.9234, "grad_norm": "3.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.199e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.745e-01", "anc_acc": "5.429e-01", "epoch": 0.07883} {"step": 39420, "loss": 0.8455, "grad_norm": "2.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.026e+00", "anc_loss": "1.133e+00", "dlm_acc": "6.285e-01", "anc_acc": "5.983e-01", "epoch": 0.07884} {"step": 39425, "loss": 1.214, "grad_norm": "4.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.410e+00", "dlm_acc": "5.975e-01", "anc_acc": "5.700e-01", "epoch": 0.07885} {"step": 39430, "loss": 1.2957, "grad_norm": "4.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.445e+00", "anc_loss": "1.568e+00", "dlm_acc": "5.637e-01", "anc_acc": "5.367e-01", "epoch": 0.07886} {"step": 39435, "loss": 0.8738, "grad_norm": "3.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.825e-01", "anc_acc": "5.540e-01", "epoch": 0.07887} {"step": 39440, "loss": 1.2249, "grad_norm": "4.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.146e+00", "anc_loss": "1.273e+00", "dlm_acc": "6.211e-01", "anc_acc": "5.902e-01", "epoch": 0.07888} {"step": 39445, "loss": 1.6242, "grad_norm": "3.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.636e+00", "anc_loss": "1.769e+00", "dlm_acc": "5.060e-01", "anc_acc": "4.783e-01", "epoch": 0.07889} {"step": 39450, "loss": 0.9451, "grad_norm": "3.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.051e+00", "anc_loss": "1.178e+00", "dlm_acc": "6.245e-01", "anc_acc": "5.931e-01", "epoch": 0.0789} {"step": 39455, "loss": 0.8911, "grad_norm": "3.456e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.188e-01", "anc_loss": "8.082e-01", "dlm_acc": "7.098e-01", "anc_acc": "6.868e-01", "epoch": 0.07891} {"step": 39460, "loss": 1.3571, "grad_norm": "4.208e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.251e+00", "anc_loss": "1.360e+00", "dlm_acc": "5.755e-01", "anc_acc": "5.487e-01", "epoch": 0.07892} {"step": 39465, "loss": 1.1829, "grad_norm": "2.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.331e-01", "anc_acc": "5.075e-01", "epoch": 0.07893} {"step": 39470, "loss": 1.3119, "grad_norm": "4.532e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.933e-01", "anc_acc": "5.683e-01", "epoch": 0.07894} {"step": 39475, "loss": 1.2101, "grad_norm": "7.405e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.304e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.643e-01", "anc_acc": "5.375e-01", "epoch": 0.07895} {"step": 39480, "loss": 1.2871, "grad_norm": "3.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.756e-01", "anc_acc": "5.425e-01", "epoch": 0.07896} {"step": 39485, "loss": 1.3705, "grad_norm": "9.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.214e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.757e-01", "anc_acc": "5.466e-01", "epoch": 0.07897} {"step": 39490, "loss": 1.3002, "grad_norm": "2.370e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.150e-01", "anc_loss": "9.430e-01", "dlm_acc": "6.924e-01", "anc_acc": "6.557e-01", "epoch": 0.07898} {"step": 39495, "loss": 0.8223, "grad_norm": "2.094e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.707e-01", "anc_loss": "8.657e-01", "dlm_acc": "6.925e-01", "anc_acc": "6.657e-01", "epoch": 0.07899} {"step": 39500, "loss": 1.0431, "grad_norm": "6.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.431e-01", "anc_loss": "1.035e+00", "dlm_acc": "6.795e-01", "anc_acc": "6.555e-01", "epoch": 0.079} {"step": 39505, "loss": 1.0722, "grad_norm": "4.432e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.281e-01", "anc_loss": "8.946e-01", "dlm_acc": "7.149e-01", "anc_acc": "6.948e-01", "epoch": 0.07901} {"step": 39510, "loss": 1.1952, "grad_norm": "1.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.973e-01", "anc_loss": "8.906e-01", "dlm_acc": "6.434e-01", "anc_acc": "6.105e-01", "epoch": 0.07902} {"step": 39515, "loss": 1.1299, "grad_norm": "3.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.217e+00", "dlm_acc": "6.028e-01", "anc_acc": "5.750e-01", "epoch": 0.07903} {"step": 39520, "loss": 0.8434, "grad_norm": "2.324e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.836e-01", "anc_loss": "7.633e-01", "dlm_acc": "6.873e-01", "anc_acc": "6.634e-01", "epoch": 0.07904} {"step": 39525, "loss": 0.9745, "grad_norm": "2.620e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.237e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.454e-01", "anc_acc": "5.231e-01", "epoch": 0.07905} {"step": 39530, "loss": 1.3094, "grad_norm": "2.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.268e+00", "dlm_acc": "5.999e-01", "anc_acc": "5.788e-01", "epoch": 0.07906} {"step": 39535, "loss": 0.9248, "grad_norm": "2.192e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.359e-01", "anc_loss": "8.035e-01", "dlm_acc": "6.801e-01", "anc_acc": "6.577e-01", "epoch": 0.07907} {"step": 39540, "loss": 0.8745, "grad_norm": "4.132e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.941e-01", "anc_loss": "9.048e-01", "dlm_acc": "7.308e-01", "anc_acc": "7.023e-01", "epoch": 0.07908} {"step": 39545, "loss": 0.6038, "grad_norm": "3.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.281e-01", "anc_loss": "6.102e-01", "dlm_acc": "6.408e-01", "anc_acc": "5.904e-01", "epoch": 0.07909} {"step": 39550, "loss": 0.6436, "grad_norm": "2.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.574e-01", "anc_loss": "9.957e-01", "dlm_acc": "5.287e-01", "anc_acc": "5.085e-01", "epoch": 0.0791} {"step": 39555, "loss": 0.7157, "grad_norm": "5.337e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.581e-01", "anc_loss": "9.348e-01", "dlm_acc": "6.453e-01", "anc_acc": "6.268e-01", "epoch": 0.07911} {"step": 39560, "loss": 0.6833, "grad_norm": "2.333e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.068e-01", "anc_loss": "3.486e-01", "dlm_acc": "8.027e-01", "anc_acc": "7.841e-01", "epoch": 0.07912} {"step": 39565, "loss": 0.6334, "grad_norm": "2.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.305e-01", "anc_loss": "9.000e-01", "dlm_acc": "6.322e-01", "anc_acc": "6.136e-01", "epoch": 0.07913} {"step": 39570, "loss": 1.1073, "grad_norm": "3.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.367e+00", "dlm_acc": "5.826e-01", "anc_acc": "5.559e-01", "epoch": 0.07914} {"step": 39575, "loss": 1.6046, "grad_norm": "3.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.376e+00", "dlm_acc": "6.374e-01", "anc_acc": "6.122e-01", "epoch": 0.07915} {"step": 39580, "loss": 0.9657, "grad_norm": "4.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.264e-01", "anc_loss": "1.018e+00", "dlm_acc": "6.999e-01", "anc_acc": "6.766e-01", "epoch": 0.07916} {"step": 39585, "loss": 1.0979, "grad_norm": "2.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.301e+00", "anc_loss": "1.458e+00", "dlm_acc": "5.655e-01", "anc_acc": "5.390e-01", "epoch": 0.07917} {"step": 39590, "loss": 1.044, "grad_norm": "2.481e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.062e-01", "anc_loss": "9.340e-01", "dlm_acc": "5.703e-01", "anc_acc": "5.640e-01", "epoch": 0.07918} {"step": 39595, "loss": 0.7532, "grad_norm": "7.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.188e-01", "anc_loss": "7.662e-01", "dlm_acc": "7.072e-01", "anc_acc": "6.940e-01", "epoch": 0.07919} {"step": 39600, "loss": 1.1428, "grad_norm": "2.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.078e+00", "dlm_acc": "5.636e-01", "anc_acc": "5.483e-01", "epoch": 0.0792} {"step": 39605, "loss": 0.9899, "grad_norm": "4.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.627e-01", "anc_loss": "8.656e-01", "dlm_acc": "7.271e-01", "anc_acc": "7.012e-01", "epoch": 0.07921} {"step": 39610, "loss": 0.9222, "grad_norm": "4.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.500e-01", "anc_loss": "7.242e-01", "dlm_acc": "7.433e-01", "anc_acc": "7.244e-01", "epoch": 0.07922} {"step": 39615, "loss": 0.8663, "grad_norm": "1.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.226e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.670e-01", "anc_acc": "5.382e-01", "epoch": 0.07923} {"step": 39620, "loss": 0.9824, "grad_norm": "2.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.008e-01", "anc_loss": "5.339e-01", "dlm_acc": "7.964e-01", "anc_acc": "7.838e-01", "epoch": 0.07924} {"step": 39625, "loss": 1.2545, "grad_norm": "4.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.500e-01", "anc_loss": "9.070e-01", "dlm_acc": "6.748e-01", "anc_acc": "6.619e-01", "epoch": 0.07925} {"step": 39630, "loss": 1.4156, "grad_norm": "4.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.301e+00", "dlm_acc": "5.802e-01", "anc_acc": "5.619e-01", "epoch": 0.07926} {"step": 39635, "loss": 1.2718, "grad_norm": "5.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.695e-01", "anc_loss": "7.727e-01", "dlm_acc": "5.663e-01", "anc_acc": "5.642e-01", "epoch": 0.07927} {"step": 39640, "loss": 1.201, "grad_norm": "3.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.320e-01", "anc_loss": "7.383e-01", "dlm_acc": "5.696e-01", "anc_acc": "5.678e-01", "epoch": 0.07928} {"step": 39645, "loss": 1.1629, "grad_norm": "4.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.500e-01", "anc_loss": "1.020e+00", "dlm_acc": "5.668e-01", "anc_acc": "5.521e-01", "epoch": 0.07929} {"step": 39650, "loss": 0.9125, "grad_norm": "8.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.273e-01", "anc_loss": "8.105e-01", "dlm_acc": "7.099e-01", "anc_acc": "6.892e-01", "epoch": 0.0793} {"step": 39655, "loss": 0.8549, "grad_norm": "3.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.266e-01", "anc_loss": "9.043e-01", "dlm_acc": "6.598e-01", "anc_acc": "6.358e-01", "epoch": 0.07931} {"step": 39660, "loss": 0.9782, "grad_norm": "6.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.301e-01", "anc_loss": "5.827e-01", "dlm_acc": "7.995e-01", "anc_acc": "7.843e-01", "epoch": 0.07932} {"step": 39665, "loss": 1.5136, "grad_norm": "3.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.197e+00", "dlm_acc": "6.384e-01", "anc_acc": "6.195e-01", "epoch": 0.07933} {"step": 39670, "loss": 1.3847, "grad_norm": "8.572e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.123e+00", "dlm_acc": "6.214e-01", "anc_acc": "6.014e-01", "epoch": 0.07934} {"step": 39675, "loss": 1.3214, "grad_norm": "4.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.266e-01", "anc_loss": "9.781e-01", "dlm_acc": "5.522e-01", "anc_acc": "5.382e-01", "epoch": 0.07935} {"step": 39680, "loss": 1.572, "grad_norm": "6.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.218e+00", "dlm_acc": "6.119e-01", "anc_acc": "5.894e-01", "epoch": 0.07936} {"step": 39685, "loss": 1.2372, "grad_norm": "3.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.037e+00", "dlm_acc": "4.318e-01", "anc_acc": "4.157e-01", "epoch": 0.07937} {"step": 39690, "loss": 1.0689, "grad_norm": "5.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.016e-01", "anc_loss": "6.652e-01", "dlm_acc": "6.870e-01", "anc_acc": "6.613e-01", "epoch": 0.07938} {"step": 39695, "loss": 0.9079, "grad_norm": "2.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.262e-01", "anc_loss": "4.949e-01", "dlm_acc": "7.412e-01", "anc_acc": "7.069e-01", "epoch": 0.07939} {"step": 39700, "loss": 1.1759, "grad_norm": "4.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.812e-01", "anc_loss": "9.383e-01", "dlm_acc": "5.231e-01", "anc_acc": "5.041e-01", "epoch": 0.0794} {"step": 39705, "loss": 1.1629, "grad_norm": "4.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.195e-01", "anc_loss": "5.641e-01", "dlm_acc": "6.588e-01", "anc_acc": "6.341e-01", "epoch": 0.07941} {"step": 39710, "loss": 1.2293, "grad_norm": "2.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.156e-01", "anc_loss": "5.484e-01", "dlm_acc": "6.423e-01", "anc_acc": "6.195e-01", "epoch": 0.07942} {"step": 39715, "loss": 0.8509, "grad_norm": "1.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.219e-01", "anc_loss": "4.527e-01", "dlm_acc": "6.695e-01", "anc_acc": "6.459e-01", "epoch": 0.07943} {"step": 39720, "loss": 1.1639, "grad_norm": "4.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.152e-01", "anc_loss": "5.359e-01", "dlm_acc": "6.285e-01", "anc_acc": "6.156e-01", "epoch": 0.07944} {"step": 39725, "loss": 1.0309, "grad_norm": "2.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.348e-01", "anc_loss": "4.574e-01", "dlm_acc": "6.808e-01", "anc_acc": "6.655e-01", "epoch": 0.07945} {"step": 39730, "loss": 1.2087, "grad_norm": "7.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.313e-01", "anc_loss": "8.727e-01", "dlm_acc": "4.917e-01", "anc_acc": "4.810e-01", "epoch": 0.07946} {"step": 39735, "loss": 0.7822, "grad_norm": "2.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.188e-01", "anc_loss": "5.426e-01", "dlm_acc": "6.151e-01", "anc_acc": "6.029e-01", "epoch": 0.07947} {"step": 39740, "loss": 0.9177, "grad_norm": "1.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.551e-01", "anc_loss": "8.047e-01", "dlm_acc": "6.724e-01", "anc_acc": "6.585e-01", "epoch": 0.07948} {"step": 39745, "loss": 0.6473, "grad_norm": "2.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.584e-01", "anc_loss": "5.496e-01", "dlm_acc": "7.392e-01", "anc_acc": "7.044e-01", "epoch": 0.07949} {"step": 39750, "loss": 1.3457, "grad_norm": "3.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.105e-01", "anc_loss": "7.863e-01", "dlm_acc": "6.431e-01", "anc_acc": "6.106e-01", "epoch": 0.0795} {"step": 39755, "loss": 1.6502, "grad_norm": "5.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.816e-01", "anc_acc": "5.551e-01", "epoch": 0.07951} {"step": 39760, "loss": 1.1344, "grad_norm": "2.559e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.850e-01", "anc_loss": "5.523e-01", "dlm_acc": "7.479e-01", "anc_acc": "7.249e-01", "epoch": 0.07952} {"step": 39765, "loss": 1.4015, "grad_norm": "4.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.492e+00", "dlm_acc": "4.483e-01", "anc_acc": "4.304e-01", "epoch": 0.07953} {"step": 39770, "loss": 1.177, "grad_norm": "5.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.570e-01", "anc_loss": "1.008e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.770e-01", "epoch": 0.07954} {"step": 39775, "loss": 1.2558, "grad_norm": "2.171e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.740e-01", "anc_loss": "7.129e-01", "dlm_acc": "6.194e-01", "anc_acc": "6.080e-01", "epoch": 0.07955} {"step": 39780, "loss": 1.3823, "grad_norm": "4.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.020e+00", "anc_loss": "1.091e+00", "dlm_acc": "4.936e-01", "anc_acc": "4.746e-01", "epoch": 0.07956} {"step": 39785, "loss": 1.4959, "grad_norm": "6.366e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.070e+00", "dlm_acc": "3.127e-01", "anc_acc": "3.047e-01", "epoch": 0.07957} {"step": 39790, "loss": 1.2501, "grad_norm": "3.199e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.398e-01", "anc_loss": "8.516e-01", "dlm_acc": "3.437e-01", "anc_acc": "3.350e-01", "epoch": 0.07958} {"step": 39795, "loss": 1.102, "grad_norm": "2.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.000e-01", "anc_loss": "8.141e-01", "dlm_acc": "3.325e-01", "anc_acc": "3.252e-01", "epoch": 0.07959} {"step": 39800, "loss": 1.4096, "grad_norm": "3.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.128e+00", "anc_loss": "1.176e+00", "dlm_acc": "3.639e-01", "anc_acc": "3.481e-01", "epoch": 0.0796} {"step": 39805, "loss": 0.9595, "grad_norm": "3.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.672e-01", "anc_loss": "4.310e-01", "dlm_acc": "8.539e-01", "anc_acc": "8.338e-01", "epoch": 0.07961} {"step": 39810, "loss": 0.9891, "grad_norm": "2.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.461e-01", "anc_loss": "8.668e-01", "dlm_acc": "7.105e-01", "anc_acc": "6.855e-01", "epoch": 0.07962} {"step": 39815, "loss": 1.5054, "grad_norm": "3.947e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.170e+00", "dlm_acc": "5.456e-01", "anc_acc": "5.154e-01", "epoch": 0.07963} {"step": 39820, "loss": 1.7423, "grad_norm": "3.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.626e+00", "anc_loss": "1.752e+00", "dlm_acc": "4.882e-01", "anc_acc": "4.586e-01", "epoch": 0.07964} {"step": 39825, "loss": 1.2763, "grad_norm": "3.925e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.766e-01", "anc_loss": "7.836e-01", "dlm_acc": "5.386e-01", "anc_acc": "5.364e-01", "epoch": 0.07965} {"step": 39830, "loss": 1.409, "grad_norm": "3.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.156e+00", "dlm_acc": "5.812e-01", "anc_acc": "5.502e-01", "epoch": 0.07966} {"step": 39835, "loss": 1.1285, "grad_norm": "3.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.277e-01", "anc_loss": "7.961e-01", "dlm_acc": "6.145e-01", "anc_acc": "5.802e-01", "epoch": 0.07967} {"step": 39840, "loss": 1.1748, "grad_norm": "3.997e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.194e+00", "dlm_acc": "5.867e-01", "anc_acc": "5.573e-01", "epoch": 0.07968} {"step": 39845, "loss": 1.1125, "grad_norm": "3.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.039e-01", "anc_loss": "8.617e-01", "dlm_acc": "6.023e-01", "anc_acc": "5.802e-01", "epoch": 0.07969} {"step": 39850, "loss": 0.9208, "grad_norm": "3.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.563e-01", "anc_loss": "1.022e+00", "dlm_acc": "4.998e-01", "anc_acc": "4.816e-01", "epoch": 0.0797} {"step": 39855, "loss": 1.2717, "grad_norm": "2.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.676e-01", "anc_loss": "9.473e-01", "dlm_acc": "6.084e-01", "anc_acc": "5.745e-01", "epoch": 0.07971} {"step": 39860, "loss": 0.8896, "grad_norm": "2.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.758e-01", "anc_loss": "7.332e-01", "dlm_acc": "6.260e-01", "anc_acc": "6.030e-01", "epoch": 0.07972} {"step": 39865, "loss": 1.3069, "grad_norm": "4.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.226e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.431e-01", "anc_acc": "5.186e-01", "epoch": 0.07973} {"step": 39870, "loss": 0.9149, "grad_norm": "6.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.441e-01", "anc_loss": "7.152e-01", "dlm_acc": "6.597e-01", "anc_acc": "6.327e-01", "epoch": 0.07974} {"step": 39875, "loss": 1.1552, "grad_norm": "4.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.785e-01", "anc_acc": "5.428e-01", "epoch": 0.07975} {"step": 39880, "loss": 0.8249, "grad_norm": "4.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.680e-01", "anc_loss": "8.176e-01", "dlm_acc": "5.234e-01", "anc_acc": "5.079e-01", "epoch": 0.07976} {"step": 39885, "loss": 0.9762, "grad_norm": "4.324e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.410e-01", "anc_loss": "1.032e+00", "dlm_acc": "6.006e-01", "anc_acc": "5.775e-01", "epoch": 0.07977} {"step": 39890, "loss": 1.3176, "grad_norm": "1.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.324e+00", "anc_loss": "1.443e+00", "dlm_acc": "5.569e-01", "anc_acc": "5.243e-01", "epoch": 0.07978} {"step": 39895, "loss": 1.0723, "grad_norm": "4.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.505e-01", "anc_loss": "1.058e+00", "dlm_acc": "7.059e-01", "anc_acc": "6.814e-01", "epoch": 0.07979} {"step": 39900, "loss": 1.3716, "grad_norm": "4.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.007e+00", "anc_loss": "1.085e+00", "dlm_acc": "6.169e-01", "anc_acc": "5.981e-01", "epoch": 0.0798} {"step": 39905, "loss": 1.1757, "grad_norm": "5.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.132e+00", "dlm_acc": "5.680e-01", "anc_acc": "5.403e-01", "epoch": 0.07981} {"step": 39910, "loss": 1.0479, "grad_norm": "2.911e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.555e-01", "anc_loss": "8.680e-01", "dlm_acc": "3.416e-01", "anc_acc": "3.355e-01", "epoch": 0.07982} {"step": 39915, "loss": 0.9719, "grad_norm": "2.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.183e+00", "dlm_acc": "5.959e-01", "anc_acc": "5.664e-01", "epoch": 0.07983} {"step": 39920, "loss": 1.3259, "grad_norm": "2.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.562e+00", "anc_loss": "1.686e+00", "dlm_acc": "4.955e-01", "anc_acc": "4.686e-01", "epoch": 0.07984} {"step": 39925, "loss": 1.137, "grad_norm": "2.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.971e-01", "anc_acc": "5.691e-01", "epoch": 0.07985} {"step": 39930, "loss": 1.1443, "grad_norm": "3.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.173e+00", "dlm_acc": "6.045e-01", "anc_acc": "5.793e-01", "epoch": 0.07986} {"step": 39935, "loss": 1.0821, "grad_norm": "3.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.212e+00", "dlm_acc": "6.225e-01", "anc_acc": "5.911e-01", "epoch": 0.07987} {"step": 39940, "loss": 1.5735, "grad_norm": "4.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.525e+00", "anc_loss": "1.641e+00", "dlm_acc": "5.441e-01", "anc_acc": "5.193e-01", "epoch": 0.07988} {"step": 39945, "loss": 1.1887, "grad_norm": "3.061e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.347e-01", "anc_acc": "5.107e-01", "epoch": 0.07989} {"step": 39950, "loss": 1.0932, "grad_norm": "2.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.294e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.537e-01", "anc_acc": "5.246e-01", "epoch": 0.0799} {"step": 39955, "loss": 0.8637, "grad_norm": "2.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.296e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.625e-01", "epoch": 0.07991} {"step": 39960, "loss": 0.9717, "grad_norm": "8.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.378e-01", "anc_loss": "8.215e-01", "dlm_acc": "7.197e-01", "anc_acc": "7.025e-01", "epoch": 0.07992} {"step": 39965, "loss": 1.2553, "grad_norm": "3.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.411e-01", "anc_loss": "9.268e-01", "dlm_acc": "7.421e-01", "anc_acc": "7.237e-01", "epoch": 0.07993} {"step": 39970, "loss": 1.5505, "grad_norm": "4.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.993e-01", "anc_acc": "5.730e-01", "epoch": 0.07994} {"step": 39975, "loss": 0.9374, "grad_norm": "2.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.031e+00", "anc_loss": "1.121e+00", "dlm_acc": "6.317e-01", "anc_acc": "6.096e-01", "epoch": 0.07995} {"step": 39980, "loss": 1.7794, "grad_norm": "2.432e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.994e+00", "anc_loss": "2.128e+00", "dlm_acc": "4.525e-01", "anc_acc": "4.254e-01", "epoch": 0.07996} {"step": 39985, "loss": 1.2948, "grad_norm": "1.081e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.569e+00", "anc_loss": "1.689e+00", "dlm_acc": "4.961e-01", "anc_acc": "4.654e-01", "epoch": 0.07997} {"step": 39990, "loss": 1.1002, "grad_norm": "1.808e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.259e+00", "dlm_acc": "5.739e-01", "anc_acc": "5.454e-01", "epoch": 0.07998} {"step": 39995, "loss": 1.1372, "grad_norm": "2.461e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.435e+00", "dlm_acc": "5.465e-01", "anc_acc": "5.205e-01", "epoch": 0.07999} {"step": 40000, "loss": 1.1576, "grad_norm": "2.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.776e-01", "anc_acc": "5.478e-01", "epoch": 0.08} {"step": 40005, "loss": 1.4812, "grad_norm": "3.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.397e+00", "anc_loss": "1.514e+00", "dlm_acc": "5.322e-01", "anc_acc": "5.042e-01", "epoch": 0.08001} {"step": 40010, "loss": 1.2283, "grad_norm": "4.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.309e+00", "dlm_acc": "5.901e-01", "anc_acc": "5.589e-01", "epoch": 0.08002} {"step": 40015, "loss": 1.1406, "grad_norm": "4.039e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.965e-01", "anc_acc": "5.667e-01", "epoch": 0.08003} {"step": 40020, "loss": 1.0514, "grad_norm": "5.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.115e-01", "anc_loss": "4.678e-01", "dlm_acc": "8.417e-01", "anc_acc": "7.942e-01", "epoch": 0.08004} {"step": 40025, "loss": 1.1644, "grad_norm": "3.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.527e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.426e-01", "anc_acc": "6.141e-01", "epoch": 0.08005} {"step": 40030, "loss": 1.2508, "grad_norm": "3.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.626e+00", "anc_loss": "1.745e+00", "dlm_acc": "4.928e-01", "anc_acc": "4.665e-01", "epoch": 0.08006} {"step": 40035, "loss": 1.0989, "grad_norm": "2.456e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.399e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.602e-01", "anc_acc": "5.255e-01", "epoch": 0.08007} {"step": 40040, "loss": 1.0382, "grad_norm": "3.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.421e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.519e-01", "anc_acc": "5.238e-01", "epoch": 0.08008} {"step": 40045, "loss": 1.0523, "grad_norm": "5.510e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.449e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.097e-01", "epoch": 0.08009} {"step": 40050, "loss": 1.0407, "grad_norm": "2.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.441e+00", "dlm_acc": "6.130e-01", "anc_acc": "5.900e-01", "epoch": 0.0801} {"step": 40055, "loss": 1.0706, "grad_norm": "3.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.974e-01", "anc_loss": "5.589e-01", "dlm_acc": "8.420e-01", "anc_acc": "8.286e-01", "epoch": 0.08011} {"step": 40060, "loss": 0.8998, "grad_norm": "2.283e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.398e-01", "anc_loss": "1.034e+00", "dlm_acc": "5.597e-01", "anc_acc": "5.343e-01", "epoch": 0.08012} {"step": 40065, "loss": 1.0064, "grad_norm": "2.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.246e+00", "dlm_acc": "6.074e-01", "anc_acc": "5.779e-01", "epoch": 0.08013} {"step": 40070, "loss": 0.7808, "grad_norm": "2.260e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.980e-01", "anc_loss": "1.099e+00", "dlm_acc": "6.166e-01", "anc_acc": "5.843e-01", "epoch": 0.08014} {"step": 40075, "loss": 1.2206, "grad_norm": "3.630e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.641e-01", "anc_loss": "8.633e-01", "dlm_acc": "6.824e-01", "anc_acc": "6.424e-01", "epoch": 0.08015} {"step": 40080, "loss": 0.9575, "grad_norm": "3.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.730e-01", "anc_loss": "1.149e+00", "dlm_acc": "6.233e-01", "anc_acc": "5.713e-01", "epoch": 0.08016} {"step": 40085, "loss": 1.1226, "grad_norm": "2.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.302e-01", "epoch": 0.08017} {"step": 40090, "loss": 0.8599, "grad_norm": "3.331e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.148e+00", "dlm_acc": "5.510e-01", "anc_acc": "5.165e-01", "epoch": 0.08018} {"step": 40095, "loss": 1.4404, "grad_norm": "2.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.563e+00", "dlm_acc": "5.029e-01", "anc_acc": "4.747e-01", "epoch": 0.08019} {"step": 40100, "loss": 1.3115, "grad_norm": "1.834e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.525e+00", "anc_loss": "1.659e+00", "dlm_acc": "4.973e-01", "anc_acc": "4.653e-01", "epoch": 0.0802} {"step": 40105, "loss": 1.5514, "grad_norm": "5.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.505e+00", "anc_loss": "2.562e+00", "dlm_acc": "1.955e-01", "anc_acc": "1.854e-01", "epoch": 0.08021} {"step": 40110, "loss": 1.105, "grad_norm": "4.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.440e+00", "dlm_acc": "4.620e-01", "anc_acc": "4.383e-01", "epoch": 0.08022} {"step": 40115, "loss": 1.0337, "grad_norm": "3.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.145e+00", "dlm_acc": "5.599e-01", "anc_acc": "5.396e-01", "epoch": 0.08023} {"step": 40120, "loss": 1.2285, "grad_norm": "2.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.170e+00", "dlm_acc": "5.848e-01", "anc_acc": "5.426e-01", "epoch": 0.08024} {"step": 40125, "loss": 1.0334, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.480e-01", "anc_loss": "8.125e-01", "dlm_acc": "6.331e-01", "anc_acc": "6.059e-01", "epoch": 0.08025} {"step": 40130, "loss": 0.9346, "grad_norm": "1.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.340e-01", "anc_loss": "9.246e-01", "dlm_acc": "6.418e-01", "anc_acc": "6.181e-01", "epoch": 0.08026} {"step": 40135, "loss": 1.144, "grad_norm": "2.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.438e+00", "anc_loss": "1.516e+00", "dlm_acc": "4.651e-01", "anc_acc": "4.441e-01", "epoch": 0.08027} {"step": 40140, "loss": 1.0163, "grad_norm": "4.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.980e-01", "anc_acc": "5.626e-01", "epoch": 0.08028} {"step": 40145, "loss": 1.2277, "grad_norm": "2.092e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.037e+00", "anc_loss": "1.143e+00", "dlm_acc": "6.396e-01", "anc_acc": "6.122e-01", "epoch": 0.08029} {"step": 40150, "loss": 1.2722, "grad_norm": "4.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.762e-01", "anc_loss": "1.191e+00", "dlm_acc": "6.219e-01", "anc_acc": "5.536e-01", "epoch": 0.0803} {"step": 40155, "loss": 1.228, "grad_norm": "4.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.182e+00", "dlm_acc": "5.960e-01", "anc_acc": "5.748e-01", "epoch": 0.08031} {"step": 40160, "loss": 1.401, "grad_norm": "9.114e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.118e+00", "dlm_acc": "6.218e-01", "anc_acc": "5.980e-01", "epoch": 0.08032} {"step": 40165, "loss": 1.0292, "grad_norm": "3.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.756e-01", "anc_loss": "9.969e-01", "dlm_acc": "6.390e-01", "anc_acc": "6.004e-01", "epoch": 0.08033} {"step": 40170, "loss": 0.7578, "grad_norm": "3.977e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.289e-01", "anc_loss": "6.992e-01", "dlm_acc": "5.993e-01", "anc_acc": "5.622e-01", "epoch": 0.08034} {"step": 40175, "loss": 1.6056, "grad_norm": "2.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.764e+00", "anc_loss": "1.877e+00", "dlm_acc": "3.935e-01", "anc_acc": "3.604e-01", "epoch": 0.08035} {"step": 40180, "loss": 0.8146, "grad_norm": "2.406e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.391e-01", "anc_loss": "1.088e+00", "dlm_acc": "5.830e-01", "anc_acc": "5.370e-01", "epoch": 0.08036} {"step": 40185, "loss": 1.7421, "grad_norm": "4.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.500e+00", "dlm_acc": "5.712e-01", "anc_acc": "5.232e-01", "epoch": 0.08037} {"step": 40190, "loss": 1.3194, "grad_norm": "2.716e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.070e-01", "anc_loss": "9.961e-01", "dlm_acc": "5.964e-01", "anc_acc": "5.701e-01", "epoch": 0.08038} {"step": 40195, "loss": 1.2844, "grad_norm": "3.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.089e-01", "epoch": 0.08039} {"step": 40200, "loss": 1.0176, "grad_norm": "3.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.165e+00", "dlm_acc": "6.142e-01", "anc_acc": "5.821e-01", "epoch": 0.0804} {"step": 40205, "loss": 1.3735, "grad_norm": "5.877e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.431e+00", "anc_loss": "1.517e+00", "dlm_acc": "4.887e-01", "anc_acc": "4.634e-01", "epoch": 0.08041} {"step": 40210, "loss": 1.2102, "grad_norm": "7.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.304e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.518e-01", "anc_acc": "5.070e-01", "epoch": 0.08042} {"step": 40215, "loss": 1.2033, "grad_norm": "5.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.514e+00", "dlm_acc": "4.985e-01", "anc_acc": "4.688e-01", "epoch": 0.08043} {"step": 40220, "loss": 1.0625, "grad_norm": "3.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.318e-01", "epoch": 0.08044} {"step": 40225, "loss": 1.0924, "grad_norm": "4.182e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.104e+00", "anc_loss": "1.231e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.330e-01", "epoch": 0.08045} {"step": 40230, "loss": 1.413, "grad_norm": "4.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.262e+00", "dlm_acc": "6.104e-01", "anc_acc": "5.721e-01", "epoch": 0.08046} {"step": 40235, "loss": 1.0724, "grad_norm": "3.137e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.289e-01", "anc_loss": "9.383e-01", "dlm_acc": "6.554e-01", "anc_acc": "6.196e-01", "epoch": 0.08047} {"step": 40240, "loss": 1.4571, "grad_norm": "7.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.368e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.692e-01", "anc_acc": "5.422e-01", "epoch": 0.08048} {"step": 40245, "loss": 1.1711, "grad_norm": "5.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.249e-01", "anc_acc": "4.937e-01", "epoch": 0.08049} {"step": 40250, "loss": 0.705, "grad_norm": "2.734e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.266e+00", "dlm_acc": "5.997e-01", "anc_acc": "5.681e-01", "epoch": 0.0805} {"step": 40255, "loss": 0.9822, "grad_norm": "2.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.919e-01", "anc_acc": "5.601e-01", "epoch": 0.08051} {"step": 40260, "loss": 1.1723, "grad_norm": "5.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.356e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.442e-01", "anc_acc": "5.165e-01", "epoch": 0.08052} {"step": 40265, "loss": 1.0835, "grad_norm": "3.525e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.076e+00", "anc_loss": "1.185e+00", "dlm_acc": "6.039e-01", "anc_acc": "5.767e-01", "epoch": 0.08053} {"step": 40270, "loss": 1.9373, "grad_norm": "3.752e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.250e+00", "anc_loss": "1.383e+00", "dlm_acc": "5.975e-01", "anc_acc": "5.653e-01", "epoch": 0.08054} {"step": 40275, "loss": 1.6909, "grad_norm": "3.196e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.887e-01", "anc_acc": "5.537e-01", "epoch": 0.08055} {"step": 40280, "loss": 1.8672, "grad_norm": "3.623e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.511e+00", "dlm_acc": "5.508e-01", "anc_acc": "5.249e-01", "epoch": 0.08056} {"step": 40285, "loss": 1.8306, "grad_norm": "2.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.528e+00", "anc_loss": "1.658e+00", "dlm_acc": "5.158e-01", "anc_acc": "4.887e-01", "epoch": 0.08057} {"step": 40290, "loss": 1.6329, "grad_norm": "2.649e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.537e+00", "dlm_acc": "5.622e-01", "anc_acc": "5.345e-01", "epoch": 0.08058} {"step": 40295, "loss": 1.8802, "grad_norm": "2.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.706e+00", "anc_loss": "1.858e+00", "dlm_acc": "5.105e-01", "anc_acc": "4.812e-01", "epoch": 0.08059} {"step": 40300, "loss": 1.4917, "grad_norm": "5.858e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.979e-01", "anc_loss": "1.111e+00", "dlm_acc": "6.895e-01", "anc_acc": "6.595e-01", "epoch": 0.0806} {"step": 40305, "loss": 1.622, "grad_norm": "2.531e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.196e+00", "anc_loss": "1.321e+00", "dlm_acc": "6.066e-01", "anc_acc": "5.771e-01", "epoch": 0.08061} {"step": 40310, "loss": 1.7176, "grad_norm": "3.964e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.362e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.817e-01", "anc_acc": "5.540e-01", "epoch": 0.08062} {"step": 40315, "loss": 1.3382, "grad_norm": "2.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.263e-01", "anc_acc": "4.998e-01", "epoch": 0.08063} {"step": 40320, "loss": 1.1618, "grad_norm": "4.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.162e-01", "anc_loss": "9.066e-01", "dlm_acc": "6.841e-01", "anc_acc": "6.613e-01", "epoch": 0.08064} {"step": 40325, "loss": 1.4033, "grad_norm": "5.406e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.252e+00", "dlm_acc": "6.495e-01", "anc_acc": "6.161e-01", "epoch": 0.08065} {"step": 40330, "loss": 1.5986, "grad_norm": "2.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.496e+00", "anc_loss": "1.625e+00", "dlm_acc": "4.471e-01", "anc_acc": "4.220e-01", "epoch": 0.08066} {"step": 40335, "loss": 1.3784, "grad_norm": "5.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.755e-01", "anc_acc": "5.447e-01", "epoch": 0.08067} {"step": 40340, "loss": 1.3016, "grad_norm": "4.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.400e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.239e-01", "anc_acc": "4.954e-01", "epoch": 0.08068} {"step": 40345, "loss": 0.722, "grad_norm": "1.032e+00", "learning_rate": "1.000e-04", "dlm_loss": "4.687e-01", "anc_loss": "5.611e-01", "dlm_acc": "7.991e-01", "anc_acc": "7.647e-01", "epoch": 0.08069} {"step": 40350, "loss": 1.4266, "grad_norm": "3.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.275e+00", "anc_loss": "1.414e+00", "dlm_acc": "5.627e-01", "anc_acc": "5.317e-01", "epoch": 0.0807} {"step": 40355, "loss": 1.3908, "grad_norm": "3.239e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.334e+00", "dlm_acc": "5.872e-01", "anc_acc": "5.562e-01", "epoch": 0.08071} {"step": 40360, "loss": 1.338, "grad_norm": "4.480e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.180e+00", "dlm_acc": "6.003e-01", "anc_acc": "5.714e-01", "epoch": 0.08072} {"step": 40365, "loss": 1.1559, "grad_norm": "5.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.522e+00", "anc_loss": "1.662e+00", "dlm_acc": "5.602e-01", "anc_acc": "5.313e-01", "epoch": 0.08073} {"step": 40370, "loss": 0.9825, "grad_norm": "2.219e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.230e+00", "anc_loss": "1.339e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.394e-01", "epoch": 0.08074} {"step": 40375, "loss": 1.1759, "grad_norm": "1.120e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.152e+00", "dlm_acc": "6.575e-01", "anc_acc": "6.306e-01", "epoch": 0.08075} {"step": 40380, "loss": 1.3708, "grad_norm": "6.909e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.147e+00", "anc_loss": "1.251e+00", "dlm_acc": "6.168e-01", "anc_acc": "5.895e-01", "epoch": 0.08076} {"step": 40385, "loss": 1.1249, "grad_norm": "2.961e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.770e-01", "anc_loss": "8.980e-01", "dlm_acc": "6.700e-01", "anc_acc": "6.308e-01", "epoch": 0.08077} {"step": 40390, "loss": 1.7223, "grad_norm": "4.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.675e+00", "anc_loss": "1.811e+00", "dlm_acc": "5.259e-01", "anc_acc": "4.991e-01", "epoch": 0.08078} {"step": 40395, "loss": 1.6234, "grad_norm": "5.171e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.098e+00", "anc_loss": "2.195e+00", "dlm_acc": "3.086e-01", "anc_acc": "2.867e-01", "epoch": 0.08079} {"step": 40400, "loss": 1.5915, "grad_norm": "4.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.722e+00", "anc_loss": "2.753e+00", "dlm_acc": "7.251e-02", "anc_acc": "6.785e-02", "epoch": 0.0808} {"step": 40405, "loss": 1.1685, "grad_norm": "2.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.022e+00", "anc_loss": "1.132e+00", "dlm_acc": "6.091e-01", "anc_acc": "5.719e-01", "epoch": 0.08081} {"step": 40410, "loss": 1.1164, "grad_norm": "4.713e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.434e-01", "anc_loss": "9.766e-01", "dlm_acc": "6.434e-01", "anc_acc": "5.917e-01", "epoch": 0.08082} {"step": 40415, "loss": 1.2042, "grad_norm": "2.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.461e-01", "anc_loss": "1.051e+00", "dlm_acc": "6.381e-01", "anc_acc": "6.075e-01", "epoch": 0.08083} {"step": 40420, "loss": 1.3105, "grad_norm": "7.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.672e-01", "anc_acc": "5.334e-01", "epoch": 0.08084} {"step": 40425, "loss": 1.2051, "grad_norm": "1.149e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.031e-01", "anc_loss": "1.029e+00", "dlm_acc": "5.587e-01", "anc_acc": "5.155e-01", "epoch": 0.08085} {"step": 40430, "loss": 1.5424, "grad_norm": "4.259e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.285e+00", "anc_loss": "1.355e+00", "dlm_acc": "4.535e-01", "anc_acc": "4.339e-01", "epoch": 0.08086} {"step": 40435, "loss": 1.3711, "grad_norm": "7.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.365e+00", "dlm_acc": "5.343e-01", "anc_acc": "5.074e-01", "epoch": 0.08087} {"step": 40440, "loss": 0.9507, "grad_norm": "2.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.232e+00", "dlm_acc": "5.048e-01", "anc_acc": "4.762e-01", "epoch": 0.08088} {"step": 40445, "loss": 0.7716, "grad_norm": "2.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.520e-01", "anc_loss": "7.223e-01", "dlm_acc": "6.630e-01", "anc_acc": "6.365e-01", "epoch": 0.08089} {"step": 40450, "loss": 1.4846, "grad_norm": "3.516e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.733e+00", "dlm_acc": "4.499e-01", "anc_acc": "3.920e-01", "epoch": 0.0809} {"step": 40455, "loss": 1.3437, "grad_norm": "3.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.570e+00", "dlm_acc": "5.486e-01", "anc_acc": "5.036e-01", "epoch": 0.08091} {"step": 40460, "loss": 1.4465, "grad_norm": "1.367e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.355e+00", "dlm_acc": "5.781e-01", "anc_acc": "5.506e-01", "epoch": 0.08092} {"step": 40465, "loss": 1.5129, "grad_norm": "3.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.343e-01", "anc_acc": "5.043e-01", "epoch": 0.08093} {"step": 40470, "loss": 2.0698, "grad_norm": "3.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.190e+00", "dlm_acc": "5.714e-01", "anc_acc": "5.470e-01", "epoch": 0.08094} {"step": 40475, "loss": 1.6805, "grad_norm": "3.765e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.394e+00", "dlm_acc": "5.441e-01", "anc_acc": "5.207e-01", "epoch": 0.08095} {"step": 40480, "loss": 1.2106, "grad_norm": "4.136e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.223e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.313e-01", "epoch": 0.08096} {"step": 40485, "loss": 1.3722, "grad_norm": "2.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.406e-01", "anc_acc": "5.158e-01", "epoch": 0.08097} {"step": 40490, "loss": 1.1079, "grad_norm": "3.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.369e+00", "dlm_acc": "5.548e-01", "anc_acc": "5.208e-01", "epoch": 0.08098} {"step": 40495, "loss": 1.304, "grad_norm": "2.905e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.292e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.312e-01", "anc_acc": "5.031e-01", "epoch": 0.08099} {"step": 40500, "loss": 1.3656, "grad_norm": "5.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.248e+00", "dlm_acc": "6.287e-01", "anc_acc": "5.950e-01", "epoch": 0.081} {"step": 40505, "loss": 1.5292, "grad_norm": "4.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.271e+00", "dlm_acc": "6.362e-01", "anc_acc": "6.124e-01", "epoch": 0.08101} {"step": 40510, "loss": 1.2481, "grad_norm": "3.393e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.216e+00", "dlm_acc": "6.248e-01", "anc_acc": "5.923e-01", "epoch": 0.08102} {"step": 40515, "loss": 1.6204, "grad_norm": "3.636e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.400e-01", "anc_acc": "5.028e-01", "epoch": 0.08103} {"step": 40520, "loss": 1.2321, "grad_norm": "2.855e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.597e+00", "anc_loss": "1.706e+00", "dlm_acc": "4.386e-01", "anc_acc": "4.126e-01", "epoch": 0.08104} {"step": 40525, "loss": 0.9498, "grad_norm": "3.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.341e+00", "anc_loss": "1.505e+00", "dlm_acc": "5.781e-01", "anc_acc": "5.466e-01", "epoch": 0.08105} {"step": 40530, "loss": 0.8781, "grad_norm": "3.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.294e+00", "anc_loss": "1.427e+00", "dlm_acc": "5.451e-01", "anc_acc": "5.060e-01", "epoch": 0.08106} {"step": 40535, "loss": 1.3875, "grad_norm": "1.365e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.526e-01", "anc_acc": "5.196e-01", "epoch": 0.08107} {"step": 40540, "loss": 1.2926, "grad_norm": "3.968e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.334e+00", "dlm_acc": "6.006e-01", "anc_acc": "5.740e-01", "epoch": 0.08108} {"step": 40545, "loss": 1.2887, "grad_norm": "7.216e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.953e-01", "anc_loss": "1.107e+00", "dlm_acc": "6.422e-01", "anc_acc": "6.132e-01", "epoch": 0.08109} {"step": 40550, "loss": 1.3211, "grad_norm": "4.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.349e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.139e-01", "epoch": 0.0811} {"step": 40555, "loss": 1.5334, "grad_norm": "3.229e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.425e+00", "anc_loss": "1.550e+00", "dlm_acc": "5.086e-01", "anc_acc": "4.781e-01", "epoch": 0.08111} {"step": 40560, "loss": 0.9693, "grad_norm": "8.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.459e-01", "anc_loss": "9.443e-01", "dlm_acc": "7.061e-01", "anc_acc": "6.782e-01", "epoch": 0.08112} {"step": 40565, "loss": 1.6548, "grad_norm": "3.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.673e+00", "dlm_acc": "5.113e-01", "anc_acc": "4.801e-01", "epoch": 0.08113} {"step": 40570, "loss": 1.3071, "grad_norm": "2.620e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.128e+00", "anc_loss": "1.242e+00", "dlm_acc": "5.928e-01", "anc_acc": "5.640e-01", "epoch": 0.08114} {"step": 40575, "loss": 1.7556, "grad_norm": "4.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.272e+00", "dlm_acc": "6.312e-01", "anc_acc": "6.033e-01", "epoch": 0.08115} {"step": 40580, "loss": 1.5199, "grad_norm": "3.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.256e+00", "anc_loss": "1.397e+00", "dlm_acc": "6.023e-01", "anc_acc": "5.736e-01", "epoch": 0.08116} {"step": 40585, "loss": 1.0669, "grad_norm": "3.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.020e+00", "anc_loss": "1.135e+00", "dlm_acc": "6.262e-01", "anc_acc": "5.951e-01", "epoch": 0.08117} {"step": 40590, "loss": 1.6074, "grad_norm": "3.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.974e+00", "anc_loss": "2.116e+00", "dlm_acc": "4.766e-01", "anc_acc": "4.506e-01", "epoch": 0.08118} {"step": 40595, "loss": 0.9188, "grad_norm": "1.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.165e+00", "dlm_acc": "6.102e-01", "anc_acc": "5.831e-01", "epoch": 0.08119} {"step": 40600, "loss": 1.2694, "grad_norm": "2.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.635e+00", "dlm_acc": "5.044e-01", "anc_acc": "4.764e-01", "epoch": 0.0812} {"step": 40605, "loss": 1.0261, "grad_norm": "4.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.018e+00", "anc_loss": "1.118e+00", "dlm_acc": "6.024e-01", "anc_acc": "5.746e-01", "epoch": 0.08121} {"step": 40610, "loss": 1.1985, "grad_norm": "2.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.128e+00", "anc_loss": "1.273e+00", "dlm_acc": "6.287e-01", "anc_acc": "5.927e-01", "epoch": 0.08122} {"step": 40615, "loss": 1.0606, "grad_norm": "3.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.839e-01", "anc_loss": "1.088e+00", "dlm_acc": "6.361e-01", "anc_acc": "6.080e-01", "epoch": 0.08123} {"step": 40620, "loss": 0.7809, "grad_norm": "2.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.836e-01", "anc_loss": "1.087e+00", "dlm_acc": "6.109e-01", "anc_acc": "5.828e-01", "epoch": 0.08124} {"step": 40625, "loss": 1.3331, "grad_norm": "3.803e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.376e+00", "anc_loss": "1.497e+00", "dlm_acc": "5.655e-01", "anc_acc": "5.368e-01", "epoch": 0.08125} {"step": 40630, "loss": 1.4551, "grad_norm": "5.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.219e+00", "anc_loss": "1.329e+00", "dlm_acc": "5.930e-01", "anc_acc": "5.613e-01", "epoch": 0.08126} {"step": 40635, "loss": 1.5046, "grad_norm": "4.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.295e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.714e-01", "anc_acc": "5.428e-01", "epoch": 0.08127} {"step": 40640, "loss": 1.3077, "grad_norm": "3.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.204e+00", "dlm_acc": "6.326e-01", "anc_acc": "6.048e-01", "epoch": 0.08128} {"step": 40645, "loss": 1.0585, "grad_norm": "4.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.071e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.679e-01", "anc_acc": "6.377e-01", "epoch": 0.08129} {"step": 40650, "loss": 1.3395, "grad_norm": "2.775e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.481e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.362e-01", "epoch": 0.0813} {"step": 40655, "loss": 1.4742, "grad_norm": "3.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.711e-01", "anc_acc": "5.484e-01", "epoch": 0.08131} {"step": 40660, "loss": 1.102, "grad_norm": "2.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.460e-01", "epoch": 0.08132} {"step": 40665, "loss": 1.2771, "grad_norm": "3.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.478e+00", "dlm_acc": "5.525e-01", "anc_acc": "5.252e-01", "epoch": 0.08133} {"step": 40670, "loss": 1.3073, "grad_norm": "5.261e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.828e-01", "anc_acc": "5.541e-01", "epoch": 0.08134} {"step": 40675, "loss": 1.1247, "grad_norm": "4.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.273e-01", "anc_loss": "1.028e+00", "dlm_acc": "6.596e-01", "anc_acc": "6.334e-01", "epoch": 0.08135} {"step": 40680, "loss": 1.2535, "grad_norm": "4.334e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.482e+00", "dlm_acc": "5.746e-01", "anc_acc": "5.435e-01", "epoch": 0.08136} {"step": 40685, "loss": 1.2686, "grad_norm": "2.619e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.742e-01", "anc_loss": "9.805e-01", "dlm_acc": "6.441e-01", "anc_acc": "6.161e-01", "epoch": 0.08137} {"step": 40690, "loss": 1.8249, "grad_norm": "4.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.594e+00", "anc_loss": "1.706e+00", "dlm_acc": "4.724e-01", "anc_acc": "4.479e-01", "epoch": 0.08138} {"step": 40695, "loss": 1.585, "grad_norm": "4.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.778e-01", "anc_acc": "5.452e-01", "epoch": 0.08139} {"step": 40700, "loss": 1.32, "grad_norm": "2.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.793e-01", "anc_acc": "5.522e-01", "epoch": 0.0814} {"step": 40705, "loss": 1.228, "grad_norm": "3.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.329e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.413e-01", "anc_acc": "5.157e-01", "epoch": 0.08141} {"step": 40710, "loss": 1.0365, "grad_norm": "1.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.026e+00", "anc_loss": "1.137e+00", "dlm_acc": "6.086e-01", "anc_acc": "5.782e-01", "epoch": 0.08142} {"step": 40715, "loss": 1.2287, "grad_norm": "3.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.222e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.631e-01", "anc_acc": "5.351e-01", "epoch": 0.08143} {"step": 40720, "loss": 1.433, "grad_norm": "6.322e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.061e+00", "anc_loss": "1.157e+00", "dlm_acc": "6.553e-01", "anc_acc": "6.316e-01", "epoch": 0.08144} {"step": 40725, "loss": 1.3494, "grad_norm": "3.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.359e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.370e-01", "anc_acc": "5.080e-01", "epoch": 0.08145} {"step": 40730, "loss": 1.933, "grad_norm": "5.432e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.692e+00", "anc_loss": "1.828e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.724e-01", "epoch": 0.08146} {"step": 40735, "loss": 1.0877, "grad_norm": "2.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.145e+00", "dlm_acc": "5.842e-01", "anc_acc": "5.547e-01", "epoch": 0.08147} {"step": 40740, "loss": 1.1721, "grad_norm": "2.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.180e+00", "dlm_acc": "5.698e-01", "anc_acc": "5.433e-01", "epoch": 0.08148} {"step": 40745, "loss": 0.9338, "grad_norm": "1.892e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.248e+00", "dlm_acc": "5.714e-01", "anc_acc": "5.421e-01", "epoch": 0.08149} {"step": 40750, "loss": 1.5138, "grad_norm": "3.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.191e+00", "anc_loss": "1.290e+00", "dlm_acc": "6.153e-01", "anc_acc": "5.836e-01", "epoch": 0.0815} {"step": 40755, "loss": 1.4431, "grad_norm": "3.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.852e-01", "anc_loss": "1.038e+00", "dlm_acc": "5.477e-01", "anc_acc": "5.281e-01", "epoch": 0.08151} {"step": 40760, "loss": 1.313, "grad_norm": "6.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.171e+00", "dlm_acc": "5.617e-01", "anc_acc": "5.391e-01", "epoch": 0.08152} {"step": 40765, "loss": 1.8448, "grad_norm": "4.961e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.250e+00", "anc_loss": "1.353e+00", "dlm_acc": "5.769e-01", "anc_acc": "5.542e-01", "epoch": 0.08153} {"step": 40770, "loss": 1.1085, "grad_norm": "3.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.160e-01", "anc_loss": "9.379e-01", "dlm_acc": "6.499e-01", "anc_acc": "6.117e-01", "epoch": 0.08154} {"step": 40775, "loss": 1.3208, "grad_norm": "3.666e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.352e-01", "anc_loss": "1.012e+00", "dlm_acc": "5.197e-01", "anc_acc": "4.953e-01", "epoch": 0.08155} {"step": 40780, "loss": 1.2389, "grad_norm": "5.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.809e-01", "anc_loss": "6.883e-01", "dlm_acc": "4.958e-01", "anc_acc": "4.926e-01", "epoch": 0.08156} {"step": 40785, "loss": 1.1686, "grad_norm": "3.718e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.687e-01", "anc_loss": "6.750e-01", "dlm_acc": "5.148e-01", "anc_acc": "5.116e-01", "epoch": 0.08157} {"step": 40790, "loss": 1.0775, "grad_norm": "3.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.234e-01", "anc_loss": "7.312e-01", "dlm_acc": "4.938e-01", "anc_acc": "4.883e-01", "epoch": 0.08158} {"step": 40795, "loss": 0.9889, "grad_norm": "2.691e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.195e-01", "anc_loss": "6.254e-01", "dlm_acc": "5.225e-01", "anc_acc": "5.210e-01", "epoch": 0.08159} {"step": 40800, "loss": 0.9926, "grad_norm": "3.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.344e-01", "anc_loss": "9.056e-01", "dlm_acc": "6.710e-01", "anc_acc": "6.525e-01", "epoch": 0.0816} {"step": 40805, "loss": 1.0028, "grad_norm": "3.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.435e+00", "dlm_acc": "5.511e-01", "anc_acc": "5.226e-01", "epoch": 0.08161} {"step": 40810, "loss": 0.8303, "grad_norm": "5.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.016e-01", "anc_loss": "8.742e-01", "dlm_acc": "6.154e-01", "anc_acc": "5.925e-01", "epoch": 0.08162} {"step": 40815, "loss": 1.1063, "grad_norm": "2.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.125e+00", "dlm_acc": "6.394e-01", "anc_acc": "6.108e-01", "epoch": 0.08163} {"step": 40820, "loss": 1.301, "grad_norm": "1.276e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.271e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.286e-01", "anc_acc": "5.021e-01", "epoch": 0.08164} {"step": 40825, "loss": 1.1714, "grad_norm": "5.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.621e-01", "anc_loss": "9.484e-01", "dlm_acc": "6.283e-01", "anc_acc": "5.808e-01", "epoch": 0.08165} {"step": 40830, "loss": 1.452, "grad_norm": "2.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.692e-01", "anc_acc": "5.479e-01", "epoch": 0.08166} {"step": 40835, "loss": 0.9612, "grad_norm": "3.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.437e-01", "anc_loss": "1.047e+00", "dlm_acc": "5.898e-01", "anc_acc": "5.623e-01", "epoch": 0.08167} {"step": 40840, "loss": 1.2555, "grad_norm": "1.805e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.846e-01", "anc_loss": "1.060e+00", "dlm_acc": "6.744e-01", "anc_acc": "6.541e-01", "epoch": 0.08168} {"step": 40845, "loss": 0.7838, "grad_norm": "2.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.792e-01", "anc_loss": "3.993e-01", "dlm_acc": "6.802e-01", "anc_acc": "6.682e-01", "epoch": 0.08169} {"step": 40850, "loss": 1.3174, "grad_norm": "3.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.212e+00", "dlm_acc": "6.609e-01", "anc_acc": "6.414e-01", "epoch": 0.0817} {"step": 40855, "loss": 1.2813, "grad_norm": "3.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.358e+00", "anc_loss": "1.489e+00", "dlm_acc": "5.105e-01", "anc_acc": "4.732e-01", "epoch": 0.08171} {"step": 40860, "loss": 1.3954, "grad_norm": "4.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.878e-01", "anc_acc": "5.563e-01", "epoch": 0.08172} {"step": 40865, "loss": 1.0508, "grad_norm": "3.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.798e-01", "anc_loss": "5.811e-01", "dlm_acc": "7.831e-01", "anc_acc": "7.564e-01", "epoch": 0.08173} {"step": 40870, "loss": 1.2314, "grad_norm": "3.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.219e-01", "anc_loss": "9.949e-01", "dlm_acc": "5.921e-01", "anc_acc": "5.658e-01", "epoch": 0.08174} {"step": 40875, "loss": 1.3341, "grad_norm": "4.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.047e+00", "anc_loss": "1.137e+00", "dlm_acc": "6.179e-01", "anc_acc": "5.904e-01", "epoch": 0.08175} {"step": 40880, "loss": 0.9035, "grad_norm": "2.424e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.764e-01", "anc_loss": "5.127e-01", "dlm_acc": "7.290e-01", "anc_acc": "7.087e-01", "epoch": 0.08176} {"step": 40885, "loss": 1.0546, "grad_norm": "2.094e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.500e-01", "anc_loss": "6.906e-01", "dlm_acc": "5.862e-01", "anc_acc": "5.691e-01", "epoch": 0.08177} {"step": 40890, "loss": 1.3303, "grad_norm": "4.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.229e+00", "dlm_acc": "6.470e-01", "anc_acc": "6.264e-01", "epoch": 0.08178} {"step": 40895, "loss": 1.6072, "grad_norm": "4.171e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.087e+00", "dlm_acc": "6.362e-01", "anc_acc": "6.156e-01", "epoch": 0.08179} {"step": 40900, "loss": 1.3948, "grad_norm": "5.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.234e-01", "anc_loss": "9.883e-01", "dlm_acc": "5.841e-01", "anc_acc": "5.656e-01", "epoch": 0.0818} {"step": 40905, "loss": 1.2542, "grad_norm": "2.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.828e-01", "anc_loss": "8.477e-01", "dlm_acc": "6.072e-01", "anc_acc": "5.792e-01", "epoch": 0.08181} {"step": 40910, "loss": 0.8897, "grad_norm": "2.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.014e-01", "anc_loss": "6.668e-01", "dlm_acc": "7.959e-01", "anc_acc": "7.799e-01", "epoch": 0.08182} {"step": 40915, "loss": 0.8991, "grad_norm": "3.437e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.331e-01", "anc_acc": "5.055e-01", "epoch": 0.08183} {"step": 40920, "loss": 0.6169, "grad_norm": "5.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.122e+00", "anc_loss": "1.228e+00", "dlm_acc": "5.420e-01", "anc_acc": "5.135e-01", "epoch": 0.08184} {"step": 40925, "loss": 0.8449, "grad_norm": "2.105e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.421e+00", "dlm_acc": "5.673e-01", "anc_acc": "5.347e-01", "epoch": 0.08185} {"step": 40930, "loss": 1.0886, "grad_norm": "8.089e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.134e+00", "dlm_acc": "5.901e-01", "anc_acc": "5.702e-01", "epoch": 0.08186} {"step": 40935, "loss": 1.1046, "grad_norm": "2.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.226e-01", "anc_acc": "4.937e-01", "epoch": 0.08187} {"step": 40940, "loss": 0.9469, "grad_norm": "8.395e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.474e-01", "anc_acc": "5.132e-01", "epoch": 0.08188} {"step": 40945, "loss": 1.207, "grad_norm": "3.617e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.537e+00", "dlm_acc": "4.521e-01", "anc_acc": "4.305e-01", "epoch": 0.08189} {"step": 40950, "loss": 0.9378, "grad_norm": "5.019e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.260e+00", "dlm_acc": "5.970e-01", "anc_acc": "5.675e-01", "epoch": 0.0819} {"step": 40955, "loss": 1.1983, "grad_norm": "4.469e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.332e-01", "anc_loss": "8.898e-01", "dlm_acc": "7.061e-01", "anc_acc": "6.926e-01", "epoch": 0.08191} {"step": 40960, "loss": 1.3054, "grad_norm": "3.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.503e+00", "anc_loss": "1.617e+00", "dlm_acc": "5.255e-01", "anc_acc": "4.974e-01", "epoch": 0.08192} {"step": 40965, "loss": 1.2718, "grad_norm": "3.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.269e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.679e-01", "anc_acc": "5.359e-01", "epoch": 0.08193} {"step": 40970, "loss": 1.4906, "grad_norm": "2.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.602e+00", "anc_loss": "1.716e+00", "dlm_acc": "4.796e-01", "anc_acc": "4.524e-01", "epoch": 0.08194} {"step": 40975, "loss": 0.8317, "grad_norm": "2.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.719e-01", "anc_loss": "9.605e-01", "dlm_acc": "6.459e-01", "anc_acc": "6.186e-01", "epoch": 0.08195} {"step": 40980, "loss": 0.9133, "grad_norm": "2.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.180e-01", "anc_loss": "1.014e+00", "dlm_acc": "6.215e-01", "anc_acc": "5.919e-01", "epoch": 0.08196} {"step": 40985, "loss": 1.3926, "grad_norm": "4.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.523e+00", "anc_loss": "1.630e+00", "dlm_acc": "5.047e-01", "anc_acc": "4.819e-01", "epoch": 0.08197} {"step": 40990, "loss": 1.3671, "grad_norm": "4.626e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.602e+00", "anc_loss": "1.730e+00", "dlm_acc": "5.065e-01", "anc_acc": "4.791e-01", "epoch": 0.08198} {"step": 40995, "loss": 1.1521, "grad_norm": "2.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.294e+00", "anc_loss": "1.382e+00", "dlm_acc": "5.981e-01", "anc_acc": "5.760e-01", "epoch": 0.08199} {"step": 41000, "loss": 1.4793, "grad_norm": "2.029e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.421e+00", "dlm_acc": "5.538e-01", "anc_acc": "5.225e-01", "epoch": 0.082} {"step": 41005, "loss": 1.7346, "grad_norm": "8.410e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.397e+00", "anc_loss": "1.525e+00", "dlm_acc": "5.474e-01", "anc_acc": "5.199e-01", "epoch": 0.08201} {"step": 41010, "loss": 1.6732, "grad_norm": "3.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.020e+00", "anc_loss": "1.134e+00", "dlm_acc": "6.384e-01", "anc_acc": "6.073e-01", "epoch": 0.08202} {"step": 41015, "loss": 1.298, "grad_norm": "4.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.197e+00", "dlm_acc": "6.304e-01", "anc_acc": "6.030e-01", "epoch": 0.08203} {"step": 41020, "loss": 1.1828, "grad_norm": "3.420e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.039e-01", "anc_loss": "8.125e-01", "dlm_acc": "7.085e-01", "anc_acc": "6.781e-01", "epoch": 0.08204} {"step": 41025, "loss": 0.7201, "grad_norm": "2.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.844e-01", "anc_loss": "6.406e-01", "dlm_acc": "5.763e-01", "anc_acc": "5.447e-01", "epoch": 0.08205} {"step": 41030, "loss": 1.3033, "grad_norm": "1.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.499e+00", "anc_loss": "1.590e+00", "dlm_acc": "5.000e-01", "anc_acc": "4.766e-01", "epoch": 0.08206} {"step": 41035, "loss": 0.9442, "grad_norm": "2.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.211e-01", "anc_loss": "8.742e-01", "dlm_acc": "6.049e-01", "anc_acc": "5.854e-01", "epoch": 0.08207} {"step": 41040, "loss": 1.2993, "grad_norm": "4.835e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.562e-01", "anc_loss": "9.777e-01", "dlm_acc": "6.221e-01", "anc_acc": "5.857e-01", "epoch": 0.08208} {"step": 41045, "loss": 1.2677, "grad_norm": "3.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.551e-01", "anc_loss": "4.652e-01", "dlm_acc": "6.741e-01", "anc_acc": "6.693e-01", "epoch": 0.08209} {"step": 41050, "loss": 1.3074, "grad_norm": "2.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.234e-01", "anc_loss": "4.332e-01", "dlm_acc": "6.934e-01", "anc_acc": "6.891e-01", "epoch": 0.0821} {"step": 41055, "loss": 1.0361, "grad_norm": "3.748e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.795e-01", "anc_loss": "6.312e-01", "dlm_acc": "7.015e-01", "anc_acc": "6.840e-01", "epoch": 0.08211} {"step": 41060, "loss": 0.9594, "grad_norm": "1.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.179e+00", "dlm_acc": "6.031e-01", "anc_acc": "5.715e-01", "epoch": 0.08212} {"step": 41065, "loss": 1.3557, "grad_norm": "3.050e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.617e-01", "anc_loss": "1.091e+00", "dlm_acc": "6.261e-01", "anc_acc": "5.930e-01", "epoch": 0.08213} {"step": 41070, "loss": 0.9858, "grad_norm": "1.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.523e-01", "anc_loss": "6.648e-01", "dlm_acc": "4.608e-01", "anc_acc": "4.542e-01", "epoch": 0.08214} {"step": 41075, "loss": 0.9629, "grad_norm": "2.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.039e-01", "anc_loss": "5.441e-01", "dlm_acc": "7.308e-01", "anc_acc": "7.195e-01", "epoch": 0.08215} {"step": 41080, "loss": 1.1288, "grad_norm": "3.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.734e-01", "anc_loss": "1.052e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.319e-01", "epoch": 0.08216} {"step": 41085, "loss": 1.2219, "grad_norm": "3.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.555e-01", "anc_loss": "8.141e-01", "dlm_acc": "5.609e-01", "anc_acc": "5.427e-01", "epoch": 0.08217} {"step": 41090, "loss": 1.2013, "grad_norm": "3.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.578e-01", "anc_loss": "9.437e-01", "dlm_acc": "5.596e-01", "anc_acc": "5.353e-01", "epoch": 0.08218} {"step": 41095, "loss": 1.2579, "grad_norm": "3.403e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.797e-01", "anc_acc": "5.463e-01", "epoch": 0.08219} {"step": 41100, "loss": 1.446, "grad_norm": "4.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.108e+00", "anc_loss": "1.185e+00", "dlm_acc": "5.315e-01", "anc_acc": "5.045e-01", "epoch": 0.0822} {"step": 41105, "loss": 1.2831, "grad_norm": "2.605e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.820e-01", "anc_loss": "9.211e-01", "dlm_acc": "4.985e-01", "anc_acc": "4.894e-01", "epoch": 0.08221} {"step": 41110, "loss": 1.4988, "grad_norm": "2.774e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.172e-01", "anc_loss": "9.625e-01", "dlm_acc": "4.931e-01", "anc_acc": "4.756e-01", "epoch": 0.08222} {"step": 41115, "loss": 1.4331, "grad_norm": "3.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.124e+00", "dlm_acc": "4.982e-01", "anc_acc": "4.746e-01", "epoch": 0.08223} {"step": 41120, "loss": 1.2469, "grad_norm": "3.530e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.441e-01", "anc_loss": "1.070e+00", "dlm_acc": "6.366e-01", "anc_acc": "5.910e-01", "epoch": 0.08224} {"step": 41125, "loss": 1.3899, "grad_norm": "3.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.096e-01", "anc_loss": "7.744e-01", "dlm_acc": "6.628e-01", "anc_acc": "6.419e-01", "epoch": 0.08225} {"step": 41130, "loss": 1.1493, "grad_norm": "2.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.815e-01", "anc_loss": "9.799e-01", "dlm_acc": "6.632e-01", "anc_acc": "6.382e-01", "epoch": 0.08226} {"step": 41135, "loss": 1.5556, "grad_norm": "3.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.343e+00", "anc_loss": "1.484e+00", "dlm_acc": "6.006e-01", "anc_acc": "5.729e-01", "epoch": 0.08227} {"step": 41140, "loss": 1.1189, "grad_norm": "2.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.594e-01", "anc_loss": "6.008e-01", "dlm_acc": "6.732e-01", "anc_acc": "6.613e-01", "epoch": 0.08228} {"step": 41145, "loss": 1.2404, "grad_norm": "2.381e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.168e-01", "anc_loss": "4.391e-01", "dlm_acc": "6.788e-01", "anc_acc": "6.699e-01", "epoch": 0.08229} {"step": 41150, "loss": 1.2201, "grad_norm": "3.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.891e-01", "anc_loss": "4.133e-01", "dlm_acc": "6.931e-01", "anc_acc": "6.810e-01", "epoch": 0.0823} {"step": 41155, "loss": 1.1805, "grad_norm": "3.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.859e-01", "anc_loss": "4.016e-01", "dlm_acc": "7.149e-01", "anc_acc": "7.052e-01", "epoch": 0.08231} {"step": 41160, "loss": 1.2379, "grad_norm": "6.632e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.148e-01", "anc_loss": "4.340e-01", "dlm_acc": "7.018e-01", "anc_acc": "6.931e-01", "epoch": 0.08232} {"step": 41165, "loss": 1.2916, "grad_norm": "2.422e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.379e-01", "anc_loss": "4.539e-01", "dlm_acc": "6.891e-01", "anc_acc": "6.827e-01", "epoch": 0.08233} {"step": 41170, "loss": 1.5726, "grad_norm": "3.979e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.574e-01", "anc_loss": "5.813e-01", "dlm_acc": "6.158e-01", "anc_acc": "6.061e-01", "epoch": 0.08234} {"step": 41175, "loss": 0.9068, "grad_norm": "2.966e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.080e-01", "anc_loss": "8.031e-01", "dlm_acc": "7.095e-01", "anc_acc": "6.804e-01", "epoch": 0.08235} {"step": 41180, "loss": 1.2156, "grad_norm": "4.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.146e+00", "dlm_acc": "5.601e-01", "anc_acc": "5.400e-01", "epoch": 0.08236} {"step": 41185, "loss": 0.971, "grad_norm": "1.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.023e-01", "anc_loss": "7.461e-01", "dlm_acc": "5.941e-01", "anc_acc": "5.772e-01", "epoch": 0.08237} {"step": 41190, "loss": 1.5137, "grad_norm": "4.436e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.129e-01", "anc_loss": "9.734e-01", "dlm_acc": "5.929e-01", "anc_acc": "5.726e-01", "epoch": 0.08238} {"step": 41195, "loss": 1.5076, "grad_norm": "4.424e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.406e-01", "anc_loss": "9.141e-01", "dlm_acc": "6.348e-01", "anc_acc": "6.108e-01", "epoch": 0.08239} {"step": 41200, "loss": 1.1069, "grad_norm": "2.926e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.165e+00", "dlm_acc": "5.961e-01", "anc_acc": "5.697e-01", "epoch": 0.0824} {"step": 41205, "loss": 0.9524, "grad_norm": "4.787e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.207e-01", "anc_loss": "8.746e-01", "dlm_acc": "5.737e-01", "anc_acc": "5.512e-01", "epoch": 0.08241} {"step": 41210, "loss": 1.1415, "grad_norm": "3.997e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.430e-01", "anc_loss": "6.937e-01", "dlm_acc": "5.961e-01", "anc_acc": "5.745e-01", "epoch": 0.08242} {"step": 41215, "loss": 1.285, "grad_norm": "5.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.627e+00", "anc_loss": "1.752e+00", "dlm_acc": "5.096e-01", "anc_acc": "4.846e-01", "epoch": 0.08243} {"step": 41220, "loss": 0.8218, "grad_norm": "2.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.262e-01", "anc_loss": "5.883e-01", "dlm_acc": "6.761e-01", "anc_acc": "6.436e-01", "epoch": 0.08244} {"step": 41225, "loss": 0.9957, "grad_norm": "4.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.111e-01", "anc_loss": "4.371e-01", "dlm_acc": "6.884e-01", "anc_acc": "6.719e-01", "epoch": 0.08245} {"step": 41230, "loss": 0.995, "grad_norm": "3.137e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.699e-01", "anc_loss": "5.086e-01", "dlm_acc": "6.747e-01", "anc_acc": "6.523e-01", "epoch": 0.08246} {"step": 41235, "loss": 0.7336, "grad_norm": "2.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.611e-01", "anc_loss": "3.885e-01", "dlm_acc": "7.085e-01", "anc_acc": "6.901e-01", "epoch": 0.08247} {"step": 41240, "loss": 1.1665, "grad_norm": "3.434e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.863e-01", "anc_loss": "5.309e-01", "dlm_acc": "6.808e-01", "anc_acc": "6.532e-01", "epoch": 0.08248} {"step": 41245, "loss": 1.3356, "grad_norm": "2.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.289e-01", "anc_loss": "8.531e-01", "dlm_acc": "5.578e-01", "anc_acc": "5.497e-01", "epoch": 0.08249} {"step": 41250, "loss": 1.0074, "grad_norm": "3.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.609e-01", "anc_loss": "6.625e-01", "dlm_acc": "5.525e-01", "anc_acc": "5.522e-01", "epoch": 0.0825} {"step": 41255, "loss": 1.0756, "grad_norm": "8.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.473e-01", "anc_loss": "7.672e-01", "dlm_acc": "5.677e-01", "anc_acc": "5.623e-01", "epoch": 0.08251} {"step": 41260, "loss": 0.8472, "grad_norm": "3.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.750e-01", "anc_loss": "3.980e-01", "dlm_acc": "7.681e-01", "anc_acc": "7.553e-01", "epoch": 0.08252} {"step": 41265, "loss": 1.0822, "grad_norm": "3.304e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.932e-01", "anc_loss": "1.120e+00", "dlm_acc": "6.498e-01", "anc_acc": "6.168e-01", "epoch": 0.08253} {"step": 41270, "loss": 1.3706, "grad_norm": "3.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.459e+00", "anc_loss": "1.616e+00", "dlm_acc": "5.169e-01", "anc_acc": "4.800e-01", "epoch": 0.08254} {"step": 41275, "loss": 1.3549, "grad_norm": "2.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.704e+00", "dlm_acc": "5.302e-01", "anc_acc": "5.021e-01", "epoch": 0.08255} {"step": 41280, "loss": 1.1423, "grad_norm": "5.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.489e+00", "anc_loss": "1.591e+00", "dlm_acc": "4.742e-01", "anc_acc": "4.494e-01", "epoch": 0.08256} {"step": 41285, "loss": 1.1976, "grad_norm": "9.134e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.733e-01", "anc_acc": "5.446e-01", "epoch": 0.08257} {"step": 41290, "loss": 1.2996, "grad_norm": "5.010e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.367e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.402e-01", "anc_acc": "6.095e-01", "epoch": 0.08258} {"step": 41295, "loss": 1.0931, "grad_norm": "2.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.922e-01", "anc_loss": "1.094e+00", "dlm_acc": "6.366e-01", "anc_acc": "6.089e-01", "epoch": 0.08259} {"step": 41300, "loss": 1.24, "grad_norm": "3.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.103e+00", "anc_loss": "1.233e+00", "dlm_acc": "5.998e-01", "anc_acc": "5.664e-01", "epoch": 0.0826} {"step": 41305, "loss": 1.5658, "grad_norm": "5.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.267e-01", "anc_acc": "5.030e-01", "epoch": 0.08261} {"step": 41310, "loss": 1.2171, "grad_norm": "3.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.693e-01", "anc_acc": "5.414e-01", "epoch": 0.08262} {"step": 41315, "loss": 1.2405, "grad_norm": "3.220e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.503e-01", "anc_acc": "5.218e-01", "epoch": 0.08263} {"step": 41320, "loss": 1.4549, "grad_norm": "5.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.548e+00", "anc_loss": "1.672e+00", "dlm_acc": "5.055e-01", "anc_acc": "4.753e-01", "epoch": 0.08264} {"step": 41325, "loss": 0.9632, "grad_norm": "6.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.096e-01", "anc_loss": "9.891e-01", "dlm_acc": "6.822e-01", "anc_acc": "6.523e-01", "epoch": 0.08265} {"step": 41330, "loss": 1.3258, "grad_norm": "3.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.676e-01", "anc_acc": "5.366e-01", "epoch": 0.08266} {"step": 41335, "loss": 1.0237, "grad_norm": "4.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.252e+00", "dlm_acc": "5.840e-01", "anc_acc": "5.564e-01", "epoch": 0.08267} {"step": 41340, "loss": 1.5518, "grad_norm": "3.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.634e+00", "anc_loss": "1.781e+00", "dlm_acc": "5.213e-01", "anc_acc": "4.897e-01", "epoch": 0.08268} {"step": 41345, "loss": 1.1096, "grad_norm": "3.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.153e+00", "dlm_acc": "6.442e-01", "anc_acc": "6.155e-01", "epoch": 0.08269} {"step": 41350, "loss": 1.1241, "grad_norm": "2.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.392e+00", "dlm_acc": "5.463e-01", "anc_acc": "5.144e-01", "epoch": 0.0827} {"step": 41355, "loss": 1.3102, "grad_norm": "3.908e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.471e+00", "anc_loss": "1.610e+00", "dlm_acc": "5.694e-01", "anc_acc": "5.398e-01", "epoch": 0.08271} {"step": 41360, "loss": 0.7998, "grad_norm": "1.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.406e-01", "anc_loss": "1.053e+00", "dlm_acc": "6.268e-01", "anc_acc": "5.930e-01", "epoch": 0.08272} {"step": 41365, "loss": 0.9385, "grad_norm": "2.816e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.309e-01", "anc_loss": "1.055e+00", "dlm_acc": "6.733e-01", "anc_acc": "6.387e-01", "epoch": 0.08273} {"step": 41370, "loss": 1.1391, "grad_norm": "3.067e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.300e+00", "anc_loss": "1.406e+00", "dlm_acc": "5.448e-01", "anc_acc": "5.212e-01", "epoch": 0.08274} {"step": 41375, "loss": 1.1471, "grad_norm": "3.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.618e-01", "anc_acc": "5.348e-01", "epoch": 0.08275} {"step": 41380, "loss": 1.3691, "grad_norm": "2.969e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.400e+00", "anc_loss": "1.525e+00", "dlm_acc": "5.639e-01", "anc_acc": "5.376e-01", "epoch": 0.08276} {"step": 41385, "loss": 1.6217, "grad_norm": "4.726e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.609e+00", "anc_loss": "1.736e+00", "dlm_acc": "5.199e-01", "anc_acc": "4.901e-01", "epoch": 0.08277} {"step": 41390, "loss": 1.3959, "grad_norm": "6.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.524e+00", "anc_loss": "1.659e+00", "dlm_acc": "5.422e-01", "anc_acc": "5.116e-01", "epoch": 0.08278} {"step": 41395, "loss": 1.1482, "grad_norm": "4.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.160e+00", "anc_loss": "1.276e+00", "dlm_acc": "5.903e-01", "anc_acc": "5.604e-01", "epoch": 0.08279} {"step": 41400, "loss": 2.0343, "grad_norm": "5.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.903e+00", "anc_loss": "2.048e+00", "dlm_acc": "4.780e-01", "anc_acc": "4.506e-01", "epoch": 0.0828} {"step": 41405, "loss": 0.9596, "grad_norm": "2.924e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.157e+00", "dlm_acc": "5.956e-01", "anc_acc": "5.682e-01", "epoch": 0.08281} {"step": 41410, "loss": 1.3547, "grad_norm": "3.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.867e-01", "anc_acc": "5.481e-01", "epoch": 0.08282} {"step": 41415, "loss": 1.3654, "grad_norm": "8.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.465e+00", "dlm_acc": "5.683e-01", "anc_acc": "5.414e-01", "epoch": 0.08283} {"step": 41420, "loss": 1.2006, "grad_norm": "4.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.428e+00", "anc_loss": "1.544e+00", "dlm_acc": "5.207e-01", "anc_acc": "4.948e-01", "epoch": 0.08284} {"step": 41425, "loss": 1.2336, "grad_norm": "2.898e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.300e+00", "dlm_acc": "5.824e-01", "anc_acc": "5.534e-01", "epoch": 0.08285} {"step": 41430, "loss": 1.3818, "grad_norm": "7.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.108e+00", "dlm_acc": "6.554e-01", "anc_acc": "6.316e-01", "epoch": 0.08286} {"step": 41435, "loss": 1.1527, "grad_norm": "3.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.917e-01", "anc_acc": "5.637e-01", "epoch": 0.08287} {"step": 41440, "loss": 1.301, "grad_norm": "2.752e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.442e+00", "anc_loss": "1.561e+00", "dlm_acc": "5.094e-01", "anc_acc": "4.815e-01", "epoch": 0.08288} {"step": 41445, "loss": 1.0961, "grad_norm": "2.452e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.148e-01", "anc_loss": "1.013e+00", "dlm_acc": "6.527e-01", "anc_acc": "6.212e-01", "epoch": 0.08289} {"step": 41450, "loss": 1.0977, "grad_norm": "4.984e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.217e+00", "dlm_acc": "5.770e-01", "anc_acc": "5.475e-01", "epoch": 0.0829} {"step": 41455, "loss": 1.3227, "grad_norm": "3.478e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.278e+00", "anc_loss": "1.434e+00", "dlm_acc": "6.114e-01", "anc_acc": "5.722e-01", "epoch": 0.08291} {"step": 41460, "loss": 1.2022, "grad_norm": "4.908e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.509e+00", "dlm_acc": "5.641e-01", "anc_acc": "5.347e-01", "epoch": 0.08292} {"step": 41465, "loss": 1.3866, "grad_norm": "4.381e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.568e+00", "anc_loss": "1.672e+00", "dlm_acc": "5.088e-01", "anc_acc": "4.855e-01", "epoch": 0.08293} {"step": 41470, "loss": 1.1194, "grad_norm": "1.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.461e-01", "anc_loss": "9.547e-01", "dlm_acc": "6.773e-01", "anc_acc": "6.459e-01", "epoch": 0.08294} {"step": 41475, "loss": 1.1785, "grad_norm": "3.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.660e-01", "anc_acc": "5.376e-01", "epoch": 0.08295} {"step": 41480, "loss": 1.1664, "grad_norm": "6.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.305e-01", "anc_acc": "5.011e-01", "epoch": 0.08296} {"step": 41485, "loss": 1.0084, "grad_norm": "3.968e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.321e+00", "dlm_acc": "4.458e-01", "anc_acc": "4.229e-01", "epoch": 0.08297} {"step": 41490, "loss": 1.0217, "grad_norm": "5.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.172e-01", "anc_loss": "9.219e-01", "dlm_acc": "3.165e-01", "anc_acc": "3.167e-01", "epoch": 0.08298} {"step": 41495, "loss": 1.1041, "grad_norm": "4.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.359e-01", "anc_loss": "9.406e-01", "dlm_acc": "3.143e-01", "anc_acc": "3.127e-01", "epoch": 0.08299} {"step": 41500, "loss": 1.0672, "grad_norm": "2.183e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.313e-01", "anc_loss": "8.586e-01", "dlm_acc": "3.923e-01", "anc_acc": "3.847e-01", "epoch": 0.083} {"step": 41505, "loss": 1.3284, "grad_norm": "3.134e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.832e-01", "anc_loss": "8.430e-01", "dlm_acc": "5.729e-01", "anc_acc": "5.558e-01", "epoch": 0.08301} {"step": 41510, "loss": 1.4679, "grad_norm": "3.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.230e+00", "dlm_acc": "5.685e-01", "anc_acc": "5.257e-01", "epoch": 0.08302} {"step": 41515, "loss": 0.6618, "grad_norm": "2.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.055e-01", "anc_loss": "1.032e+00", "dlm_acc": "6.374e-01", "anc_acc": "5.984e-01", "epoch": 0.08303} {"step": 41520, "loss": 1.0502, "grad_norm": "7.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.986e-01", "anc_loss": "1.091e+00", "dlm_acc": "6.616e-01", "anc_acc": "6.379e-01", "epoch": 0.08304} {"step": 41525, "loss": 0.9878, "grad_norm": "4.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.500e-02", "anc_loss": "6.423e-02", "dlm_acc": "9.793e-01", "anc_acc": "9.675e-01", "epoch": 0.08305} {"step": 41530, "loss": 1.1961, "grad_norm": "2.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.264e+00", "dlm_acc": "5.888e-01", "anc_acc": "5.573e-01", "epoch": 0.08306} {"step": 41535, "loss": 1.5163, "grad_norm": "1.438e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.149e+00", "anc_loss": "1.298e+00", "dlm_acc": "6.138e-01", "anc_acc": "5.744e-01", "epoch": 0.08307} {"step": 41540, "loss": 1.98, "grad_norm": "6.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.741e+00", "anc_loss": "2.819e+00", "dlm_acc": "5.840e-02", "anc_acc": "3.614e-02", "epoch": 0.08308} {"step": 41545, "loss": 1.8415, "grad_norm": "9.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.475e+00", "anc_loss": "2.570e+00", "dlm_acc": "1.760e-01", "anc_acc": "1.536e-01", "epoch": 0.08309} {"step": 41550, "loss": 1.1898, "grad_norm": "3.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.262e-01", "anc_acc": "5.006e-01", "epoch": 0.0831} {"step": 41555, "loss": 1.5127, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.567e+00", "dlm_acc": "5.440e-01", "anc_acc": "5.073e-01", "epoch": 0.08311} {"step": 41560, "loss": 1.3233, "grad_norm": "3.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.293e+00", "dlm_acc": "6.102e-01", "anc_acc": "5.643e-01", "epoch": 0.08312} {"step": 41565, "loss": 1.4328, "grad_norm": "3.158e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.574e+00", "dlm_acc": "5.678e-01", "anc_acc": "5.207e-01", "epoch": 0.08313} {"step": 41570, "loss": 1.4513, "grad_norm": "2.873e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.090e+00", "anc_loss": "1.215e+00", "dlm_acc": "6.113e-01", "anc_acc": "5.769e-01", "epoch": 0.08314} {"step": 41575, "loss": 1.7326, "grad_norm": "7.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.756e+00", "anc_loss": "1.898e+00", "dlm_acc": "4.770e-01", "anc_acc": "4.414e-01", "epoch": 0.08315} {"step": 41580, "loss": 1.2794, "grad_norm": "3.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.477e+00", "anc_loss": "1.622e+00", "dlm_acc": "4.088e-01", "anc_acc": "3.624e-01", "epoch": 0.08316} {"step": 41585, "loss": 1.281, "grad_norm": "3.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.047e-01", "anc_loss": "9.187e-01", "dlm_acc": "5.139e-01", "anc_acc": "4.757e-01", "epoch": 0.08317} {"step": 41590, "loss": 1.7828, "grad_norm": "4.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.473e+00", "anc_loss": "1.658e+00", "dlm_acc": "5.579e-01", "anc_acc": "5.075e-01", "epoch": 0.08318} {"step": 41595, "loss": 1.5975, "grad_norm": "6.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e+00", "anc_loss": "1.741e+00", "dlm_acc": "4.589e-01", "anc_acc": "4.320e-01", "epoch": 0.08319} {"step": 41600, "loss": 1.5634, "grad_norm": "1.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.203e-01", "anc_loss": "1.038e+00", "dlm_acc": "6.694e-01", "anc_acc": "6.396e-01", "epoch": 0.0832} {"step": 41605, "loss": 1.0656, "grad_norm": "2.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.340e-01", "anc_loss": "8.902e-01", "dlm_acc": "7.207e-01", "anc_acc": "6.670e-01", "epoch": 0.08321} {"step": 41610, "loss": 1.0832, "grad_norm": "2.856e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.168e-01", "anc_loss": "9.160e-01", "dlm_acc": "6.805e-01", "anc_acc": "6.559e-01", "epoch": 0.08322} {"step": 41615, "loss": 0.8705, "grad_norm": "4.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.746e-01", "anc_loss": "8.754e-01", "dlm_acc": "6.642e-01", "anc_acc": "6.282e-01", "epoch": 0.08323} {"step": 41620, "loss": 1.2663, "grad_norm": "2.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.278e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.346e-01", "epoch": 0.08324} {"step": 41625, "loss": 1.4967, "grad_norm": "3.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.492e+00", "anc_loss": "1.617e+00", "dlm_acc": "4.851e-01", "anc_acc": "4.531e-01", "epoch": 0.08325} {"step": 41630, "loss": 1.2045, "grad_norm": "3.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.999e+00", "anc_loss": "2.004e+00", "dlm_acc": "9.761e-02", "anc_acc": "9.697e-02", "epoch": 0.08326} {"step": 41635, "loss": 1.6697, "grad_norm": "3.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.795e+00", "anc_loss": "1.905e+00", "dlm_acc": "4.107e-01", "anc_acc": "3.837e-01", "epoch": 0.08327} {"step": 41640, "loss": 1.5365, "grad_norm": "7.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.792e+00", "anc_loss": "1.965e+00", "dlm_acc": "3.902e-01", "anc_acc": "3.448e-01", "epoch": 0.08328} {"step": 41645, "loss": 1.3319, "grad_norm": "3.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.399e+00", "anc_loss": "1.602e+00", "dlm_acc": "5.241e-01", "anc_acc": "4.731e-01", "epoch": 0.08329} {"step": 41650, "loss": 1.2072, "grad_norm": "2.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.636e-01", "anc_acc": "5.183e-01", "epoch": 0.0833} {"step": 41655, "loss": 1.2354, "grad_norm": "2.139e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.246e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.191e-01", "epoch": 0.08331} {"step": 41660, "loss": 1.3135, "grad_norm": "3.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.452e+00", "dlm_acc": "5.179e-01", "anc_acc": "4.799e-01", "epoch": 0.08332} {"step": 41665, "loss": 1.3285, "grad_norm": "3.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.457e-01", "anc_loss": "9.789e-01", "dlm_acc": "6.721e-01", "anc_acc": "6.291e-01", "epoch": 0.08333} {"step": 41670, "loss": 1.5607, "grad_norm": "2.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.360e+00", "dlm_acc": "5.988e-01", "anc_acc": "5.487e-01", "epoch": 0.08334} {"step": 41675, "loss": 1.3412, "grad_norm": "2.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.156e+00", "dlm_acc": "6.147e-01", "anc_acc": "5.832e-01", "epoch": 0.08335} {"step": 41680, "loss": 1.5487, "grad_norm": "3.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.240e+00", "dlm_acc": "6.242e-01", "anc_acc": "5.872e-01", "epoch": 0.08336} {"step": 41685, "loss": 1.3424, "grad_norm": "2.634e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.225e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.591e-01", "anc_acc": "5.270e-01", "epoch": 0.08337} {"step": 41690, "loss": 0.9211, "grad_norm": "3.602e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.189e+00", "dlm_acc": "5.962e-01", "anc_acc": "5.674e-01", "epoch": 0.08338} {"step": 41695, "loss": 1.0363, "grad_norm": "3.547e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.331e+00", "anc_loss": "1.452e+00", "dlm_acc": "5.636e-01", "anc_acc": "5.373e-01", "epoch": 0.08339} {"step": 41700, "loss": 0.9963, "grad_norm": "8.926e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.895e-01", "anc_loss": "1.004e+00", "dlm_acc": "6.741e-01", "anc_acc": "6.421e-01", "epoch": 0.0834} {"step": 41705, "loss": 1.033, "grad_norm": "4.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.066e-01", "anc_loss": "3.309e-01", "dlm_acc": "8.004e-01", "anc_acc": "7.900e-01", "epoch": 0.08341} {"step": 41710, "loss": 1.0354, "grad_norm": "2.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.313e-01", "anc_loss": "9.172e-01", "dlm_acc": "6.676e-01", "anc_acc": "6.423e-01", "epoch": 0.08342} {"step": 41715, "loss": 0.9004, "grad_norm": "2.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.354e-01", "anc_loss": "1.043e+00", "dlm_acc": "6.348e-01", "anc_acc": "6.084e-01", "epoch": 0.08343} {"step": 41720, "loss": 1.0843, "grad_norm": "2.718e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.213e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.619e-01", "anc_acc": "5.316e-01", "epoch": 0.08344} {"step": 41725, "loss": 1.2744, "grad_norm": "5.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.375e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.374e-01", "anc_acc": "5.086e-01", "epoch": 0.08345} {"step": 41730, "loss": 1.2727, "grad_norm": "3.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.227e+00", "anc_loss": "1.335e+00", "dlm_acc": "5.573e-01", "anc_acc": "5.292e-01", "epoch": 0.08346} {"step": 41735, "loss": 1.4238, "grad_norm": "5.028e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.651e+00", "dlm_acc": "5.322e-01", "anc_acc": "4.968e-01", "epoch": 0.08347} {"step": 41740, "loss": 1.0532, "grad_norm": "2.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.416e-01", "anc_acc": "6.153e-01", "epoch": 0.08348} {"step": 41745, "loss": 1.6141, "grad_norm": "3.034e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.791e+00", "anc_loss": "1.929e+00", "dlm_acc": "4.842e-01", "anc_acc": "4.580e-01", "epoch": 0.08349} {"step": 41750, "loss": 1.3791, "grad_norm": "4.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.509e+00", "dlm_acc": "5.938e-01", "anc_acc": "5.673e-01", "epoch": 0.0835} {"step": 41755, "loss": 1.0821, "grad_norm": "2.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.563e-01", "anc_loss": "1.020e+00", "dlm_acc": "5.510e-01", "anc_acc": "5.364e-01", "epoch": 0.08351} {"step": 41760, "loss": 1.1433, "grad_norm": "2.904e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.719e-01", "anc_loss": "6.805e-01", "dlm_acc": "5.818e-01", "anc_acc": "5.772e-01", "epoch": 0.08352} {"step": 41765, "loss": 1.307, "grad_norm": "6.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.537e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.295e-01", "anc_acc": "5.100e-01", "epoch": 0.08353} {"step": 41770, "loss": 1.6455, "grad_norm": "4.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.437e+00", "dlm_acc": "5.239e-01", "anc_acc": "4.990e-01", "epoch": 0.08354} {"step": 41775, "loss": 1.3404, "grad_norm": "2.662e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.854e-01", "anc_loss": "9.688e-01", "dlm_acc": "6.456e-01", "anc_acc": "6.199e-01", "epoch": 0.08355} {"step": 41780, "loss": 1.0687, "grad_norm": "3.436e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.611e-01", "anc_loss": "4.879e-01", "dlm_acc": "7.123e-01", "anc_acc": "6.963e-01", "epoch": 0.08356} {"step": 41785, "loss": 0.9897, "grad_norm": "3.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.438e-01", "anc_loss": "6.469e-01", "dlm_acc": "5.839e-01", "anc_acc": "5.820e-01", "epoch": 0.08357} {"step": 41790, "loss": 1.1385, "grad_norm": "1.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.133e-01", "anc_loss": "9.715e-01", "dlm_acc": "5.184e-01", "anc_acc": "4.992e-01", "epoch": 0.08358} {"step": 41795, "loss": 1.041, "grad_norm": "4.773e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.840e-01", "anc_loss": "7.352e-01", "dlm_acc": "6.059e-01", "anc_acc": "5.916e-01", "epoch": 0.08359} {"step": 41800, "loss": 0.9436, "grad_norm": "5.957e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.996e-01", "anc_loss": "8.973e-01", "dlm_acc": "6.477e-01", "anc_acc": "6.165e-01", "epoch": 0.0836} {"step": 41805, "loss": 1.6521, "grad_norm": "4.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.562e+00", "dlm_acc": "5.258e-01", "anc_acc": "4.964e-01", "epoch": 0.08361} {"step": 41810, "loss": 1.1286, "grad_norm": "3.458e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.219e-01", "anc_loss": "7.746e-01", "dlm_acc": "6.192e-01", "anc_acc": "6.013e-01", "epoch": 0.08362} {"step": 41815, "loss": 1.0349, "grad_norm": "5.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.645e-01", "anc_loss": "5.969e-01", "dlm_acc": "5.831e-01", "anc_acc": "5.630e-01", "epoch": 0.08363} {"step": 41820, "loss": 1.29, "grad_norm": "3.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.345e+00", "dlm_acc": "4.820e-01", "anc_acc": "4.626e-01", "epoch": 0.08364} {"step": 41825, "loss": 0.9757, "grad_norm": "2.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.742e-01", "anc_loss": "8.117e-01", "dlm_acc": "4.838e-01", "anc_acc": "4.672e-01", "epoch": 0.08365} {"step": 41830, "loss": 1.1965, "grad_norm": "2.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.621e-01", "anc_acc": "5.309e-01", "epoch": 0.08366} {"step": 41835, "loss": 1.5557, "grad_norm": "2.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.703e-01", "anc_loss": "1.043e+00", "dlm_acc": "6.107e-01", "anc_acc": "5.896e-01", "epoch": 0.08367} {"step": 41840, "loss": 0.9496, "grad_norm": "2.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.813e-01", "anc_loss": "6.129e-01", "dlm_acc": "5.784e-01", "anc_acc": "5.641e-01", "epoch": 0.08368} {"step": 41845, "loss": 1.1134, "grad_norm": "3.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.477e-01", "anc_loss": "1.047e+00", "dlm_acc": "6.004e-01", "anc_acc": "5.741e-01", "epoch": 0.08369} {"step": 41850, "loss": 1.3127, "grad_norm": "2.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.085e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.735e-01", "anc_acc": "5.302e-01", "epoch": 0.0837} {"step": 41855, "loss": 1.2155, "grad_norm": "3.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.920e-01", "anc_acc": "5.653e-01", "epoch": 0.08371} {"step": 41860, "loss": 1.1246, "grad_norm": "5.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.369e+00", "dlm_acc": "5.166e-01", "anc_acc": "4.931e-01", "epoch": 0.08372} {"step": 41865, "loss": 1.0266, "grad_norm": "2.620e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.162e-01", "anc_loss": "9.055e-01", "dlm_acc": "6.603e-01", "anc_acc": "6.358e-01", "epoch": 0.08373} {"step": 41870, "loss": 1.1337, "grad_norm": "4.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.444e+00", "anc_loss": "1.558e+00", "dlm_acc": "4.822e-01", "anc_acc": "4.558e-01", "epoch": 0.08374} {"step": 41875, "loss": 0.9818, "grad_norm": "6.754e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.410e-01", "anc_loss": "9.414e-01", "dlm_acc": "6.541e-01", "anc_acc": "6.241e-01", "epoch": 0.08375} {"step": 41880, "loss": 0.9087, "grad_norm": "7.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.836e-01", "anc_loss": "9.992e-01", "dlm_acc": "6.575e-01", "anc_acc": "6.256e-01", "epoch": 0.08376} {"step": 41885, "loss": 0.9174, "grad_norm": "3.970e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.836e-01", "anc_loss": "5.715e-01", "dlm_acc": "7.557e-01", "anc_acc": "7.242e-01", "epoch": 0.08377} {"step": 41890, "loss": 1.0428, "grad_norm": "2.884e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.097e+00", "dlm_acc": "6.234e-01", "anc_acc": "6.049e-01", "epoch": 0.08378} {"step": 41895, "loss": 1.0946, "grad_norm": "2.438e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.574e-01", "anc_loss": "9.217e-01", "dlm_acc": "6.222e-01", "anc_acc": "5.994e-01", "epoch": 0.08379} {"step": 41900, "loss": 1.1623, "grad_norm": "3.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.887e-01", "anc_loss": "7.617e-01", "dlm_acc": "7.651e-01", "anc_acc": "7.091e-01", "epoch": 0.0838} {"step": 41905, "loss": 0.8147, "grad_norm": "4.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.313e-01", "anc_loss": "9.781e-01", "dlm_acc": "4.786e-01", "anc_acc": "4.622e-01", "epoch": 0.08381} {"step": 41910, "loss": 0.9185, "grad_norm": "2.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.184e-01", "anc_loss": "5.961e-01", "dlm_acc": "7.127e-01", "anc_acc": "6.791e-01", "epoch": 0.08382} {"step": 41915, "loss": 1.2028, "grad_norm": "4.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.551e+00", "dlm_acc": "5.538e-01", "anc_acc": "5.209e-01", "epoch": 0.08383} {"step": 41920, "loss": 1.0557, "grad_norm": "2.617e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.115e+00", "anc_loss": "1.215e+00", "dlm_acc": "5.722e-01", "anc_acc": "5.482e-01", "epoch": 0.08384} {"step": 41925, "loss": 0.7887, "grad_norm": "4.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.026e-01", "anc_loss": "4.815e-01", "dlm_acc": "8.339e-01", "anc_acc": "7.977e-01", "epoch": 0.08385} {"step": 41930, "loss": 1.3285, "grad_norm": "3.545e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.478e+00", "dlm_acc": "5.445e-01", "anc_acc": "5.117e-01", "epoch": 0.08386} {"step": 41935, "loss": 1.0954, "grad_norm": "4.367e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.313e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.478e-01", "anc_acc": "6.108e-01", "epoch": 0.08387} {"step": 41940, "loss": 1.0947, "grad_norm": "4.239e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.898e-01", "anc_loss": "6.863e-01", "dlm_acc": "6.978e-01", "anc_acc": "6.632e-01", "epoch": 0.08388} {"step": 41945, "loss": 1.3206, "grad_norm": "5.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.852e-01", "anc_acc": "5.435e-01", "epoch": 0.08389} {"step": 41950, "loss": 1.5898, "grad_norm": "5.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.300e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.399e-01", "anc_acc": "5.095e-01", "epoch": 0.0839} {"step": 41955, "loss": 0.9887, "grad_norm": "3.392e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.171e+00", "anc_loss": "1.300e+00", "dlm_acc": "5.548e-01", "anc_acc": "5.152e-01", "epoch": 0.08391} {"step": 41960, "loss": 1.2449, "grad_norm": "1.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.720e+00", "anc_loss": "1.811e+00", "dlm_acc": "3.927e-01", "anc_acc": "3.739e-01", "epoch": 0.08392} {"step": 41965, "loss": 1.0818, "grad_norm": "1.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.409e+00", "anc_loss": "1.507e+00", "dlm_acc": "5.219e-01", "anc_acc": "4.951e-01", "epoch": 0.08393} {"step": 41970, "loss": 1.5419, "grad_norm": "2.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.720e+00", "dlm_acc": "5.258e-01", "anc_acc": "4.762e-01", "epoch": 0.08394} {"step": 41975, "loss": 1.1237, "grad_norm": "4.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.875e-01", "anc_loss": "5.617e-01", "dlm_acc": "7.535e-01", "anc_acc": "7.330e-01", "epoch": 0.08395} {"step": 41980, "loss": 1.2686, "grad_norm": "2.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.430e-01", "anc_loss": "9.570e-01", "dlm_acc": "6.537e-01", "anc_acc": "6.256e-01", "epoch": 0.08396} {"step": 41985, "loss": 1.2048, "grad_norm": "3.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.043e-01", "anc_loss": "1.037e+00", "dlm_acc": "6.184e-01", "anc_acc": "5.672e-01", "epoch": 0.08397} {"step": 41990, "loss": 1.4983, "grad_norm": "4.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.341e+00", "dlm_acc": "5.422e-01", "anc_acc": "4.788e-01", "epoch": 0.08398} {"step": 41995, "loss": 1.3382, "grad_norm": "3.479e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.691e+00", "anc_loss": "1.769e+00", "dlm_acc": "3.530e-01", "anc_acc": "3.315e-01", "epoch": 0.08399} {"step": 42000, "loss": 0.944, "grad_norm": "6.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.130e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.455e-01", "anc_acc": "5.236e-01", "epoch": 0.084} {"step": 42005, "loss": 1.1648, "grad_norm": "3.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.538e-01", "anc_acc": "5.221e-01", "epoch": 0.08401} {"step": 42010, "loss": 1.5031, "grad_norm": "5.473e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.220e+00", "dlm_acc": "5.865e-01", "anc_acc": "5.572e-01", "epoch": 0.08402} {"step": 42015, "loss": 1.7079, "grad_norm": "2.091e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.639e+00", "anc_loss": "1.766e+00", "dlm_acc": "4.293e-01", "anc_acc": "4.010e-01", "epoch": 0.08403} {"step": 42020, "loss": 1.5034, "grad_norm": "4.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.366e+00", "anc_loss": "1.477e+00", "dlm_acc": "4.684e-01", "anc_acc": "4.412e-01", "epoch": 0.08404} {"step": 42025, "loss": 1.4434, "grad_norm": "3.427e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.162e+00", "dlm_acc": "5.875e-01", "anc_acc": "5.465e-01", "epoch": 0.08405} {"step": 42030, "loss": 1.1933, "grad_norm": "3.418e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.191e+00", "dlm_acc": "5.368e-01", "anc_acc": "4.957e-01", "epoch": 0.08406} {"step": 42035, "loss": 1.2593, "grad_norm": "3.895e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.841e-01", "anc_acc": "5.446e-01", "epoch": 0.08407} {"step": 42040, "loss": 1.4489, "grad_norm": "3.400e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.051e-01", "anc_acc": "4.711e-01", "epoch": 0.08408} {"step": 42045, "loss": 1.0751, "grad_norm": "3.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.047e-01", "anc_acc": "4.685e-01", "epoch": 0.08409} {"step": 42050, "loss": 1.1424, "grad_norm": "1.172e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.397e+00", "anc_loss": "1.534e+00", "dlm_acc": "4.940e-01", "anc_acc": "4.629e-01", "epoch": 0.0841} {"step": 42055, "loss": 0.9067, "grad_norm": "5.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.065e-01", "anc_acc": "4.788e-01", "epoch": 0.08411} {"step": 42060, "loss": 0.652, "grad_norm": "3.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.305e-01", "anc_loss": "8.285e-01", "dlm_acc": "7.096e-01", "anc_acc": "6.799e-01", "epoch": 0.08412} {"step": 42065, "loss": 0.8411, "grad_norm": "1.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.680e-01", "anc_loss": "9.508e-01", "dlm_acc": "5.759e-01", "anc_acc": "5.517e-01", "epoch": 0.08413} {"step": 42070, "loss": 1.0595, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.026e+00", "anc_loss": "1.185e+00", "dlm_acc": "6.011e-01", "anc_acc": "5.575e-01", "epoch": 0.08414} {"step": 42075, "loss": 0.88, "grad_norm": "2.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.028e+00", "anc_loss": "1.129e+00", "dlm_acc": "6.352e-01", "anc_acc": "6.063e-01", "epoch": 0.08415} {"step": 42080, "loss": 0.78, "grad_norm": "3.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.250e-01", "anc_loss": "7.031e-01", "dlm_acc": "6.836e-01", "anc_acc": "6.534e-01", "epoch": 0.08416} {"step": 42085, "loss": 1.3132, "grad_norm": "3.636e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.219e-01", "anc_loss": "5.574e-01", "dlm_acc": "6.722e-01", "anc_acc": "6.561e-01", "epoch": 0.08417} {"step": 42090, "loss": 0.7964, "grad_norm": "2.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.699e-01", "anc_loss": "3.947e-01", "dlm_acc": "6.984e-01", "anc_acc": "6.857e-01", "epoch": 0.08418} {"step": 42095, "loss": 1.0191, "grad_norm": "2.957e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.348e-01", "anc_loss": "4.527e-01", "dlm_acc": "6.911e-01", "anc_acc": "6.809e-01", "epoch": 0.08419} {"step": 42100, "loss": 1.2398, "grad_norm": "7.067e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.789e-01", "anc_loss": "9.797e-01", "dlm_acc": "5.704e-01", "anc_acc": "5.354e-01", "epoch": 0.0842} {"step": 42105, "loss": 1.1622, "grad_norm": "5.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.313e+00", "anc_loss": "1.413e+00", "dlm_acc": "4.306e-01", "anc_acc": "4.015e-01", "epoch": 0.08421} {"step": 42110, "loss": 0.9767, "grad_norm": "2.103e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.164e+00", "dlm_acc": "4.889e-01", "anc_acc": "4.468e-01", "epoch": 0.08422} {"step": 42115, "loss": 1.5545, "grad_norm": "2.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.181e+00", "anc_loss": "1.311e+00", "dlm_acc": "5.626e-01", "anc_acc": "5.190e-01", "epoch": 0.08423} {"step": 42120, "loss": 1.1412, "grad_norm": "4.569e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.327e+00", "dlm_acc": "5.638e-01", "anc_acc": "4.965e-01", "epoch": 0.08424} {"step": 42125, "loss": 1.0091, "grad_norm": "5.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.367e-01", "anc_loss": "1.020e+00", "dlm_acc": "6.342e-01", "anc_acc": "5.690e-01", "epoch": 0.08425} {"step": 42130, "loss": 0.8948, "grad_norm": "2.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.223e-01", "anc_loss": "1.044e+00", "dlm_acc": "6.174e-01", "anc_acc": "5.794e-01", "epoch": 0.08426} {"step": 42135, "loss": 1.3089, "grad_norm": "2.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.094e+00", "anc_loss": "1.177e+00", "dlm_acc": "6.395e-01", "anc_acc": "6.257e-01", "epoch": 0.08427} {"step": 42140, "loss": 1.2752, "grad_norm": "4.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.477e-01", "anc_loss": "9.313e-01", "dlm_acc": "7.697e-01", "anc_acc": "7.590e-01", "epoch": 0.08428} {"step": 42145, "loss": 1.1528, "grad_norm": "3.537e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.229e+00", "anc_loss": "1.340e+00", "dlm_acc": "5.471e-01", "anc_acc": "5.186e-01", "epoch": 0.08429} {"step": 42150, "loss": 1.4612, "grad_norm": "4.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.898e-01", "anc_acc": "5.461e-01", "epoch": 0.0843} {"step": 42155, "loss": 1.2903, "grad_norm": "3.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.362e+00", "dlm_acc": "5.741e-01", "anc_acc": "5.244e-01", "epoch": 0.08431} {"step": 42160, "loss": 1.4408, "grad_norm": "5.330e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.416e+00", "anc_loss": "1.574e+00", "dlm_acc": "5.727e-01", "anc_acc": "5.359e-01", "epoch": 0.08432} {"step": 42165, "loss": 1.2086, "grad_norm": "2.410e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.570e-01", "anc_loss": "6.641e-01", "dlm_acc": "5.993e-01", "anc_acc": "5.964e-01", "epoch": 0.08433} {"step": 42170, "loss": 1.005, "grad_norm": "2.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.203e-01", "anc_loss": "5.242e-01", "dlm_acc": "6.472e-01", "anc_acc": "6.466e-01", "epoch": 0.08434} {"step": 42175, "loss": 0.7773, "grad_norm": "2.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.570e-01", "anc_loss": "4.602e-01", "dlm_acc": "6.502e-01", "anc_acc": "6.506e-01", "epoch": 0.08435} {"step": 42180, "loss": 1.0626, "grad_norm": "1.869e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.895e-01", "anc_loss": "9.982e-01", "dlm_acc": "6.837e-01", "anc_acc": "6.563e-01", "epoch": 0.08436} {"step": 42185, "loss": 1.0391, "grad_norm": "3.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.188e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.660e-01", "epoch": 0.08437} {"step": 42190, "loss": 0.9857, "grad_norm": "4.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.150e-02", "anc_loss": "3.043e-02", "dlm_acc": "9.868e-01", "anc_acc": "9.833e-01", "epoch": 0.08438} {"step": 42195, "loss": 0.9438, "grad_norm": "3.137e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.138e-03", "anc_loss": "5.088e-03", "dlm_acc": "9.987e-01", "anc_acc": "9.970e-01", "epoch": 0.08439} {"step": 42200, "loss": 0.7063, "grad_norm": "2.671e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.885e-01", "anc_loss": "3.092e-01", "dlm_acc": "8.441e-01", "anc_acc": "8.378e-01", "epoch": 0.0844} {"step": 42205, "loss": 0.8915, "grad_norm": "2.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.363e-01", "anc_loss": "2.604e-01", "dlm_acc": "9.086e-01", "anc_acc": "9.022e-01", "epoch": 0.08441} {"step": 42210, "loss": 0.8929, "grad_norm": "2.518e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.024e-01", "anc_loss": "6.392e-01", "dlm_acc": "7.126e-01", "anc_acc": "7.010e-01", "epoch": 0.08442} {"step": 42215, "loss": 1.1031, "grad_norm": "8.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.726e-01", "anc_loss": "1.055e+00", "dlm_acc": "6.306e-01", "anc_acc": "6.089e-01", "epoch": 0.08443} {"step": 42220, "loss": 1.4031, "grad_norm": "3.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.555e-01", "anc_loss": "9.266e-01", "dlm_acc": "6.300e-01", "anc_acc": "6.092e-01", "epoch": 0.08444} {"step": 42225, "loss": 1.3827, "grad_norm": "4.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.160e+00", "dlm_acc": "6.564e-01", "anc_acc": "6.230e-01", "epoch": 0.08445} {"step": 42230, "loss": 1.25, "grad_norm": "3.461e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.883e-01", "anc_loss": "6.914e-01", "dlm_acc": "7.494e-01", "anc_acc": "7.163e-01", "epoch": 0.08446} {"step": 42235, "loss": 0.8936, "grad_norm": "2.429e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.896e-01", "anc_loss": "3.152e-01", "dlm_acc": "8.264e-01", "anc_acc": "8.140e-01", "epoch": 0.08447} {"step": 42240, "loss": 1.0579, "grad_norm": "1.896e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.211e-01", "anc_loss": "4.576e-01", "dlm_acc": "7.822e-01", "anc_acc": "7.693e-01", "epoch": 0.08448} {"step": 42245, "loss": 1.2774, "grad_norm": "2.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.508e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.974e-01", "anc_acc": "6.672e-01", "epoch": 0.08449} {"step": 42250, "loss": 0.985, "grad_norm": "3.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.330e-01", "anc_loss": "3.922e-01", "dlm_acc": "8.360e-01", "anc_acc": "8.205e-01", "epoch": 0.0845} {"step": 42255, "loss": 1.3987, "grad_norm": "6.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.465e+00", "dlm_acc": "5.139e-01", "anc_acc": "4.841e-01", "epoch": 0.08451} {"step": 42260, "loss": 1.1146, "grad_norm": "2.156e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.180e-01", "anc_loss": "9.766e-01", "dlm_acc": "5.747e-01", "anc_acc": "5.598e-01", "epoch": 0.08452} {"step": 42265, "loss": 1.388, "grad_norm": "3.119e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.371e-01", "anc_loss": "6.328e-01", "dlm_acc": "6.127e-01", "anc_acc": "6.117e-01", "epoch": 0.08453} {"step": 42270, "loss": 1.6843, "grad_norm": "1.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.117e-01", "anc_loss": "7.195e-01", "dlm_acc": "5.881e-01", "anc_acc": "5.864e-01", "epoch": 0.08454} {"step": 42275, "loss": 1.3288, "grad_norm": "4.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.055e-01", "anc_loss": "6.395e-01", "dlm_acc": "6.730e-01", "anc_acc": "6.644e-01", "epoch": 0.08455} {"step": 42280, "loss": 1.1776, "grad_norm": "2.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "9.336e-01", "dlm_acc": "2.785e-01", "anc_acc": "2.762e-01", "epoch": 0.08456} {"step": 42285, "loss": 1.335, "grad_norm": "4.800e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.492e-01", "anc_loss": "9.563e-01", "dlm_acc": "2.670e-01", "anc_acc": "2.650e-01", "epoch": 0.08457} {"step": 42290, "loss": 1.0259, "grad_norm": "2.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.487e-01", "anc_loss": "8.066e-01", "dlm_acc": "5.707e-01", "anc_acc": "5.541e-01", "epoch": 0.08458} {"step": 42295, "loss": 1.0997, "grad_norm": "2.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.160e-01", "anc_loss": "6.783e-01", "dlm_acc": "7.146e-01", "anc_acc": "6.974e-01", "epoch": 0.08459} {"step": 42300, "loss": 1.2052, "grad_norm": "1.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.668e-01", "anc_loss": "9.539e-01", "dlm_acc": "6.759e-01", "anc_acc": "6.530e-01", "epoch": 0.0846} {"step": 42305, "loss": 1.0641, "grad_norm": "2.803e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.043e-01", "anc_loss": "7.734e-01", "dlm_acc": "7.049e-01", "anc_acc": "6.796e-01", "epoch": 0.08461} {"step": 42310, "loss": 1.3414, "grad_norm": "2.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.879e-01", "anc_loss": "8.961e-01", "dlm_acc": "7.243e-01", "anc_acc": "6.976e-01", "epoch": 0.08462} {"step": 42315, "loss": 1.1488, "grad_norm": "2.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.540e-01", "anc_acc": "5.297e-01", "epoch": 0.08463} {"step": 42320, "loss": 1.3149, "grad_norm": "3.014e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.529e+00", "anc_loss": "1.648e+00", "dlm_acc": "5.207e-01", "anc_acc": "4.912e-01", "epoch": 0.08464} {"step": 42325, "loss": 1.3809, "grad_norm": "6.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.261e+00", "dlm_acc": "6.588e-01", "anc_acc": "6.348e-01", "epoch": 0.08465} {"step": 42330, "loss": 1.1978, "grad_norm": "2.804e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.651e-01", "anc_loss": "7.200e-01", "dlm_acc": "7.641e-01", "anc_acc": "7.506e-01", "epoch": 0.08466} {"step": 42335, "loss": 0.9733, "grad_norm": "2.678e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.254e-01", "anc_loss": "4.912e-01", "dlm_acc": "7.989e-01", "anc_acc": "7.756e-01", "epoch": 0.08467} {"step": 42340, "loss": 1.2866, "grad_norm": "3.506e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.815e-01", "anc_loss": "8.384e-01", "dlm_acc": "7.350e-01", "anc_acc": "7.176e-01", "epoch": 0.08468} {"step": 42345, "loss": 1.2452, "grad_norm": "5.128e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.201e-01", "anc_loss": "7.395e-01", "dlm_acc": "5.355e-01", "anc_acc": "5.258e-01", "epoch": 0.08469} {"step": 42350, "loss": 1.2099, "grad_norm": "8.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.625e-01", "anc_loss": "7.820e-01", "dlm_acc": "4.578e-01", "anc_acc": "4.458e-01", "epoch": 0.0847} {"step": 42355, "loss": 0.8869, "grad_norm": "3.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.336e-01", "anc_loss": "6.523e-01", "dlm_acc": "5.072e-01", "anc_acc": "4.985e-01", "epoch": 0.08471} {"step": 42360, "loss": 0.9014, "grad_norm": "2.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.000e-01", "anc_loss": "7.211e-01", "dlm_acc": "5.070e-01", "anc_acc": "5.011e-01", "epoch": 0.08472} {"step": 42365, "loss": 0.9478, "grad_norm": "4.106e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.879e-01", "anc_loss": "7.094e-01", "dlm_acc": "5.044e-01", "anc_acc": "4.938e-01", "epoch": 0.08473} {"step": 42370, "loss": 1.2904, "grad_norm": "2.587e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.717e-01", "anc_loss": "7.048e-01", "dlm_acc": "5.968e-01", "anc_acc": "5.856e-01", "epoch": 0.08474} {"step": 42375, "loss": 1.0591, "grad_norm": "6.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.259e-01", "anc_loss": "6.979e-01", "dlm_acc": "7.701e-01", "anc_acc": "7.542e-01", "epoch": 0.08475} {"step": 42380, "loss": 0.9763, "grad_norm": "2.580e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.125e-01", "anc_loss": "6.820e-01", "dlm_acc": "7.744e-01", "anc_acc": "7.637e-01", "epoch": 0.08476} {"step": 42385, "loss": 1.2105, "grad_norm": "5.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.165e+00", "anc_loss": "1.277e+00", "dlm_acc": "6.009e-01", "anc_acc": "5.736e-01", "epoch": 0.08477} {"step": 42390, "loss": 0.9401, "grad_norm": "2.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.932e-01", "anc_loss": "4.493e-01", "dlm_acc": "8.384e-01", "anc_acc": "8.129e-01", "epoch": 0.08478} {"step": 42395, "loss": 1.3673, "grad_norm": "9.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.256e+00", "dlm_acc": "5.948e-01", "anc_acc": "5.672e-01", "epoch": 0.08479} {"step": 42400, "loss": 1.1834, "grad_norm": "9.082e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.441e-01", "anc_loss": "4.673e-01", "dlm_acc": "6.782e-01", "anc_acc": "6.686e-01", "epoch": 0.0848} {"step": 42405, "loss": 1.2872, "grad_norm": "3.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.437e+00", "dlm_acc": "5.576e-01", "anc_acc": "5.292e-01", "epoch": 0.08481} {"step": 42410, "loss": 1.1434, "grad_norm": "2.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.591e-01", "anc_loss": "7.255e-01", "dlm_acc": "7.387e-01", "anc_acc": "7.154e-01", "epoch": 0.08482} {"step": 42415, "loss": 1.2525, "grad_norm": "4.729e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.532e-01", "anc_acc": "6.298e-01", "epoch": 0.08483} {"step": 42420, "loss": 0.887, "grad_norm": "2.059e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.330e-01", "anc_loss": "8.947e-01", "dlm_acc": "6.517e-01", "anc_acc": "6.302e-01", "epoch": 0.08484} {"step": 42425, "loss": 0.862, "grad_norm": "5.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.023e-01", "anc_loss": "6.832e-01", "dlm_acc": "6.815e-01", "anc_acc": "6.507e-01", "epoch": 0.08485} {"step": 42430, "loss": 1.0777, "grad_norm": "5.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.862e-01", "anc_loss": "8.528e-01", "dlm_acc": "7.355e-01", "anc_acc": "7.164e-01", "epoch": 0.08486} {"step": 42435, "loss": 1.1346, "grad_norm": "3.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.244e+00", "dlm_acc": "5.742e-01", "anc_acc": "5.573e-01", "epoch": 0.08487} {"step": 42440, "loss": 0.8, "grad_norm": "2.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.654e-01", "anc_loss": "2.891e-01", "dlm_acc": "8.256e-01", "anc_acc": "8.145e-01", "epoch": 0.08488} {"step": 42445, "loss": 0.7948, "grad_norm": "4.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.855e-01", "anc_loss": "3.178e-01", "dlm_acc": "8.186e-01", "anc_acc": "8.048e-01", "epoch": 0.08489} {"step": 42450, "loss": 0.9175, "grad_norm": "4.033e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.338e-01", "anc_loss": "3.801e-01", "dlm_acc": "7.961e-01", "anc_acc": "7.811e-01", "epoch": 0.0849} {"step": 42455, "loss": 1.0682, "grad_norm": "3.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.574e-01", "anc_loss": "5.186e-01", "dlm_acc": "7.434e-01", "anc_acc": "7.168e-01", "epoch": 0.08491} {"step": 42460, "loss": 0.9319, "grad_norm": "4.795e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.777e-01", "anc_loss": "4.250e-01", "dlm_acc": "7.476e-01", "anc_acc": "7.286e-01", "epoch": 0.08492} {"step": 42465, "loss": 0.7327, "grad_norm": "2.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.973e-01", "anc_loss": "6.625e-01", "dlm_acc": "6.869e-01", "anc_acc": "6.598e-01", "epoch": 0.08493} {"step": 42470, "loss": 0.8264, "grad_norm": "3.121e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.472e+00", "anc_loss": "1.595e+00", "dlm_acc": "5.048e-01", "anc_acc": "4.778e-01", "epoch": 0.08494} {"step": 42475, "loss": 1.4109, "grad_norm": "7.507e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.043e-01", "anc_loss": "8.547e-01", "dlm_acc": "5.936e-01", "anc_acc": "5.829e-01", "epoch": 0.08495} {"step": 42480, "loss": 1.5484, "grad_norm": "3.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.252e-01", "anc_acc": "4.982e-01", "epoch": 0.08496} {"step": 42485, "loss": 1.246, "grad_norm": "5.321e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.305e-01", "anc_acc": "5.049e-01", "epoch": 0.08497} {"step": 42490, "loss": 1.0608, "grad_norm": "4.914e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.202e+00", "dlm_acc": "5.918e-01", "anc_acc": "5.620e-01", "epoch": 0.08498} {"step": 42495, "loss": 1.0296, "grad_norm": "4.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.965e-01", "anc_loss": "1.103e+00", "dlm_acc": "5.766e-01", "anc_acc": "5.488e-01", "epoch": 0.08499} {"step": 42500, "loss": 1.2029, "grad_norm": "2.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.132e+00", "dlm_acc": "6.417e-01", "anc_acc": "6.141e-01", "epoch": 0.085} {"step": 42505, "loss": 0.9856, "grad_norm": "3.070e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.094e-01", "anc_loss": "7.820e-01", "dlm_acc": "6.716e-01", "anc_acc": "6.561e-01", "epoch": 0.08501} {"step": 42510, "loss": 1.2081, "grad_norm": "2.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.013e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.161e-01", "anc_acc": "5.906e-01", "epoch": 0.08502} {"step": 42515, "loss": 1.5041, "grad_norm": "4.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.535e+00", "anc_loss": "1.664e+00", "dlm_acc": "5.179e-01", "anc_acc": "4.893e-01", "epoch": 0.08503} {"step": 42520, "loss": 1.2187, "grad_norm": "3.999e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.323e+00", "dlm_acc": "6.044e-01", "anc_acc": "5.781e-01", "epoch": 0.08504} {"step": 42525, "loss": 1.0771, "grad_norm": "2.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.453e-01", "anc_loss": "9.020e-01", "dlm_acc": "6.081e-01", "anc_acc": "5.973e-01", "epoch": 0.08505} {"step": 42530, "loss": 1.0, "grad_norm": "2.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.449e-01", "anc_loss": "5.629e-01", "dlm_acc": "6.454e-01", "anc_acc": "6.408e-01", "epoch": 0.08506} {"step": 42535, "loss": 1.0267, "grad_norm": "3.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.479e-01", "anc_loss": "3.852e-01", "dlm_acc": "7.740e-01", "anc_acc": "7.561e-01", "epoch": 0.08507} {"step": 42540, "loss": 1.5167, "grad_norm": "4.315e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.523e-01", "anc_loss": "9.494e-01", "dlm_acc": "7.180e-01", "anc_acc": "6.850e-01", "epoch": 0.08508} {"step": 42545, "loss": 1.1491, "grad_norm": "2.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.128e+00", "anc_loss": "1.236e+00", "dlm_acc": "6.093e-01", "anc_acc": "5.847e-01", "epoch": 0.08509} {"step": 42550, "loss": 1.174, "grad_norm": "3.905e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.168e+00", "dlm_acc": "5.321e-01", "anc_acc": "5.122e-01", "epoch": 0.0851} {"step": 42555, "loss": 1.0895, "grad_norm": "2.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.087e+00", "anc_loss": "1.141e+00", "dlm_acc": "4.895e-01", "anc_acc": "4.737e-01", "epoch": 0.08511} {"step": 42560, "loss": 1.2455, "grad_norm": "2.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.193e+00", "dlm_acc": "6.104e-01", "anc_acc": "5.813e-01", "epoch": 0.08512} {"step": 42565, "loss": 1.1269, "grad_norm": "3.344e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.852e-01", "anc_acc": "5.566e-01", "epoch": 0.08513} {"step": 42570, "loss": 1.2708, "grad_norm": "4.321e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.312e+00", "dlm_acc": "5.193e-01", "anc_acc": "4.929e-01", "epoch": 0.08514} {"step": 42575, "loss": 1.3509, "grad_norm": "2.961e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.549e+00", "anc_loss": "1.689e+00", "dlm_acc": "5.109e-01", "anc_acc": "4.829e-01", "epoch": 0.08515} {"step": 42580, "loss": 1.5544, "grad_norm": "5.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.324e+00", "dlm_acc": "6.053e-01", "anc_acc": "5.823e-01", "epoch": 0.08516} {"step": 42585, "loss": 0.8853, "grad_norm": "2.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.445e-01", "anc_loss": "9.719e-01", "dlm_acc": "5.939e-01", "anc_acc": "5.755e-01", "epoch": 0.08517} {"step": 42590, "loss": 1.4197, "grad_norm": "2.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.303e+00", "anc_loss": "1.445e+00", "dlm_acc": "5.659e-01", "anc_acc": "5.351e-01", "epoch": 0.08518} {"step": 42595, "loss": 1.1422, "grad_norm": "2.973e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.323e+00", "dlm_acc": "5.459e-01", "anc_acc": "4.970e-01", "epoch": 0.08519} {"step": 42600, "loss": 1.1587, "grad_norm": "3.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.218e+00", "dlm_acc": "6.076e-01", "anc_acc": "5.801e-01", "epoch": 0.0852} {"step": 42605, "loss": 1.1746, "grad_norm": "2.926e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.056e+00", "anc_loss": "1.163e+00", "dlm_acc": "5.398e-01", "anc_acc": "4.990e-01", "epoch": 0.08521} {"step": 42610, "loss": 1.1093, "grad_norm": "3.390e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.102e-01", "anc_loss": "1.041e+00", "dlm_acc": "6.258e-01", "anc_acc": "5.855e-01", "epoch": 0.08522} {"step": 42615, "loss": 1.22, "grad_norm": "1.185e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.076e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.941e-01", "anc_acc": "5.390e-01", "epoch": 0.08523} {"step": 42620, "loss": 1.322, "grad_norm": "5.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.264e+00", "anc_loss": "1.432e+00", "dlm_acc": "5.564e-01", "anc_acc": "5.227e-01", "epoch": 0.08524} {"step": 42625, "loss": 1.1852, "grad_norm": "5.440e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.414e-01", "anc_loss": "9.105e-01", "dlm_acc": "5.793e-01", "anc_acc": "5.553e-01", "epoch": 0.08525} {"step": 42630, "loss": 1.3366, "grad_norm": "3.450e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.295e+00", "dlm_acc": "4.905e-01", "anc_acc": "4.647e-01", "epoch": 0.08526} {"step": 42635, "loss": 1.4629, "grad_norm": "4.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.555e+00", "dlm_acc": "4.987e-01", "anc_acc": "4.692e-01", "epoch": 0.08527} {"step": 42640, "loss": 1.0623, "grad_norm": "5.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.266e-01", "anc_loss": "6.195e-01", "dlm_acc": "7.654e-01", "anc_acc": "7.367e-01", "epoch": 0.08528} {"step": 42645, "loss": 0.9471, "grad_norm": "1.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.359e-01", "anc_loss": "8.313e-01", "dlm_acc": "7.076e-01", "anc_acc": "6.793e-01", "epoch": 0.08529} {"step": 42650, "loss": 0.7349, "grad_norm": "3.230e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.570e-01", "anc_loss": "9.816e-01", "dlm_acc": "6.576e-01", "anc_acc": "6.265e-01", "epoch": 0.0853} {"step": 42655, "loss": 1.0237, "grad_norm": "6.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.214e+00", "anc_loss": "1.350e+00", "dlm_acc": "6.204e-01", "anc_acc": "5.871e-01", "epoch": 0.08531} {"step": 42660, "loss": 0.8853, "grad_norm": "1.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.562e-01", "anc_loss": "1.018e+00", "dlm_acc": "6.217e-01", "anc_acc": "5.700e-01", "epoch": 0.08532} {"step": 42665, "loss": 1.4743, "grad_norm": "3.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.088e+00", "anc_loss": "2.175e+00", "dlm_acc": "3.223e-01", "anc_acc": "3.032e-01", "epoch": 0.08533} {"step": 42670, "loss": 1.2013, "grad_norm": "2.049e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.222e+00", "anc_loss": "1.328e+00", "dlm_acc": "5.240e-01", "anc_acc": "4.950e-01", "epoch": 0.08534} {"step": 42675, "loss": 1.2013, "grad_norm": "3.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.232e+00", "anc_loss": "1.323e+00", "dlm_acc": "5.297e-01", "anc_acc": "5.068e-01", "epoch": 0.08535} {"step": 42680, "loss": 1.0823, "grad_norm": "2.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.322e-01", "anc_acc": "5.053e-01", "epoch": 0.08536} {"step": 42685, "loss": 1.6966, "grad_norm": "3.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.371e+00", "anc_loss": "1.501e+00", "dlm_acc": "4.812e-01", "anc_acc": "4.528e-01", "epoch": 0.08537} {"step": 42690, "loss": 1.006, "grad_norm": "3.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.010e+00", "anc_loss": "1.114e+00", "dlm_acc": "6.081e-01", "anc_acc": "5.780e-01", "epoch": 0.08538} {"step": 42695, "loss": 0.9943, "grad_norm": "3.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.025e+00", "anc_loss": "1.171e+00", "dlm_acc": "5.977e-01", "anc_acc": "5.515e-01", "epoch": 0.08539} {"step": 42700, "loss": 1.2357, "grad_norm": "3.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.213e+00", "anc_loss": "1.337e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.222e-01", "epoch": 0.0854} {"step": 42705, "loss": 1.1208, "grad_norm": "5.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.418e+00", "anc_loss": "1.519e+00", "dlm_acc": "4.605e-01", "anc_acc": "4.339e-01", "epoch": 0.08541} {"step": 42710, "loss": 1.0371, "grad_norm": "2.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.338e-01", "anc_acc": "5.074e-01", "epoch": 0.08542} {"step": 42715, "loss": 1.3144, "grad_norm": "2.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.376e+00", "dlm_acc": "5.194e-01", "anc_acc": "4.869e-01", "epoch": 0.08543} {"step": 42720, "loss": 0.8369, "grad_norm": "2.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.118e-01", "anc_acc": "4.749e-01", "epoch": 0.08544} {"step": 42725, "loss": 1.0237, "grad_norm": "4.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.386e+00", "anc_loss": "1.512e+00", "dlm_acc": "4.948e-01", "anc_acc": "4.643e-01", "epoch": 0.08545} {"step": 42730, "loss": 0.7896, "grad_norm": "2.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.403e+00", "dlm_acc": "5.640e-01", "anc_acc": "5.171e-01", "epoch": 0.08546} {"step": 42735, "loss": 0.7765, "grad_norm": "3.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.267e+00", "dlm_acc": "6.312e-01", "anc_acc": "6.002e-01", "epoch": 0.08547} {"step": 42740, "loss": 1.029, "grad_norm": "3.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.049e+00", "anc_loss": "1.238e+00", "dlm_acc": "6.186e-01", "anc_acc": "5.606e-01", "epoch": 0.08548} {"step": 42745, "loss": 1.2289, "grad_norm": "3.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.256e+00", "dlm_acc": "6.177e-01", "anc_acc": "5.836e-01", "epoch": 0.08549} {"step": 42750, "loss": 0.9992, "grad_norm": "3.498e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.585e-01", "anc_acc": "5.285e-01", "epoch": 0.0855} {"step": 42755, "loss": 1.0443, "grad_norm": "2.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.359e+00", "dlm_acc": "6.180e-01", "anc_acc": "5.769e-01", "epoch": 0.08551} {"step": 42760, "loss": 0.7587, "grad_norm": "3.447e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.813e-01", "anc_loss": "7.570e-01", "dlm_acc": "6.541e-01", "anc_acc": "6.340e-01", "epoch": 0.08552} {"step": 42765, "loss": 0.8065, "grad_norm": "2.648e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.182e+00", "dlm_acc": "5.855e-01", "anc_acc": "5.330e-01", "epoch": 0.08553} {"step": 42770, "loss": 1.5231, "grad_norm": "3.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.498e+00", "dlm_acc": "4.954e-01", "anc_acc": "4.674e-01", "epoch": 0.08554} {"step": 42775, "loss": 1.3958, "grad_norm": "4.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.368e+00", "dlm_acc": "5.914e-01", "anc_acc": "5.581e-01", "epoch": 0.08555} {"step": 42780, "loss": 1.3654, "grad_norm": "7.834e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.376e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.705e-01", "anc_acc": "5.365e-01", "epoch": 0.08556} {"step": 42785, "loss": 1.3496, "grad_norm": "3.054e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.423e+00", "dlm_acc": "6.116e-01", "anc_acc": "5.758e-01", "epoch": 0.08557} {"step": 42790, "loss": 1.4187, "grad_norm": "3.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.300e+00", "anc_loss": "1.426e+00", "dlm_acc": "5.794e-01", "anc_acc": "5.472e-01", "epoch": 0.08558} {"step": 42795, "loss": 1.0604, "grad_norm": "2.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.256e+00", "dlm_acc": "5.962e-01", "anc_acc": "5.655e-01", "epoch": 0.08559} {"step": 42800, "loss": 1.4565, "grad_norm": "3.643e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.631e+00", "dlm_acc": "5.359e-01", "anc_acc": "5.064e-01", "epoch": 0.0856} {"step": 42805, "loss": 1.5832, "grad_norm": "2.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.559e+00", "dlm_acc": "5.468e-01", "anc_acc": "5.159e-01", "epoch": 0.08561} {"step": 42810, "loss": 1.2535, "grad_norm": "2.350e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.172e+00", "anc_loss": "1.284e+00", "dlm_acc": "5.844e-01", "anc_acc": "5.536e-01", "epoch": 0.08562} {"step": 42815, "loss": 1.3961, "grad_norm": "4.261e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.458e+00", "anc_loss": "1.575e+00", "dlm_acc": "5.463e-01", "anc_acc": "5.203e-01", "epoch": 0.08563} {"step": 42820, "loss": 1.8517, "grad_norm": "2.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.330e-01", "anc_acc": "5.037e-01", "epoch": 0.08564} {"step": 42825, "loss": 1.1823, "grad_norm": "2.474e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.901e-01", "anc_acc": "5.580e-01", "epoch": 0.08565} {"step": 42830, "loss": 1.4632, "grad_norm": "3.227e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.973e-01", "anc_loss": "1.108e+00", "dlm_acc": "6.384e-01", "anc_acc": "6.080e-01", "epoch": 0.08566} {"step": 42835, "loss": 1.6546, "grad_norm": "5.166e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.163e+00", "anc_loss": "2.227e+00", "dlm_acc": "2.369e-01", "anc_acc": "2.244e-01", "epoch": 0.08567} {"step": 42840, "loss": 1.2056, "grad_norm": "2.036e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.189e+00", "dlm_acc": "6.075e-01", "anc_acc": "5.809e-01", "epoch": 0.08568} {"step": 42845, "loss": 1.0541, "grad_norm": "2.195e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.648e-01", "anc_loss": "1.080e+00", "dlm_acc": "6.114e-01", "anc_acc": "5.773e-01", "epoch": 0.08569} {"step": 42850, "loss": 1.2321, "grad_norm": "3.728e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.067e+00", "anc_loss": "1.179e+00", "dlm_acc": "6.212e-01", "anc_acc": "5.931e-01", "epoch": 0.0857} {"step": 42855, "loss": 1.1115, "grad_norm": "1.557e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.664e-01", "anc_loss": "1.080e+00", "dlm_acc": "6.392e-01", "anc_acc": "6.082e-01", "epoch": 0.08571} {"step": 42860, "loss": 1.0983, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.211e+00", "dlm_acc": "6.025e-01", "anc_acc": "5.779e-01", "epoch": 0.08572} {"step": 42865, "loss": 1.1967, "grad_norm": "3.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.181e+00", "anc_loss": "1.281e+00", "dlm_acc": "5.948e-01", "anc_acc": "5.693e-01", "epoch": 0.08573} {"step": 42870, "loss": 1.4439, "grad_norm": "3.774e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.211e-01", "anc_acc": "4.941e-01", "epoch": 0.08574} {"step": 42875, "loss": 1.0625, "grad_norm": "2.675e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.719e-01", "anc_loss": "1.071e+00", "dlm_acc": "6.165e-01", "anc_acc": "5.911e-01", "epoch": 0.08575} {"step": 42880, "loss": 1.0641, "grad_norm": "3.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.156e+00", "dlm_acc": "6.043e-01", "anc_acc": "5.740e-01", "epoch": 0.08576} {"step": 42885, "loss": 1.2999, "grad_norm": "3.173e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.344e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.336e-01", "epoch": 0.08577} {"step": 42890, "loss": 1.2078, "grad_norm": "4.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.111e+00", "anc_loss": "1.221e+00", "dlm_acc": "6.192e-01", "anc_acc": "5.915e-01", "epoch": 0.08578} {"step": 42895, "loss": 1.6287, "grad_norm": "3.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.897e+00", "anc_loss": "2.056e+00", "dlm_acc": "4.568e-01", "anc_acc": "4.264e-01", "epoch": 0.08579} {"step": 42900, "loss": 1.3063, "grad_norm": "3.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.222e+00", "anc_loss": "1.346e+00", "dlm_acc": "6.029e-01", "anc_acc": "5.703e-01", "epoch": 0.0858} {"step": 42905, "loss": 1.5938, "grad_norm": "4.405e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.097e+00", "anc_loss": "1.220e+00", "dlm_acc": "6.313e-01", "anc_acc": "6.019e-01", "epoch": 0.08581} {"step": 42910, "loss": 1.8678, "grad_norm": "1.318e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.878e-01", "anc_acc": "5.593e-01", "epoch": 0.08582} {"step": 42915, "loss": 1.2944, "grad_norm": "2.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.350e+00", "anc_loss": "1.482e+00", "dlm_acc": "4.758e-01", "anc_acc": "4.396e-01", "epoch": 0.08583} {"step": 42920, "loss": 1.3729, "grad_norm": "4.352e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.091e+00", "anc_loss": "1.209e+00", "dlm_acc": "5.405e-01", "anc_acc": "5.095e-01", "epoch": 0.08584} {"step": 42925, "loss": 1.4521, "grad_norm": "4.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.377e+00", "dlm_acc": "5.395e-01", "anc_acc": "5.067e-01", "epoch": 0.08585} {"step": 42930, "loss": 0.9487, "grad_norm": "3.096e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.258e-01", "anc_loss": "1.020e+00", "dlm_acc": "6.622e-01", "anc_acc": "6.042e-01", "epoch": 0.08586} {"step": 42935, "loss": 1.6519, "grad_norm": "2.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.423e+00", "anc_loss": "2.470e+00", "dlm_acc": "1.428e-01", "anc_acc": "1.346e-01", "epoch": 0.08587} {"step": 42940, "loss": 1.799, "grad_norm": "4.532e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.659e+00", "anc_loss": "2.706e+00", "dlm_acc": "1.192e-01", "anc_acc": "1.084e-01", "epoch": 0.08588} {"step": 42945, "loss": 1.2525, "grad_norm": "2.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.820e-01", "anc_loss": "9.855e-01", "dlm_acc": "6.843e-01", "anc_acc": "6.575e-01", "epoch": 0.08589} {"step": 42950, "loss": 1.7303, "grad_norm": "4.008e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.612e+00", "anc_loss": "2.712e+00", "dlm_acc": "8.723e-02", "anc_acc": "6.236e-02", "epoch": 0.0859} {"step": 42955, "loss": 1.2689, "grad_norm": "2.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.645e+00", "anc_loss": "1.845e+00", "dlm_acc": "4.049e-01", "anc_acc": "3.491e-01", "epoch": 0.08591} {"step": 42960, "loss": 1.3635, "grad_norm": "3.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.160e+00", "dlm_acc": "6.524e-01", "anc_acc": "6.185e-01", "epoch": 0.08592} {"step": 42965, "loss": 1.0982, "grad_norm": "4.232e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.181e+00", "dlm_acc": "5.338e-01", "anc_acc": "4.822e-01", "epoch": 0.08593} {"step": 42970, "loss": 0.9474, "grad_norm": "2.422e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.688e-01", "anc_loss": "1.124e+00", "dlm_acc": "5.804e-01", "anc_acc": "5.214e-01", "epoch": 0.08594} {"step": 42975, "loss": 1.4905, "grad_norm": "5.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.124e+00", "anc_loss": "2.199e+00", "dlm_acc": "2.633e-01", "anc_acc": "2.469e-01", "epoch": 0.08595} {"step": 42980, "loss": 0.8882, "grad_norm": "2.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.453e+00", "anc_loss": "1.555e+00", "dlm_acc": "3.882e-01", "anc_acc": "3.631e-01", "epoch": 0.08596} {"step": 42985, "loss": 1.403, "grad_norm": "7.032e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.477e+00", "dlm_acc": "5.763e-01", "anc_acc": "5.498e-01", "epoch": 0.08597} {"step": 42990, "loss": 1.2447, "grad_norm": "3.491e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.002e-01", "epoch": 0.08598} {"step": 42995, "loss": 1.3773, "grad_norm": "3.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.486e+00", "dlm_acc": "5.484e-01", "anc_acc": "5.182e-01", "epoch": 0.08599} {"step": 43000, "loss": 1.3107, "grad_norm": "3.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.930e-01", "anc_loss": "1.145e+00", "dlm_acc": "6.301e-01", "anc_acc": "5.814e-01", "epoch": 0.086} {"step": 43005, "loss": 1.2839, "grad_norm": "3.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.730e-01", "anc_loss": "1.051e+00", "dlm_acc": "5.786e-01", "anc_acc": "5.586e-01", "epoch": 0.08601} {"step": 43010, "loss": 1.5319, "grad_norm": "5.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.118e+00", "anc_loss": "1.221e+00", "dlm_acc": "5.954e-01", "anc_acc": "5.650e-01", "epoch": 0.08602} {"step": 43015, "loss": 1.1969, "grad_norm": "1.320e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.820e-01", "anc_loss": "8.746e-01", "dlm_acc": "6.096e-01", "anc_acc": "5.738e-01", "epoch": 0.08603} {"step": 43020, "loss": 1.0711, "grad_norm": "2.237e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.150e-01", "anc_loss": "5.500e-01", "dlm_acc": "6.603e-01", "anc_acc": "6.395e-01", "epoch": 0.08604} {"step": 43025, "loss": 1.3664, "grad_norm": "4.709e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.699e-01", "anc_loss": "8.174e-01", "dlm_acc": "5.255e-01", "anc_acc": "5.100e-01", "epoch": 0.08605} {"step": 43030, "loss": 0.8629, "grad_norm": "2.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.832e-01", "anc_loss": "8.930e-01", "dlm_acc": "6.137e-01", "anc_acc": "5.747e-01", "epoch": 0.08606} {"step": 43035, "loss": 0.8551, "grad_norm": "2.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.496e-01", "anc_loss": "1.064e+00", "dlm_acc": "6.234e-01", "anc_acc": "5.912e-01", "epoch": 0.08607} {"step": 43040, "loss": 1.2261, "grad_norm": "4.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.365e+00", "dlm_acc": "5.365e-01", "anc_acc": "4.985e-01", "epoch": 0.08608} {"step": 43045, "loss": 1.0413, "grad_norm": "1.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.805e+00", "anc_loss": "1.895e+00", "dlm_acc": "3.428e-01", "anc_acc": "3.129e-01", "epoch": 0.08609} {"step": 43050, "loss": 1.2597, "grad_norm": "3.099e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.145e+00", "dlm_acc": "6.364e-01", "anc_acc": "5.925e-01", "epoch": 0.0861} {"step": 43055, "loss": 1.5722, "grad_norm": "3.396e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.408e+00", "anc_loss": "1.597e+00", "dlm_acc": "5.403e-01", "anc_acc": "4.861e-01", "epoch": 0.08611} {"step": 43060, "loss": 1.3578, "grad_norm": "3.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.211e+00", "dlm_acc": "5.766e-01", "anc_acc": "5.431e-01", "epoch": 0.08612} {"step": 43065, "loss": 1.175, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.758e-01", "anc_loss": "9.695e-01", "dlm_acc": "6.474e-01", "anc_acc": "6.212e-01", "epoch": 0.08613} {"step": 43070, "loss": 1.3774, "grad_norm": "3.537e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.609e+00", "dlm_acc": "5.375e-01", "anc_acc": "5.082e-01", "epoch": 0.08614} {"step": 43075, "loss": 1.2529, "grad_norm": "4.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.204e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.827e-01", "anc_acc": "5.173e-01", "epoch": 0.08615} {"step": 43080, "loss": 1.2986, "grad_norm": "6.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.312e-01", "anc_acc": "4.917e-01", "epoch": 0.08616} {"step": 43085, "loss": 0.8915, "grad_norm": "2.456e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.244e-01", "anc_loss": "4.617e-01", "dlm_acc": "6.869e-01", "anc_acc": "6.654e-01", "epoch": 0.08617} {"step": 43090, "loss": 1.1221, "grad_norm": "2.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.259e+00", "dlm_acc": "3.687e-01", "anc_acc": "3.536e-01", "epoch": 0.08618} {"step": 43095, "loss": 0.9674, "grad_norm": "1.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.734e-01", "anc_loss": "8.383e-01", "dlm_acc": "6.723e-01", "anc_acc": "6.560e-01", "epoch": 0.08619} {"step": 43100, "loss": 1.7868, "grad_norm": "3.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.473e+00", "dlm_acc": "5.584e-01", "anc_acc": "5.260e-01", "epoch": 0.0862} {"step": 43105, "loss": 1.5595, "grad_norm": "8.758e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.224e-01", "anc_acc": "4.832e-01", "epoch": 0.08621} {"step": 43110, "loss": 1.3816, "grad_norm": "1.070e+00", "learning_rate": "1.000e-04", "dlm_loss": "9.938e-01", "anc_loss": "1.048e+00", "dlm_acc": "4.617e-01", "anc_acc": "4.482e-01", "epoch": 0.08622} {"step": 43115, "loss": 1.1352, "grad_norm": "3.305e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.643e+00", "anc_loss": "1.759e+00", "dlm_acc": "4.643e-01", "anc_acc": "4.380e-01", "epoch": 0.08623} {"step": 43120, "loss": 1.2628, "grad_norm": "2.909e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.059e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.443e-01", "anc_acc": "6.065e-01", "epoch": 0.08624} {"step": 43125, "loss": 1.1421, "grad_norm": "3.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.391e+00", "dlm_acc": "4.997e-01", "anc_acc": "4.658e-01", "epoch": 0.08625} {"step": 43130, "loss": 0.98, "grad_norm": "2.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.023e-01", "anc_loss": "9.133e-01", "dlm_acc": "6.189e-01", "anc_acc": "5.681e-01", "epoch": 0.08626} {"step": 43135, "loss": 1.5607, "grad_norm": "3.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.436e+00", "dlm_acc": "5.362e-01", "anc_acc": "5.029e-01", "epoch": 0.08627} {"step": 43140, "loss": 0.8564, "grad_norm": "2.218e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.955e-01", "anc_loss": "8.223e-01", "dlm_acc": "6.852e-01", "anc_acc": "6.359e-01", "epoch": 0.08628} {"step": 43145, "loss": 1.2134, "grad_norm": "2.963e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.200e+00", "dlm_acc": "6.189e-01", "anc_acc": "5.825e-01", "epoch": 0.08629} {"step": 43150, "loss": 1.6162, "grad_norm": "4.496e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.423e+00", "dlm_acc": "5.603e-01", "anc_acc": "5.268e-01", "epoch": 0.0863} {"step": 43155, "loss": 1.1534, "grad_norm": "3.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.546e-01", "anc_acc": "5.180e-01", "epoch": 0.08631} {"step": 43160, "loss": 1.0506, "grad_norm": "4.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.396e-01", "anc_acc": "4.987e-01", "epoch": 0.08632} {"step": 43165, "loss": 1.4002, "grad_norm": "5.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.523e+00", "anc_loss": "1.659e+00", "dlm_acc": "4.422e-01", "anc_acc": "4.100e-01", "epoch": 0.08633} {"step": 43170, "loss": 1.8351, "grad_norm": "2.638e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.635e+00", "anc_loss": "1.767e+00", "dlm_acc": "4.763e-01", "anc_acc": "4.488e-01", "epoch": 0.08634} {"step": 43175, "loss": 1.5102, "grad_norm": "4.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.490e+00", "dlm_acc": "5.619e-01", "anc_acc": "5.330e-01", "epoch": 0.08635} {"step": 43180, "loss": 1.2266, "grad_norm": "3.794e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.965e-01", "anc_loss": "7.871e-01", "dlm_acc": "6.662e-01", "anc_acc": "6.362e-01", "epoch": 0.08636} {"step": 43185, "loss": 1.1963, "grad_norm": "2.798e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.496e-01", "anc_loss": "1.027e+00", "dlm_acc": "5.771e-01", "anc_acc": "5.578e-01", "epoch": 0.08637} {"step": 43190, "loss": 1.159, "grad_norm": "2.916e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.684e-01", "anc_loss": "1.009e+00", "dlm_acc": "6.523e-01", "anc_acc": "6.027e-01", "epoch": 0.08638} {"step": 43195, "loss": 1.3363, "grad_norm": "3.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.623e-01", "anc_acc": "5.260e-01", "epoch": 0.08639} {"step": 43200, "loss": 1.4921, "grad_norm": "3.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.614e+00", "dlm_acc": "5.006e-01", "anc_acc": "4.662e-01", "epoch": 0.0864} {"step": 43205, "loss": 1.2844, "grad_norm": "3.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.172e+00", "dlm_acc": "6.111e-01", "anc_acc": "5.597e-01", "epoch": 0.08641} {"step": 43210, "loss": 1.3214, "grad_norm": "2.660e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.508e-01", "anc_loss": "7.035e-01", "dlm_acc": "6.858e-01", "anc_acc": "6.620e-01", "epoch": 0.08642} {"step": 43215, "loss": 1.3755, "grad_norm": "5.304e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.579e-01", "anc_acc": "5.112e-01", "epoch": 0.08643} {"step": 43220, "loss": 1.1791, "grad_norm": "4.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.844e-01", "anc_loss": "9.508e-01", "dlm_acc": "5.082e-01", "anc_acc": "4.927e-01", "epoch": 0.08644} {"step": 43225, "loss": 1.0447, "grad_norm": "5.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.374e+00", "dlm_acc": "5.800e-01", "anc_acc": "5.379e-01", "epoch": 0.08645} {"step": 43230, "loss": 1.5571, "grad_norm": "4.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.505e+00", "anc_loss": "1.663e+00", "dlm_acc": "5.220e-01", "anc_acc": "4.878e-01", "epoch": 0.08646} {"step": 43235, "loss": 1.5088, "grad_norm": "1.412e+01", "learning_rate": "1.000e-04", "dlm_loss": "1.576e+00", "anc_loss": "1.685e+00", "dlm_acc": "4.931e-01", "anc_acc": "4.668e-01", "epoch": 0.08647} {"step": 43240, "loss": 1.191, "grad_norm": "3.273e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.438e-01", "anc_loss": "7.207e-01", "dlm_acc": "7.186e-01", "anc_acc": "6.922e-01", "epoch": 0.08648} {"step": 43245, "loss": 1.301, "grad_norm": "7.332e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.208e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.989e-01", "anc_acc": "5.468e-01", "epoch": 0.08649} {"step": 43250, "loss": 1.3153, "grad_norm": "2.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.375e-01", "anc_loss": "1.000e+00", "dlm_acc": "6.757e-01", "anc_acc": "6.244e-01", "epoch": 0.0865} {"step": 43255, "loss": 1.1397, "grad_norm": "5.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.113e-01", "anc_loss": "9.340e-01", "dlm_acc": "6.670e-01", "anc_acc": "6.327e-01", "epoch": 0.08651} {"step": 43260, "loss": 1.3714, "grad_norm": "2.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.378e+00", "dlm_acc": "6.025e-01", "anc_acc": "5.503e-01", "epoch": 0.08652} {"step": 43265, "loss": 0.9709, "grad_norm": "1.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.133e-01", "anc_loss": "9.375e-01", "dlm_acc": "6.777e-01", "anc_acc": "6.411e-01", "epoch": 0.08653} {"step": 43270, "loss": 1.0817, "grad_norm": "3.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.174e+00", "dlm_acc": "5.639e-01", "anc_acc": "5.246e-01", "epoch": 0.08654} {"step": 43275, "loss": 1.1091, "grad_norm": "2.978e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.460e-01", "anc_loss": "7.477e-01", "dlm_acc": "7.207e-01", "anc_acc": "6.820e-01", "epoch": 0.08655} {"step": 43280, "loss": 0.9724, "grad_norm": "3.576e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.938e-01", "anc_loss": "5.605e-01", "dlm_acc": "7.377e-01", "anc_acc": "7.151e-01", "epoch": 0.08656} {"step": 43285, "loss": 1.4022, "grad_norm": "3.322e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.158e+00", "dlm_acc": "6.432e-01", "anc_acc": "5.983e-01", "epoch": 0.08657} {"step": 43290, "loss": 1.2723, "grad_norm": "2.329e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.781e-01", "anc_loss": "1.024e+00", "dlm_acc": "6.444e-01", "anc_acc": "6.027e-01", "epoch": 0.08658} {"step": 43295, "loss": 0.9202, "grad_norm": "2.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.371e-01", "anc_loss": "8.629e-01", "dlm_acc": "6.981e-01", "anc_acc": "6.568e-01", "epoch": 0.08659} {"step": 43300, "loss": 0.6921, "grad_norm": "3.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.008e-01", "anc_loss": "1.012e+00", "dlm_acc": "6.358e-01", "anc_acc": "6.021e-01", "epoch": 0.0866} {"step": 43305, "loss": 0.8273, "grad_norm": "2.428e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.193e+00", "dlm_acc": "5.988e-01", "anc_acc": "5.642e-01", "epoch": 0.08661} {"step": 43310, "loss": 1.1059, "grad_norm": "3.528e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.256e-01", "anc_acc": "4.928e-01", "epoch": 0.08662} {"step": 43315, "loss": 0.9152, "grad_norm": "3.977e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.652e-01", "anc_loss": "9.789e-01", "dlm_acc": "6.911e-01", "anc_acc": "6.580e-01", "epoch": 0.08663} {"step": 43320, "loss": 1.254, "grad_norm": "3.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.918e-01", "anc_loss": "8.059e-01", "dlm_acc": "7.535e-01", "anc_acc": "7.172e-01", "epoch": 0.08664} {"step": 43325, "loss": 1.1205, "grad_norm": "2.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.515e+00", "dlm_acc": "5.115e-01", "anc_acc": "4.771e-01", "epoch": 0.08665} {"step": 43330, "loss": 1.1146, "grad_norm": "2.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.254e+00", "dlm_acc": "5.364e-01", "anc_acc": "5.120e-01", "epoch": 0.08666} {"step": 43335, "loss": 1.2591, "grad_norm": "2.739e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.677e-01", "anc_acc": "5.378e-01", "epoch": 0.08667} {"step": 43340, "loss": 1.3415, "grad_norm": "7.581e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.603e+00", "anc_loss": "1.718e+00", "dlm_acc": "5.150e-01", "anc_acc": "4.879e-01", "epoch": 0.08668} {"step": 43345, "loss": 1.2412, "grad_norm": "4.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.559e+00", "anc_loss": "1.669e+00", "dlm_acc": "4.953e-01", "anc_acc": "4.684e-01", "epoch": 0.08669} {"step": 43350, "loss": 1.1009, "grad_norm": "3.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.650e+00", "dlm_acc": "5.175e-01", "anc_acc": "4.899e-01", "epoch": 0.0867} {"step": 43355, "loss": 0.7328, "grad_norm": "3.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.932e-02", "anc_loss": "1.000e-01", "dlm_acc": "9.516e-01", "anc_acc": "9.395e-01", "epoch": 0.08671} {"step": 43360, "loss": 0.6337, "grad_norm": "3.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.391e-01", "anc_loss": "5.118e-01", "dlm_acc": "8.463e-01", "anc_acc": "8.273e-01", "epoch": 0.08672} {"step": 43365, "loss": 1.1828, "grad_norm": "3.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.250e+00", "anc_loss": "1.356e+00", "dlm_acc": "6.213e-01", "anc_acc": "5.994e-01", "epoch": 0.08673} {"step": 43370, "loss": 1.3675, "grad_norm": "6.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.674e+00", "anc_loss": "1.806e+00", "dlm_acc": "5.150e-01", "anc_acc": "4.858e-01", "epoch": 0.08674} {"step": 43375, "loss": 1.2821, "grad_norm": "4.263e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.089e+00", "anc_loss": "1.206e+00", "dlm_acc": "6.532e-01", "anc_acc": "6.191e-01", "epoch": 0.08675} {"step": 43380, "loss": 1.3867, "grad_norm": "5.598e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.177e+00", "anc_loss": "1.308e+00", "dlm_acc": "6.080e-01", "anc_acc": "5.751e-01", "epoch": 0.08676} {"step": 43385, "loss": 1.0884, "grad_norm": "4.021e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.246e+00", "dlm_acc": "5.982e-01", "anc_acc": "5.692e-01", "epoch": 0.08677} {"step": 43390, "loss": 0.9815, "grad_norm": "4.865e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.126e+00", "anc_loss": "1.225e+00", "dlm_acc": "6.084e-01", "anc_acc": "5.822e-01", "epoch": 0.08678} {"step": 43395, "loss": 1.0381, "grad_norm": "3.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.313e+00", "dlm_acc": "5.648e-01", "anc_acc": "5.367e-01", "epoch": 0.08679} {"step": 43400, "loss": 1.2574, "grad_norm": "2.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.553e+00", "dlm_acc": "5.423e-01", "anc_acc": "5.147e-01", "epoch": 0.0868} {"step": 43405, "loss": 0.9363, "grad_norm": "6.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.483e+00", "dlm_acc": "5.181e-01", "anc_acc": "4.882e-01", "epoch": 0.08681} {"step": 43410, "loss": 0.9139, "grad_norm": "3.292e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.576e-01", "anc_acc": "5.219e-01", "epoch": 0.08682} {"step": 43415, "loss": 1.0731, "grad_norm": "5.153e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.760e-01", "anc_acc": "5.496e-01", "epoch": 0.08683} {"step": 43420, "loss": 0.7541, "grad_norm": "2.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.258e+00", "dlm_acc": "5.880e-01", "anc_acc": "5.557e-01", "epoch": 0.08684} {"step": 43425, "loss": 1.2529, "grad_norm": "7.302e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.305e+00", "anc_loss": "1.342e+00", "dlm_acc": "3.727e-01", "anc_acc": "3.654e-01", "epoch": 0.08685} {"step": 43430, "loss": 1.2805, "grad_norm": "5.946e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.540e+00", "anc_loss": "1.637e+00", "dlm_acc": "4.791e-01", "anc_acc": "4.569e-01", "epoch": 0.08686} {"step": 43435, "loss": 1.3704, "grad_norm": "4.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.259e+00", "anc_loss": "2.350e+00", "dlm_acc": "2.791e-01", "anc_acc": "2.625e-01", "epoch": 0.08687} {"step": 43440, "loss": 0.5582, "grad_norm": "2.137e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.145e-01", "anc_loss": "8.943e-01", "dlm_acc": "6.661e-01", "anc_acc": "6.436e-01", "epoch": 0.08688} {"step": 43445, "loss": 0.9939, "grad_norm": "4.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.369e+00", "dlm_acc": "5.330e-01", "anc_acc": "5.095e-01", "epoch": 0.08689} {"step": 43450, "loss": 0.8657, "grad_norm": "2.424e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.945e-01", "anc_loss": "1.116e+00", "dlm_acc": "6.263e-01", "anc_acc": "5.960e-01", "epoch": 0.0869} {"step": 43455, "loss": 1.013, "grad_norm": "2.200e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.362e+00", "anc_loss": "1.481e+00", "dlm_acc": "5.245e-01", "anc_acc": "4.936e-01", "epoch": 0.08691} {"step": 43460, "loss": 0.9601, "grad_norm": "3.351e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.828e-01", "anc_loss": "1.129e+00", "dlm_acc": "6.426e-01", "anc_acc": "6.062e-01", "epoch": 0.08692} {"step": 43465, "loss": 0.8289, "grad_norm": "2.639e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.301e-01", "anc_loss": "1.015e+00", "dlm_acc": "6.227e-01", "anc_acc": "6.003e-01", "epoch": 0.08693} {"step": 43470, "loss": 1.0681, "grad_norm": "3.101e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.201e+00", "anc_loss": "1.296e+00", "dlm_acc": "5.133e-01", "anc_acc": "4.917e-01", "epoch": 0.08694} {"step": 43475, "loss": 0.8716, "grad_norm": "3.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.845e-01", "anc_acc": "5.503e-01", "epoch": 0.08695} {"step": 43480, "loss": 1.384, "grad_norm": "3.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.914e+00", "anc_loss": "2.048e+00", "dlm_acc": "4.651e-01", "anc_acc": "4.399e-01", "epoch": 0.08696} {"step": 43485, "loss": 1.1191, "grad_norm": "3.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.508e+00", "dlm_acc": "5.373e-01", "anc_acc": "5.084e-01", "epoch": 0.08697} {"step": 43490, "loss": 1.018, "grad_norm": "4.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.319e+00", "anc_loss": "1.397e+00", "dlm_acc": "4.260e-01", "anc_acc": "4.047e-01", "epoch": 0.08698} {"step": 43495, "loss": 0.9831, "grad_norm": "4.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.827e-01", "anc_loss": "8.058e-01", "dlm_acc": "7.316e-01", "anc_acc": "6.948e-01", "epoch": 0.08699} {"step": 43500, "loss": 0.8118, "grad_norm": "3.131e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.621e-01", "anc_loss": "6.340e-01", "dlm_acc": "7.366e-01", "anc_acc": "7.117e-01", "epoch": 0.087} {"step": 43505, "loss": 0.7815, "grad_norm": "2.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.159e+00", "dlm_acc": "6.022e-01", "anc_acc": "5.751e-01", "epoch": 0.08701} {"step": 43510, "loss": 1.2097, "grad_norm": "2.523e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.973e+00", "anc_loss": "2.028e+00", "dlm_acc": "2.780e-01", "anc_acc": "2.650e-01", "epoch": 0.08702} {"step": 43515, "loss": 1.3712, "grad_norm": "1.615e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.675e+00", "anc_loss": "1.805e+00", "dlm_acc": "4.090e-01", "anc_acc": "3.799e-01", "epoch": 0.08703} {"step": 43520, "loss": 1.6787, "grad_norm": "3.911e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.116e+00", "anc_loss": "2.253e+00", "dlm_acc": "3.825e-01", "anc_acc": "3.531e-01", "epoch": 0.08704} {"step": 43525, "loss": 1.2474, "grad_norm": "2.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.575e+00", "anc_loss": "1.659e+00", "dlm_acc": "4.671e-01", "anc_acc": "4.457e-01", "epoch": 0.08705} {"step": 43530, "loss": 1.3536, "grad_norm": "4.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.234e-01", "anc_loss": "9.836e-01", "dlm_acc": "5.830e-01", "anc_acc": "5.647e-01", "epoch": 0.08706} {"step": 43535, "loss": 1.1246, "grad_norm": "2.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.292e+00", "dlm_acc": "5.958e-01", "anc_acc": "5.624e-01", "epoch": 0.08707} {"step": 43540, "loss": 1.2502, "grad_norm": "4.005e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.746e-01", "anc_loss": "1.092e+00", "dlm_acc": "6.418e-01", "anc_acc": "6.092e-01", "epoch": 0.08708} {"step": 43545, "loss": 0.987, "grad_norm": "3.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.953e-01", "anc_loss": "8.949e-01", "dlm_acc": "6.806e-01", "anc_acc": "6.471e-01", "epoch": 0.08709} {"step": 43550, "loss": 0.9398, "grad_norm": "5.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.715e-01", "anc_loss": "1.123e+00", "dlm_acc": "6.817e-01", "anc_acc": "6.436e-01", "epoch": 0.0871} {"step": 43555, "loss": 0.9456, "grad_norm": "1.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.115e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.613e-01", "anc_acc": "5.405e-01", "epoch": 0.08711} {"step": 43560, "loss": 0.8359, "grad_norm": "1.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.075e+00", "anc_loss": "1.197e+00", "dlm_acc": "6.253e-01", "anc_acc": "5.856e-01", "epoch": 0.08712} {"step": 43565, "loss": 0.7529, "grad_norm": "3.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.656e-01", "anc_loss": "7.691e-01", "dlm_acc": "6.977e-01", "anc_acc": "6.617e-01", "epoch": 0.08713} {"step": 43570, "loss": 1.114, "grad_norm": "2.902e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.614e-01", "anc_acc": "5.269e-01", "epoch": 0.08714} {"step": 43575, "loss": 1.0158, "grad_norm": "2.579e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.212e+00", "dlm_acc": "6.095e-01", "anc_acc": "5.709e-01", "epoch": 0.08715} {"step": 43580, "loss": 1.0396, "grad_norm": "2.841e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.598e-01", "anc_loss": "9.023e-01", "dlm_acc": "6.783e-01", "anc_acc": "6.383e-01", "epoch": 0.08716} {"step": 43585, "loss": 0.9392, "grad_norm": "2.709e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.879e-01", "anc_loss": "1.048e+00", "dlm_acc": "6.854e-01", "anc_acc": "6.392e-01", "epoch": 0.08717} {"step": 43590, "loss": 1.0416, "grad_norm": "4.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.078e+00", "anc_loss": "1.166e+00", "dlm_acc": "5.554e-01", "anc_acc": "5.346e-01", "epoch": 0.08718} {"step": 43595, "loss": 1.1437, "grad_norm": "3.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.497e+00", "dlm_acc": "5.384e-01", "anc_acc": "5.058e-01", "epoch": 0.08719} {"step": 43600, "loss": 1.4788, "grad_norm": "3.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.199e+00", "anc_loss": "1.346e+00", "dlm_acc": "6.154e-01", "anc_acc": "5.764e-01", "epoch": 0.0872} {"step": 43605, "loss": 1.2747, "grad_norm": "4.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.673e+00", "anc_loss": "1.792e+00", "dlm_acc": "2.930e-01", "anc_acc": "2.640e-01", "epoch": 0.08721} {"step": 43610, "loss": 1.5368, "grad_norm": "2.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.962e+00", "anc_loss": "2.105e+00", "dlm_acc": "2.708e-01", "anc_acc": "2.354e-01", "epoch": 0.08722} {"step": 43615, "loss": 1.6574, "grad_norm": "4.417e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.059e+00", "anc_loss": "2.208e+00", "dlm_acc": "2.769e-01", "anc_acc": "2.397e-01", "epoch": 0.08723} {"step": 43620, "loss": 1.5861, "grad_norm": "3.132e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.881e+00", "anc_loss": "2.033e+00", "dlm_acc": "3.079e-01", "anc_acc": "2.643e-01", "epoch": 0.08724} {"step": 43625, "loss": 0.9063, "grad_norm": "3.979e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.128e+00", "dlm_acc": "5.646e-01", "anc_acc": "5.357e-01", "epoch": 0.08725} {"step": 43630, "loss": 0.9064, "grad_norm": "6.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.375e-01", "anc_loss": "9.812e-01", "dlm_acc": "7.052e-01", "anc_acc": "6.620e-01", "epoch": 0.08726} {"step": 43635, "loss": 1.1171, "grad_norm": "2.406e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.488e-01", "anc_loss": "8.594e-01", "dlm_acc": "6.989e-01", "anc_acc": "6.690e-01", "epoch": 0.08727} {"step": 43640, "loss": 1.1899, "grad_norm": "2.438e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.432e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.086e-01", "anc_acc": "4.785e-01", "epoch": 0.08728} {"step": 43645, "loss": 1.1689, "grad_norm": "3.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.160e-01", "anc_loss": "8.199e-01", "dlm_acc": "6.844e-01", "anc_acc": "6.530e-01", "epoch": 0.08729} {"step": 43650, "loss": 1.0768, "grad_norm": "5.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.186e+00", "anc_loss": "1.311e+00", "dlm_acc": "5.838e-01", "anc_acc": "5.443e-01", "epoch": 0.0873} {"step": 43655, "loss": 1.1869, "grad_norm": "3.098e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.469e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.333e-01", "anc_acc": "6.004e-01", "epoch": 0.08731} {"step": 43660, "loss": 1.5848, "grad_norm": "3.345e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.212e+00", "anc_loss": "1.338e+00", "dlm_acc": "5.958e-01", "anc_acc": "5.652e-01", "epoch": 0.08732} {"step": 43665, "loss": 1.0658, "grad_norm": "8.690e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.430e-01", "anc_loss": "9.547e-01", "dlm_acc": "6.578e-01", "anc_acc": "6.221e-01", "epoch": 0.08733} {"step": 43670, "loss": 1.2708, "grad_norm": "3.653e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.284e+00", "dlm_acc": "6.223e-01", "anc_acc": "5.953e-01", "epoch": 0.08734} {"step": 43675, "loss": 1.0911, "grad_norm": "3.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.432e+00", "dlm_acc": "5.658e-01", "anc_acc": "5.346e-01", "epoch": 0.08735} {"step": 43680, "loss": 0.983, "grad_norm": "4.450e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.521e-01", "anc_acc": "5.276e-01", "epoch": 0.08736} {"step": 43685, "loss": 1.0719, "grad_norm": "4.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.073e-01", "anc_acc": "4.791e-01", "epoch": 0.08737} {"step": 43690, "loss": 1.1849, "grad_norm": "4.580e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.172e-01", "anc_loss": "9.422e-01", "dlm_acc": "6.854e-01", "anc_acc": "6.491e-01", "epoch": 0.08738} {"step": 43695, "loss": 1.0507, "grad_norm": "3.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.383e-01", "anc_loss": "4.321e-01", "dlm_acc": "8.734e-01", "anc_acc": "8.438e-01", "epoch": 0.08739} {"step": 43700, "loss": 1.0654, "grad_norm": "5.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.039e-01", "anc_loss": "9.750e-01", "dlm_acc": "5.875e-01", "anc_acc": "5.656e-01", "epoch": 0.0874} {"step": 43705, "loss": 1.4765, "grad_norm": "2.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.625e+00", "dlm_acc": "4.902e-01", "anc_acc": "4.623e-01", "epoch": 0.08741} {"step": 43710, "loss": 1.342, "grad_norm": "4.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.464e+00", "anc_loss": "1.598e+00", "dlm_acc": "5.257e-01", "anc_acc": "4.951e-01", "epoch": 0.08742} {"step": 43715, "loss": 1.4926, "grad_norm": "3.874e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.570e+00", "anc_loss": "1.653e+00", "dlm_acc": "4.363e-01", "anc_acc": "4.167e-01", "epoch": 0.08743} {"step": 43720, "loss": 1.363, "grad_norm": "2.568e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.548e+00", "dlm_acc": "5.687e-01", "anc_acc": "5.344e-01", "epoch": 0.08744} {"step": 43725, "loss": 1.5705, "grad_norm": "4.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.479e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.065e-01", "anc_acc": "4.684e-01", "epoch": 0.08745} {"step": 43730, "loss": 1.3439, "grad_norm": "6.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.313e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.460e-01", "anc_acc": "5.041e-01", "epoch": 0.08746} {"step": 43735, "loss": 1.1776, "grad_norm": "3.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.071e+00", "anc_loss": "1.179e+00", "dlm_acc": "5.961e-01", "anc_acc": "5.654e-01", "epoch": 0.08747} {"step": 43740, "loss": 1.6572, "grad_norm": "4.930e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.394e+00", "anc_loss": "1.559e+00", "dlm_acc": "5.669e-01", "anc_acc": "5.230e-01", "epoch": 0.08748} {"step": 43745, "loss": 1.4538, "grad_norm": "2.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.211e+00", "anc_loss": "1.311e+00", "dlm_acc": "5.729e-01", "anc_acc": "5.441e-01", "epoch": 0.08749} {"step": 43750, "loss": 0.9071, "grad_norm": "2.601e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.306e-01", "anc_loss": "7.863e-01", "dlm_acc": "6.596e-01", "anc_acc": "6.404e-01", "epoch": 0.0875} {"step": 43755, "loss": 1.1095, "grad_norm": "3.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.382e+00", "dlm_acc": "5.498e-01", "anc_acc": "5.186e-01", "epoch": 0.08751} {"step": 43760, "loss": 1.5298, "grad_norm": "4.085e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.352e+00", "anc_loss": "1.513e+00", "dlm_acc": "5.444e-01", "anc_acc": "5.007e-01", "epoch": 0.08752} {"step": 43765, "loss": 1.64, "grad_norm": "1.928e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.335e-01", "anc_acc": "4.753e-01", "epoch": 0.08753} {"step": 43770, "loss": 1.5499, "grad_norm": "2.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.439e+00", "anc_loss": "1.541e+00", "dlm_acc": "4.764e-01", "anc_acc": "4.533e-01", "epoch": 0.08754} {"step": 43775, "loss": 1.0479, "grad_norm": "2.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.211e+00", "dlm_acc": "5.909e-01", "anc_acc": "5.625e-01", "epoch": 0.08755} {"step": 43780, "loss": 1.1635, "grad_norm": "3.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.193e+00", "dlm_acc": "5.866e-01", "anc_acc": "5.349e-01", "epoch": 0.08756} {"step": 43785, "loss": 1.187, "grad_norm": "8.683e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.564e+00", "dlm_acc": "5.267e-01", "anc_acc": "4.927e-01", "epoch": 0.08757} {"step": 43790, "loss": 1.0478, "grad_norm": "3.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.139e+00", "dlm_acc": "5.487e-01", "anc_acc": "5.188e-01", "epoch": 0.08758} {"step": 43795, "loss": 1.0262, "grad_norm": "1.168e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.118e+00", "dlm_acc": "6.433e-01", "anc_acc": "6.076e-01", "epoch": 0.08759} {"step": 43800, "loss": 1.261, "grad_norm": "3.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.588e-01", "anc_acc": "5.020e-01", "epoch": 0.0876} {"step": 43805, "loss": 0.9547, "grad_norm": "5.193e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.547e-01", "anc_loss": "1.016e+00", "dlm_acc": "6.383e-01", "anc_acc": "5.812e-01", "epoch": 0.08761} {"step": 43810, "loss": 0.8032, "grad_norm": "3.011e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.174e+00", "anc_loss": "1.283e+00", "dlm_acc": "5.437e-01", "anc_acc": "5.120e-01", "epoch": 0.08762} {"step": 43815, "loss": 0.8519, "grad_norm": "2.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.320e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.020e-01", "epoch": 0.08763} {"step": 43820, "loss": 1.145, "grad_norm": "3.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.463e+00", "dlm_acc": "5.622e-01", "anc_acc": "5.295e-01", "epoch": 0.08764} {"step": 43825, "loss": 0.9446, "grad_norm": "3.267e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.253e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.425e-01", "anc_acc": "5.061e-01", "epoch": 0.08765} {"step": 43830, "loss": 1.0226, "grad_norm": "2.132e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.020e+00", "anc_loss": "1.108e+00", "dlm_acc": "5.970e-01", "anc_acc": "5.735e-01", "epoch": 0.08766} {"step": 43835, "loss": 1.2152, "grad_norm": "2.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.336e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.502e-01", "anc_acc": "5.116e-01", "epoch": 0.08767} {"step": 43840, "loss": 1.2112, "grad_norm": "2.092e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.990e-01", "anc_acc": "5.637e-01", "epoch": 0.08768} {"step": 43845, "loss": 1.0721, "grad_norm": "5.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.279e+00", "dlm_acc": "4.786e-01", "anc_acc": "4.512e-01", "epoch": 0.08769} {"step": 43850, "loss": 1.2881, "grad_norm": "6.031e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.471e+00", "anc_loss": "1.582e+00", "dlm_acc": "5.631e-01", "anc_acc": "5.376e-01", "epoch": 0.0877} {"step": 43855, "loss": 1.4089, "grad_norm": "1.685e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.712e+00", "dlm_acc": "5.011e-01", "anc_acc": "4.718e-01", "epoch": 0.08771} {"step": 43860, "loss": 0.8121, "grad_norm": "2.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.086e-01", "anc_loss": "1.027e+00", "dlm_acc": "6.532e-01", "anc_acc": "6.197e-01", "epoch": 0.08772} {"step": 43865, "loss": 1.4596, "grad_norm": "4.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.367e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.988e-01", "anc_acc": "5.764e-01", "epoch": 0.08773} {"step": 43870, "loss": 0.8025, "grad_norm": "3.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.305e-01", "anc_loss": "1.045e+00", "dlm_acc": "6.362e-01", "anc_acc": "6.054e-01", "epoch": 0.08774} {"step": 43875, "loss": 0.8329, "grad_norm": "4.602e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.207e-01", "anc_loss": "8.760e-01", "dlm_acc": "7.380e-01", "anc_acc": "6.942e-01", "epoch": 0.08775} {"step": 43880, "loss": 1.0868, "grad_norm": "3.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.453e-01", "anc_loss": "1.103e+00", "dlm_acc": "6.707e-01", "anc_acc": "6.255e-01", "epoch": 0.08776} {"step": 43885, "loss": 0.9923, "grad_norm": "1.877e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.130e+00", "dlm_acc": "6.426e-01", "anc_acc": "6.128e-01", "epoch": 0.08777} {"step": 43890, "loss": 1.1766, "grad_norm": "3.138e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.198e+00", "dlm_acc": "6.058e-01", "anc_acc": "5.777e-01", "epoch": 0.08778} {"step": 43895, "loss": 1.2213, "grad_norm": "5.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.245e+00", "anc_loss": "1.373e+00", "dlm_acc": "5.918e-01", "anc_acc": "5.640e-01", "epoch": 0.08779} {"step": 43900, "loss": 0.8417, "grad_norm": "4.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.250e-01", "anc_loss": "8.133e-01", "dlm_acc": "7.067e-01", "anc_acc": "6.848e-01", "epoch": 0.0878} {"step": 43905, "loss": 1.1422, "grad_norm": "3.676e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.135e+00", "anc_loss": "1.237e+00", "dlm_acc": "5.730e-01", "anc_acc": "5.498e-01", "epoch": 0.08781} {"step": 43910, "loss": 1.1443, "grad_norm": "3.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.184e+00", "dlm_acc": "6.486e-01", "anc_acc": "6.171e-01", "epoch": 0.08782} {"step": 43915, "loss": 1.3603, "grad_norm": "5.316e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.228e+00", "dlm_acc": "6.691e-01", "anc_acc": "6.270e-01", "epoch": 0.08783} {"step": 43920, "loss": 1.0848, "grad_norm": "3.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.229e-01", "anc_loss": "9.828e-01", "dlm_acc": "7.034e-01", "anc_acc": "6.569e-01", "epoch": 0.08784} {"step": 43925, "loss": 1.3917, "grad_norm": "3.713e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.540e+00", "dlm_acc": "5.299e-01", "anc_acc": "4.944e-01", "epoch": 0.08785} {"step": 43930, "loss": 1.0105, "grad_norm": "7.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.273e+00", "dlm_acc": "6.067e-01", "anc_acc": "5.510e-01", "epoch": 0.08786} {"step": 43935, "loss": 1.3732, "grad_norm": "3.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.618e-01", "anc_acc": "5.191e-01", "epoch": 0.08787} {"step": 43940, "loss": 1.5656, "grad_norm": "5.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.855e-01", "anc_loss": "7.645e-01", "dlm_acc": "6.683e-01", "anc_acc": "6.432e-01", "epoch": 0.08788} {"step": 43945, "loss": 1.1374, "grad_norm": "3.829e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.296e+00", "dlm_acc": "5.446e-01", "anc_acc": "5.053e-01", "epoch": 0.08789} {"step": 43950, "loss": 1.5607, "grad_norm": "5.434e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.433e+00", "dlm_acc": "5.383e-01", "anc_acc": "5.073e-01", "epoch": 0.0879} {"step": 43955, "loss": 1.1615, "grad_norm": "6.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.221e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.217e-01", "anc_acc": "4.844e-01", "epoch": 0.08791} {"step": 43960, "loss": 1.0714, "grad_norm": "2.104e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.839e-01", "anc_loss": "7.749e-01", "dlm_acc": "7.150e-01", "anc_acc": "6.869e-01", "epoch": 0.08792} {"step": 43965, "loss": 0.8054, "grad_norm": "3.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.743e-01", "anc_loss": "2.365e-01", "dlm_acc": "8.689e-01", "anc_acc": "8.363e-01", "epoch": 0.08793} {"step": 43970, "loss": 0.9716, "grad_norm": "2.442e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.120e-01", "anc_loss": "6.938e-01", "dlm_acc": "7.578e-01", "anc_acc": "7.300e-01", "epoch": 0.08794} {"step": 43975, "loss": 1.4237, "grad_norm": "4.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.124e+00", "anc_loss": "1.221e+00", "dlm_acc": "5.783e-01", "anc_acc": "5.486e-01", "epoch": 0.08795} {"step": 43980, "loss": 1.2799, "grad_norm": "2.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.137e-01", "anc_loss": "8.250e-01", "dlm_acc": "6.276e-01", "anc_acc": "5.781e-01", "epoch": 0.08796} {"step": 43985, "loss": 1.1933, "grad_norm": "3.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.395e+00", "dlm_acc": "5.519e-01", "anc_acc": "5.229e-01", "epoch": 0.08797} {"step": 43990, "loss": 1.3555, "grad_norm": "3.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.707e-01", "anc_loss": "1.070e+00", "dlm_acc": "6.804e-01", "anc_acc": "6.507e-01", "epoch": 0.08798} {"step": 43995, "loss": 1.3883, "grad_norm": "3.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.627e+00", "anc_loss": "1.725e+00", "dlm_acc": "4.876e-01", "anc_acc": "4.632e-01", "epoch": 0.08799} {"step": 44000, "loss": 1.5953, "grad_norm": "3.380e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.056e+00", "anc_loss": "2.208e+00", "dlm_acc": "4.056e-01", "anc_acc": "3.689e-01", "epoch": 0.088} {"step": 44005, "loss": 1.8018, "grad_norm": "3.555e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.647e+00", "anc_loss": "2.747e+00", "dlm_acc": "7.979e-02", "anc_acc": "5.858e-02", "epoch": 0.08801} {"step": 44010, "loss": 0.9415, "grad_norm": "3.104e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.193e+00", "anc_loss": "1.313e+00", "dlm_acc": "5.354e-01", "anc_acc": "5.023e-01", "epoch": 0.08802} {"step": 44015, "loss": 1.2388, "grad_norm": "3.146e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.107e+00", "anc_loss": "1.224e+00", "dlm_acc": "5.832e-01", "anc_acc": "5.522e-01", "epoch": 0.08803} {"step": 44020, "loss": 1.2266, "grad_norm": "2.591e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.071e+00", "anc_loss": "1.231e+00", "dlm_acc": "6.250e-01", "anc_acc": "5.772e-01", "epoch": 0.08804} {"step": 44025, "loss": 0.9227, "grad_norm": "3.246e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.298e+00", "dlm_acc": "5.847e-01", "anc_acc": "5.308e-01", "epoch": 0.08805} {"step": 44030, "loss": 1.0219, "grad_norm": "3.311e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.406e-01", "anc_loss": "9.508e-01", "dlm_acc": "6.977e-01", "anc_acc": "6.690e-01", "epoch": 0.08806} {"step": 44035, "loss": 1.5053, "grad_norm": "2.535e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.945e-01", "anc_loss": "1.097e+00", "dlm_acc": "6.134e-01", "anc_acc": "5.830e-01", "epoch": 0.08807} {"step": 44040, "loss": 1.4116, "grad_norm": "1.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.652e-01", "anc_acc": "5.314e-01", "epoch": 0.08808} {"step": 44045, "loss": 1.1655, "grad_norm": "3.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.625e-01", "anc_loss": "1.104e+00", "dlm_acc": "6.175e-01", "anc_acc": "5.744e-01", "epoch": 0.08809} {"step": 44050, "loss": 1.7053, "grad_norm": "4.146e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.316e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.034e-01", "anc_acc": "4.742e-01", "epoch": 0.0881} {"step": 44055, "loss": 1.4729, "grad_norm": "9.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.528e+00", "anc_loss": "1.652e+00", "dlm_acc": "4.907e-01", "anc_acc": "4.649e-01", "epoch": 0.08811} {"step": 44060, "loss": 1.0398, "grad_norm": "5.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.097e+00", "anc_loss": "1.286e+00", "dlm_acc": "6.009e-01", "anc_acc": "5.512e-01", "epoch": 0.08812} {"step": 44065, "loss": 0.8919, "grad_norm": "2.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.943e-01", "anc_loss": "5.713e-01", "dlm_acc": "7.271e-01", "anc_acc": "6.868e-01", "epoch": 0.08813} {"step": 44070, "loss": 1.058, "grad_norm": "4.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.499e+00", "anc_loss": "1.559e+00", "dlm_acc": "3.394e-01", "anc_acc": "3.258e-01", "epoch": 0.08814} {"step": 44075, "loss": 1.2419, "grad_norm": "3.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.371e-01", "anc_loss": "9.180e-01", "dlm_acc": "7.191e-01", "anc_acc": "6.995e-01", "epoch": 0.08815} {"step": 44080, "loss": 1.4244, "grad_norm": "6.388e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.570e+00", "anc_loss": "1.703e+00", "dlm_acc": "4.346e-01", "anc_acc": "3.954e-01", "epoch": 0.08816} {"step": 44085, "loss": 0.9481, "grad_norm": "8.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.091e-01", "anc_loss": "1.009e+00", "dlm_acc": "5.956e-01", "anc_acc": "5.671e-01", "epoch": 0.08817} {"step": 44090, "loss": 0.7703, "grad_norm": "5.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.969e-01", "anc_loss": "7.094e-01", "dlm_acc": "3.853e-01", "anc_acc": "3.801e-01", "epoch": 0.08818} {"step": 44095, "loss": 1.3261, "grad_norm": "6.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.088e+00", "dlm_acc": "4.635e-01", "anc_acc": "4.465e-01", "epoch": 0.08819} {"step": 44100, "loss": 1.35, "grad_norm": "6.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.603e+00", "anc_loss": "1.724e+00", "dlm_acc": "4.744e-01", "anc_acc": "4.387e-01", "epoch": 0.0882} {"step": 44105, "loss": 1.6358, "grad_norm": "6.704e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.482e-01", "anc_acc": "5.132e-01", "epoch": 0.08821} {"step": 44110, "loss": 1.7445, "grad_norm": "5.183e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.802e+00", "anc_loss": "1.894e+00", "dlm_acc": "4.094e-01", "anc_acc": "3.823e-01", "epoch": 0.08822} {"step": 44115, "loss": 2.0928, "grad_norm": "5.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.956e+00", "anc_loss": "2.991e+00", "dlm_acc": "6.669e-02", "anc_acc": "6.088e-02", "epoch": 0.08823} {"step": 44120, "loss": 1.3241, "grad_norm": "4.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.913e+00", "anc_loss": "2.008e+00", "dlm_acc": "3.926e-01", "anc_acc": "3.713e-01", "epoch": 0.08824} {"step": 44125, "loss": 1.6222, "grad_norm": "5.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.708e+00", "anc_loss": "1.817e+00", "dlm_acc": "4.825e-01", "anc_acc": "4.622e-01", "epoch": 0.08825} {"step": 44130, "loss": 1.3802, "grad_norm": "3.799e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.534e+00", "anc_loss": "1.671e+00", "dlm_acc": "5.531e-01", "anc_acc": "5.245e-01", "epoch": 0.08826} {"step": 44135, "loss": 1.0564, "grad_norm": "2.312e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.213e+00", "anc_loss": "1.348e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.210e-01", "epoch": 0.08827} {"step": 44140, "loss": 1.0309, "grad_norm": "3.910e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.023e-01", "anc_loss": "9.926e-01", "dlm_acc": "6.021e-01", "anc_acc": "5.806e-01", "epoch": 0.08828} {"step": 44145, "loss": 1.0502, "grad_norm": "2.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.922e-01", "anc_loss": "8.324e-01", "dlm_acc": "7.315e-01", "anc_acc": "7.005e-01", "epoch": 0.08829} {"step": 44150, "loss": 1.4563, "grad_norm": "2.687e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.305e-01", "anc_loss": "1.059e+00", "dlm_acc": "6.368e-01", "anc_acc": "6.001e-01", "epoch": 0.0883} {"step": 44155, "loss": 1.8588, "grad_norm": "6.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.376e+00", "anc_loss": "1.537e+00", "dlm_acc": "5.113e-01", "anc_acc": "4.711e-01", "epoch": 0.08831} {"step": 44160, "loss": 1.0434, "grad_norm": "2.864e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.978e-01", "anc_loss": "4.086e-01", "dlm_acc": "8.634e-01", "anc_acc": "8.234e-01", "epoch": 0.08832} {"step": 44165, "loss": 1.4599, "grad_norm": "4.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.031e-01", "anc_loss": "8.238e-01", "dlm_acc": "7.861e-01", "anc_acc": "7.508e-01", "epoch": 0.08833} {"step": 44170, "loss": 1.6364, "grad_norm": "4.661e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.761e+00", "dlm_acc": "4.824e-01", "anc_acc": "4.463e-01", "epoch": 0.08834} {"step": 44175, "loss": 1.2761, "grad_norm": "3.124e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.379e+00", "dlm_acc": "5.910e-01", "anc_acc": "5.520e-01", "epoch": 0.08835} {"step": 44180, "loss": 1.3312, "grad_norm": "7.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.440e+00", "anc_loss": "1.554e+00", "dlm_acc": "5.265e-01", "anc_acc": "4.966e-01", "epoch": 0.08836} {"step": 44185, "loss": 1.0331, "grad_norm": "4.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.281e-01", "anc_loss": "7.914e-01", "dlm_acc": "6.391e-01", "anc_acc": "6.200e-01", "epoch": 0.08837} {"step": 44190, "loss": 1.2041, "grad_norm": "4.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.205e+00", "dlm_acc": "5.859e-01", "anc_acc": "5.432e-01", "epoch": 0.08838} {"step": 44195, "loss": 1.7331, "grad_norm": "8.276e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.373e+00", "anc_loss": "2.683e+00", "dlm_acc": "2.681e-01", "anc_acc": "2.406e-01", "epoch": 0.08839} {"step": 44200, "loss": 1.3307, "grad_norm": "9.610e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.602e+00", "anc_loss": "1.797e+00", "dlm_acc": "4.869e-01", "anc_acc": "4.577e-01", "epoch": 0.0884} {"step": 44205, "loss": 1.6202, "grad_norm": "4.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.523e+00", "anc_loss": "1.666e+00", "dlm_acc": "5.216e-01", "anc_acc": "4.882e-01", "epoch": 0.08841} {"step": 44210, "loss": 1.541, "grad_norm": "2.766e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.298e+00", "anc_loss": "1.447e+00", "dlm_acc": "5.844e-01", "anc_acc": "5.463e-01", "epoch": 0.08842} {"step": 44215, "loss": 1.5435, "grad_norm": "7.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.270e+00", "anc_loss": "1.456e+00", "dlm_acc": "5.634e-01", "anc_acc": "5.194e-01", "epoch": 0.08843} {"step": 44220, "loss": 1.0499, "grad_norm": "3.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.235e+00", "anc_loss": "1.340e+00", "dlm_acc": "4.795e-01", "anc_acc": "4.502e-01", "epoch": 0.08844} {"step": 44225, "loss": 0.795, "grad_norm": "2.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.246e+00", "dlm_acc": "5.295e-01", "anc_acc": "4.934e-01", "epoch": 0.08845} {"step": 44230, "loss": 0.9425, "grad_norm": "1.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.945e-01", "anc_loss": "4.473e-01", "dlm_acc": "8.293e-01", "anc_acc": "8.098e-01", "epoch": 0.08846} {"step": 44235, "loss": 0.9584, "grad_norm": "4.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.322e+00", "dlm_acc": "5.911e-01", "anc_acc": "5.471e-01", "epoch": 0.08847} {"step": 44240, "loss": 0.6683, "grad_norm": "1.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.984e-01", "anc_loss": "1.184e+00", "dlm_acc": "5.984e-01", "anc_acc": "5.425e-01", "epoch": 0.08848} {"step": 44245, "loss": 0.8311, "grad_norm": "2.933e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.055e-01", "anc_loss": "1.036e+00", "dlm_acc": "6.325e-01", "anc_acc": "5.933e-01", "epoch": 0.08849} {"step": 44250, "loss": 0.963, "grad_norm": "3.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.416e+00", "dlm_acc": "5.803e-01", "anc_acc": "5.414e-01", "epoch": 0.0885} {"step": 44255, "loss": 0.7967, "grad_norm": "2.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.816e-01", "anc_loss": "1.135e+00", "dlm_acc": "5.655e-01", "anc_acc": "5.077e-01", "epoch": 0.08851} {"step": 44260, "loss": 1.0136, "grad_norm": "3.541e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.333e+00", "dlm_acc": "5.416e-01", "anc_acc": "4.975e-01", "epoch": 0.08852} {"step": 44265, "loss": 0.9192, "grad_norm": "2.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.789e-01", "anc_loss": "1.102e+00", "dlm_acc": "6.478e-01", "anc_acc": "6.142e-01", "epoch": 0.08853} {"step": 44270, "loss": 1.0508, "grad_norm": "2.316e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.262e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.310e-01", "anc_acc": "4.991e-01", "epoch": 0.08854} {"step": 44275, "loss": 1.6115, "grad_norm": "3.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.478e+00", "dlm_acc": "5.653e-01", "anc_acc": "5.338e-01", "epoch": 0.08855} {"step": 44280, "loss": 1.0384, "grad_norm": "2.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.125e-01", "anc_loss": "1.023e+00", "dlm_acc": "6.611e-01", "anc_acc": "6.289e-01", "epoch": 0.08856} {"step": 44285, "loss": 1.2622, "grad_norm": "4.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.292e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.818e-01", "anc_acc": "5.512e-01", "epoch": 0.08857} {"step": 44290, "loss": 1.1194, "grad_norm": "2.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.227e+00", "dlm_acc": "5.990e-01", "anc_acc": "5.703e-01", "epoch": 0.08858} {"step": 44295, "loss": 1.2699, "grad_norm": "2.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.600e+00", "dlm_acc": "5.071e-01", "anc_acc": "4.802e-01", "epoch": 0.08859} {"step": 44300, "loss": 1.1231, "grad_norm": "3.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.498e-01", "anc_acc": "6.237e-01", "epoch": 0.0886} {"step": 44305, "loss": 1.5253, "grad_norm": "4.549e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.706e-01", "anc_acc": "5.375e-01", "epoch": 0.08861} {"step": 44310, "loss": 0.946, "grad_norm": "2.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.161e+00", "dlm_acc": "5.638e-01", "anc_acc": "5.355e-01", "epoch": 0.08862} {"step": 44315, "loss": 0.9854, "grad_norm": "2.959e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.816e-01", "anc_loss": "1.108e+00", "dlm_acc": "6.387e-01", "anc_acc": "6.064e-01", "epoch": 0.08863} {"step": 44320, "loss": 1.2732, "grad_norm": "4.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.412e+00", "dlm_acc": "5.748e-01", "anc_acc": "5.399e-01", "epoch": 0.08864} {"step": 44325, "loss": 1.4618, "grad_norm": "3.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.361e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.495e-01", "anc_acc": "5.175e-01", "epoch": 0.08865} {"step": 44330, "loss": 1.0764, "grad_norm": "2.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.034e+00", "anc_loss": "1.181e+00", "dlm_acc": "6.448e-01", "anc_acc": "6.081e-01", "epoch": 0.08866} {"step": 44335, "loss": 1.3138, "grad_norm": "4.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.778e+00", "anc_loss": "1.920e+00", "dlm_acc": "4.870e-01", "anc_acc": "4.596e-01", "epoch": 0.08867} {"step": 44340, "loss": 0.8611, "grad_norm": "4.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.137e+00", "dlm_acc": "6.080e-01", "anc_acc": "5.760e-01", "epoch": 0.08868} {"step": 44345, "loss": 1.3323, "grad_norm": "4.761e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.609e+00", "dlm_acc": "5.486e-01", "anc_acc": "5.182e-01", "epoch": 0.08869} {"step": 44350, "loss": 1.2129, "grad_norm": "6.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.559e+00", "anc_loss": "1.678e+00", "dlm_acc": "5.007e-01", "anc_acc": "4.732e-01", "epoch": 0.0887} {"step": 44355, "loss": 1.2795, "grad_norm": "3.036e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.863e+00", "anc_loss": "1.955e+00", "dlm_acc": "3.467e-01", "anc_acc": "3.268e-01", "epoch": 0.08871} {"step": 44360, "loss": 0.9638, "grad_norm": "2.569e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.467e+00", "anc_loss": "1.589e+00", "dlm_acc": "5.056e-01", "anc_acc": "4.746e-01", "epoch": 0.08872} {"step": 44365, "loss": 1.2608, "grad_norm": "3.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.553e+00", "anc_loss": "1.666e+00", "dlm_acc": "4.263e-01", "anc_acc": "4.018e-01", "epoch": 0.08873} {"step": 44370, "loss": 1.4179, "grad_norm": "4.832e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.518e+00", "anc_loss": "1.729e+00", "dlm_acc": "5.025e-01", "anc_acc": "4.451e-01", "epoch": 0.08874} {"step": 44375, "loss": 0.9195, "grad_norm": "1.583e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.471e-01", "anc_loss": "7.541e-01", "dlm_acc": "7.750e-01", "anc_acc": "7.431e-01", "epoch": 0.08875} {"step": 44380, "loss": 1.2455, "grad_norm": "3.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.318e+00", "anc_loss": "1.396e+00", "dlm_acc": "5.184e-01", "anc_acc": "4.968e-01", "epoch": 0.08876} {"step": 44385, "loss": 0.9981, "grad_norm": "2.189e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.268e-01", "anc_loss": "8.105e-01", "dlm_acc": "6.547e-01", "anc_acc": "6.290e-01", "epoch": 0.08877} {"step": 44390, "loss": 1.6229, "grad_norm": "3.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.169e+00", "dlm_acc": "5.265e-01", "anc_acc": "4.959e-01", "epoch": 0.08878} {"step": 44395, "loss": 1.4969, "grad_norm": "3.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.554e+00", "anc_loss": "1.684e+00", "dlm_acc": "5.215e-01", "anc_acc": "4.895e-01", "epoch": 0.08879} {"step": 44400, "loss": 1.1162, "grad_norm": "2.219e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.040e+00", "anc_loss": "1.120e+00", "dlm_acc": "6.000e-01", "anc_acc": "5.838e-01", "epoch": 0.0888} {"step": 44405, "loss": 1.0192, "grad_norm": "2.125e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.746e-01", "anc_loss": "5.062e-01", "dlm_acc": "7.044e-01", "anc_acc": "6.888e-01", "epoch": 0.08881} {"step": 44410, "loss": 1.3704, "grad_norm": "2.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.422e-01", "anc_loss": "1.027e+00", "dlm_acc": "5.677e-01", "anc_acc": "5.428e-01", "epoch": 0.08882} {"step": 44415, "loss": 1.3558, "grad_norm": "2.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.832e-01", "anc_loss": "1.078e+00", "dlm_acc": "5.803e-01", "anc_acc": "5.517e-01", "epoch": 0.08883} {"step": 44420, "loss": 1.0794, "grad_norm": "2.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.984e-01", "anc_loss": "7.672e-01", "dlm_acc": "5.681e-01", "anc_acc": "5.340e-01", "epoch": 0.08884} {"step": 44425, "loss": 1.2064, "grad_norm": "5.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.066e+00", "anc_loss": "1.210e+00", "dlm_acc": "5.643e-01", "anc_acc": "5.253e-01", "epoch": 0.08885} {"step": 44430, "loss": 1.1812, "grad_norm": "2.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.016e-01", "anc_loss": "7.129e-01", "dlm_acc": "7.467e-01", "anc_acc": "7.064e-01", "epoch": 0.08886} {"step": 44435, "loss": 1.0343, "grad_norm": "2.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.090e-01", "anc_loss": "7.182e-01", "dlm_acc": "7.603e-01", "anc_acc": "7.223e-01", "epoch": 0.08887} {"step": 44440, "loss": 0.9501, "grad_norm": "1.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.578e-01", "anc_loss": "9.609e-01", "dlm_acc": "5.777e-01", "anc_acc": "5.421e-01", "epoch": 0.08888} {"step": 44445, "loss": 0.8771, "grad_norm": "2.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.492e-01", "anc_loss": "1.055e+00", "dlm_acc": "6.243e-01", "anc_acc": "5.967e-01", "epoch": 0.08889} {"step": 44450, "loss": 1.4718, "grad_norm": "3.616e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.270e+00", "dlm_acc": "6.116e-01", "anc_acc": "5.813e-01", "epoch": 0.0889} {"step": 44455, "loss": 1.2999, "grad_norm": "2.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.053e+00", "anc_loss": "1.186e+00", "dlm_acc": "5.882e-01", "anc_acc": "5.425e-01", "epoch": 0.08891} {"step": 44460, "loss": 1.2168, "grad_norm": "3.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.670e-01", "anc_acc": "5.262e-01", "epoch": 0.08892} {"step": 44465, "loss": 1.0796, "grad_norm": "1.732e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.005e+00", "anc_loss": "1.141e+00", "dlm_acc": "6.061e-01", "anc_acc": "5.714e-01", "epoch": 0.08893} {"step": 44470, "loss": 1.1284, "grad_norm": "2.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.462e-01", "anc_acc": "5.179e-01", "epoch": 0.08894} {"step": 44475, "loss": 1.135, "grad_norm": "3.994e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.629e-01", "anc_loss": "1.046e+00", "dlm_acc": "6.083e-01", "anc_acc": "5.815e-01", "epoch": 0.08895} {"step": 44480, "loss": 1.3103, "grad_norm": "2.898e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.209e+00", "anc_loss": "1.340e+00", "dlm_acc": "5.832e-01", "anc_acc": "5.459e-01", "epoch": 0.08896} {"step": 44485, "loss": 1.194, "grad_norm": "3.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.496e-01", "anc_loss": "1.096e+00", "dlm_acc": "6.620e-01", "anc_acc": "6.232e-01", "epoch": 0.08897} {"step": 44490, "loss": 1.0918, "grad_norm": "5.175e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.219e-01", "anc_loss": "8.262e-01", "dlm_acc": "6.950e-01", "anc_acc": "6.598e-01", "epoch": 0.08898} {"step": 44495, "loss": 1.1061, "grad_norm": "2.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.270e-01", "anc_loss": "9.531e-01", "dlm_acc": "6.251e-01", "anc_acc": "5.709e-01", "epoch": 0.08899} {"step": 44500, "loss": 1.3135, "grad_norm": "6.563e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.664e-01", "anc_loss": "8.961e-01", "dlm_acc": "6.637e-01", "anc_acc": "6.138e-01", "epoch": 0.089} {"step": 44505, "loss": 1.2523, "grad_norm": "3.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.297e-01", "anc_loss": "9.477e-01", "dlm_acc": "5.999e-01", "anc_acc": "5.520e-01", "epoch": 0.08901} {"step": 44510, "loss": 1.1256, "grad_norm": "2.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.035e-01", "anc_loss": "8.961e-01", "dlm_acc": "5.964e-01", "anc_acc": "5.667e-01", "epoch": 0.08902} {"step": 44515, "loss": 1.1008, "grad_norm": "2.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.555e-01", "anc_loss": "7.750e-01", "dlm_acc": "4.513e-01", "anc_acc": "4.404e-01", "epoch": 0.08903} {"step": 44520, "loss": 1.4509, "grad_norm": "1.770e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.281e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.697e-01", "anc_acc": "5.354e-01", "epoch": 0.08904} {"step": 44525, "loss": 1.26, "grad_norm": "1.692e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.261e+00", "dlm_acc": "5.323e-01", "anc_acc": "4.999e-01", "epoch": 0.08905} {"step": 44530, "loss": 1.0887, "grad_norm": "5.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.164e-01", "anc_loss": "8.891e-01", "dlm_acc": "5.333e-01", "anc_acc": "5.124e-01", "epoch": 0.08906} {"step": 44535, "loss": 0.9616, "grad_norm": "2.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.684e-01", "anc_loss": "9.023e-01", "dlm_acc": "6.038e-01", "anc_acc": "5.593e-01", "epoch": 0.08907} {"step": 44540, "loss": 1.0462, "grad_norm": "3.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.616e-01", "anc_loss": "8.983e-01", "dlm_acc": "7.320e-01", "anc_acc": "6.879e-01", "epoch": 0.08908} {"step": 44545, "loss": 1.284, "grad_norm": "4.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.404e+00", "dlm_acc": "5.853e-01", "anc_acc": "5.449e-01", "epoch": 0.08909} {"step": 44550, "loss": 0.8197, "grad_norm": "4.070e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.190e+00", "dlm_acc": "6.251e-01", "anc_acc": "5.723e-01", "epoch": 0.0891} {"step": 44555, "loss": 1.1422, "grad_norm": "3.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.167e+00", "anc_loss": "1.278e+00", "dlm_acc": "5.514e-01", "anc_acc": "5.235e-01", "epoch": 0.08911} {"step": 44560, "loss": 1.0617, "grad_norm": "2.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.176e+00", "anc_loss": "1.319e+00", "dlm_acc": "5.983e-01", "anc_acc": "5.682e-01", "epoch": 0.08912} {"step": 44565, "loss": 0.8575, "grad_norm": "6.279e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.812e-01", "anc_loss": "1.040e+00", "dlm_acc": "6.603e-01", "anc_acc": "6.065e-01", "epoch": 0.08913} {"step": 44570, "loss": 1.3834, "grad_norm": "7.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.241e-01", "anc_acc": "4.854e-01", "epoch": 0.08914} {"step": 44575, "loss": 0.8755, "grad_norm": "4.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.337e-01", "anc_loss": "4.992e-01", "dlm_acc": "8.208e-01", "anc_acc": "7.998e-01", "epoch": 0.08915} {"step": 44580, "loss": 1.139, "grad_norm": "4.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.098e-01", "anc_loss": "9.051e-01", "dlm_acc": "6.518e-01", "anc_acc": "6.246e-01", "epoch": 0.08916} {"step": 44585, "loss": 1.351, "grad_norm": "3.958e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.406e-01", "anc_loss": "9.531e-01", "dlm_acc": "6.877e-01", "anc_acc": "6.628e-01", "epoch": 0.08917} {"step": 44590, "loss": 0.9427, "grad_norm": "4.231e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.132e+00", "dlm_acc": "6.210e-01", "anc_acc": "5.925e-01", "epoch": 0.08918} {"step": 44595, "loss": 0.8566, "grad_norm": "9.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.766e-01", "anc_loss": "4.264e-01", "dlm_acc": "7.815e-01", "anc_acc": "7.597e-01", "epoch": 0.08919} {"step": 44600, "loss": 0.9815, "grad_norm": "3.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.309e-01", "anc_loss": "3.918e-01", "dlm_acc": "7.996e-01", "anc_acc": "7.677e-01", "epoch": 0.0892} {"step": 44605, "loss": 0.6548, "grad_norm": "3.740e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.234e-01", "anc_loss": "4.863e-01", "dlm_acc": "7.473e-01", "anc_acc": "7.164e-01", "epoch": 0.08921} {"step": 44610, "loss": 0.5875, "grad_norm": "2.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.506e-01", "anc_loss": "3.977e-01", "dlm_acc": "7.435e-01", "anc_acc": "7.175e-01", "epoch": 0.08922} {"step": 44615, "loss": 0.8979, "grad_norm": "2.921e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.619e-01", "anc_loss": "5.242e-01", "dlm_acc": "7.240e-01", "anc_acc": "6.974e-01", "epoch": 0.08923} {"step": 44620, "loss": 0.8168, "grad_norm": "2.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.527e-01", "anc_loss": "9.531e-01", "dlm_acc": "6.598e-01", "anc_acc": "6.312e-01", "epoch": 0.08924} {"step": 44625, "loss": 0.8847, "grad_norm": "3.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.893e-01", "anc_loss": "3.068e-01", "dlm_acc": "8.065e-01", "anc_acc": "7.995e-01", "epoch": 0.08925} {"step": 44630, "loss": 0.7816, "grad_norm": "2.819e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.758e-01", "anc_loss": "2.908e-01", "dlm_acc": "8.131e-01", "anc_acc": "8.072e-01", "epoch": 0.08926} {"step": 44635, "loss": 0.8616, "grad_norm": "1.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.166e-01", "anc_loss": "4.422e-01", "dlm_acc": "7.318e-01", "anc_acc": "7.210e-01", "epoch": 0.08927} {"step": 44640, "loss": 0.7114, "grad_norm": "1.143e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.726e-02", "anc_loss": "2.882e-02", "dlm_acc": "9.835e-01", "anc_acc": "9.814e-01", "epoch": 0.08928} {"step": 44645, "loss": 1.0072, "grad_norm": "5.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.672e-01", "anc_loss": "9.516e-01", "dlm_acc": "6.126e-01", "anc_acc": "5.919e-01", "epoch": 0.08929} {"step": 44650, "loss": 0.6221, "grad_norm": "2.180e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.982e-01", "anc_loss": "6.914e-01", "dlm_acc": "7.419e-01", "anc_acc": "7.159e-01", "epoch": 0.0893} {"step": 44655, "loss": 0.8033, "grad_norm": "3.031e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.030e-01", "anc_loss": "5.707e-01", "dlm_acc": "8.016e-01", "anc_acc": "7.808e-01", "epoch": 0.08931} {"step": 44660, "loss": 1.1535, "grad_norm": "3.052e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.138e+00", "dlm_acc": "6.195e-01", "anc_acc": "6.028e-01", "epoch": 0.08932} {"step": 44665, "loss": 1.2149, "grad_norm": "5.567e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.000e-01", "anc_loss": "8.586e-01", "dlm_acc": "5.755e-01", "anc_acc": "5.617e-01", "epoch": 0.08933} {"step": 44670, "loss": 1.1339, "grad_norm": "3.363e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.920e-01", "anc_loss": "8.777e-01", "dlm_acc": "6.872e-01", "anc_acc": "6.619e-01", "epoch": 0.08934} {"step": 44675, "loss": 1.2448, "grad_norm": "3.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.264e+00", "anc_loss": "1.389e+00", "dlm_acc": "5.727e-01", "anc_acc": "5.428e-01", "epoch": 0.08935} {"step": 44680, "loss": 0.8812, "grad_norm": "2.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.816e-01", "anc_loss": "8.738e-01", "dlm_acc": "6.816e-01", "anc_acc": "6.611e-01", "epoch": 0.08936} {"step": 44685, "loss": 0.9744, "grad_norm": "2.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.644e-01", "anc_loss": "6.132e-01", "dlm_acc": "7.976e-01", "anc_acc": "7.858e-01", "epoch": 0.08937} {"step": 44690, "loss": 0.8896, "grad_norm": "7.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.016e-01", "anc_loss": "8.234e-01", "dlm_acc": "4.913e-01", "anc_acc": "4.804e-01", "epoch": 0.08938} {"step": 44695, "loss": 1.1615, "grad_norm": "2.997e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.867e-01", "anc_loss": "1.030e+00", "dlm_acc": "4.483e-01", "anc_acc": "4.326e-01", "epoch": 0.08939} {"step": 44700, "loss": 1.2521, "grad_norm": "3.122e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.113e+00", "dlm_acc": "5.940e-01", "anc_acc": "5.736e-01", "epoch": 0.0894} {"step": 44705, "loss": 1.244, "grad_norm": "1.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.180e+00", "dlm_acc": "3.958e-01", "anc_acc": "3.863e-01", "epoch": 0.08941} {"step": 44710, "loss": 1.0277, "grad_norm": "2.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.582e-01", "anc_loss": "6.813e-01", "dlm_acc": "6.096e-01", "anc_acc": "5.967e-01", "epoch": 0.08942} {"step": 44715, "loss": 1.0048, "grad_norm": "2.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.063e+00", "anc_loss": "1.158e+00", "dlm_acc": "6.363e-01", "anc_acc": "6.106e-01", "epoch": 0.08943} {"step": 44720, "loss": 1.1256, "grad_norm": "8.275e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.262e-01", "anc_loss": "7.302e-01", "dlm_acc": "7.448e-01", "anc_acc": "7.192e-01", "epoch": 0.08944} {"step": 44725, "loss": 1.2057, "grad_norm": "2.636e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.258e-01", "anc_loss": "1.054e+00", "dlm_acc": "6.687e-01", "anc_acc": "6.386e-01", "epoch": 0.08945} {"step": 44730, "loss": 0.849, "grad_norm": "2.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.841e-01", "anc_loss": "1.070e+00", "dlm_acc": "6.946e-01", "anc_acc": "6.716e-01", "epoch": 0.08946} {"step": 44735, "loss": 1.2002, "grad_norm": "1.934e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.324e-01", "anc_loss": "7.145e-01", "dlm_acc": "7.378e-01", "anc_acc": "7.145e-01", "epoch": 0.08947} {"step": 44740, "loss": 1.2326, "grad_norm": "3.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.391e-01", "anc_acc": "5.119e-01", "epoch": 0.08948} {"step": 44745, "loss": 1.3808, "grad_norm": "4.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.244e+00", "dlm_acc": "6.072e-01", "anc_acc": "5.765e-01", "epoch": 0.08949} {"step": 44750, "loss": 1.2344, "grad_norm": "4.884e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.849e-01", "anc_loss": "2.026e-01", "dlm_acc": "8.945e-01", "anc_acc": "8.871e-01", "epoch": 0.0895} {"step": 44755, "loss": 0.9594, "grad_norm": "4.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.479e-02", "anc_loss": "1.034e-01", "dlm_acc": "9.455e-01", "anc_acc": "9.411e-01", "epoch": 0.08951} {"step": 44760, "loss": 1.1882, "grad_norm": "3.560e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.865e-01", "anc_loss": "5.269e-01", "dlm_acc": "8.049e-01", "anc_acc": "7.917e-01", "epoch": 0.08952} {"step": 44765, "loss": 1.2165, "grad_norm": "3.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.707e-01", "anc_loss": "9.355e-01", "dlm_acc": "6.277e-01", "anc_acc": "6.081e-01", "epoch": 0.08953} {"step": 44770, "loss": 0.875, "grad_norm": "3.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.635e-01", "anc_loss": "6.368e-01", "dlm_acc": "7.727e-01", "anc_acc": "7.526e-01", "epoch": 0.08954} {"step": 44775, "loss": 1.0574, "grad_norm": "2.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.534e-01", "anc_loss": "6.260e-01", "dlm_acc": "8.070e-01", "anc_acc": "7.823e-01", "epoch": 0.08955} {"step": 44780, "loss": 1.2979, "grad_norm": "7.308e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.195e-01", "anc_loss": "9.387e-01", "dlm_acc": "7.348e-01", "anc_acc": "7.018e-01", "epoch": 0.08956} {"step": 44785, "loss": 0.8868, "grad_norm": "3.452e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.368e-01", "anc_loss": "7.028e-01", "dlm_acc": "7.130e-01", "anc_acc": "6.919e-01", "epoch": 0.08957} {"step": 44790, "loss": 0.8574, "grad_norm": "2.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.052e-01", "anc_loss": "6.006e-01", "dlm_acc": "7.897e-01", "anc_acc": "7.614e-01", "epoch": 0.08958} {"step": 44795, "loss": 1.2149, "grad_norm": "4.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.406e-01", "anc_loss": "1.091e+00", "dlm_acc": "6.338e-01", "anc_acc": "5.918e-01", "epoch": 0.08959} {"step": 44800, "loss": 1.5433, "grad_norm": "3.277e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.907e-01", "anc_acc": "5.674e-01", "epoch": 0.0896} {"step": 44805, "loss": 0.9658, "grad_norm": "3.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.674e-01", "anc_loss": "3.736e-01", "dlm_acc": "7.389e-01", "anc_acc": "7.335e-01", "epoch": 0.08961} {"step": 44810, "loss": 1.1692, "grad_norm": "7.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.078e-01", "anc_loss": "6.709e-01", "dlm_acc": "7.211e-01", "anc_acc": "7.072e-01", "epoch": 0.08962} {"step": 44815, "loss": 1.2388, "grad_norm": "3.130e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.542e-01", "anc_loss": "9.463e-01", "dlm_acc": "7.092e-01", "anc_acc": "6.868e-01", "epoch": 0.08963} {"step": 44820, "loss": 1.5136, "grad_norm": "5.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.092e+00", "anc_loss": "1.204e+00", "dlm_acc": "6.057e-01", "anc_acc": "5.741e-01", "epoch": 0.08964} {"step": 44825, "loss": 1.4058, "grad_norm": "4.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.619e+00", "anc_loss": "1.748e+00", "dlm_acc": "4.972e-01", "anc_acc": "4.682e-01", "epoch": 0.08965} {"step": 44830, "loss": 1.4364, "grad_norm": "4.575e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.672e+00", "anc_loss": "1.798e+00", "dlm_acc": "4.667e-01", "anc_acc": "4.416e-01", "epoch": 0.08966} {"step": 44835, "loss": 1.5641, "grad_norm": "3.554e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.444e+00", "anc_loss": "1.575e+00", "dlm_acc": "5.234e-01", "anc_acc": "4.925e-01", "epoch": 0.08967} {"step": 44840, "loss": 1.3149, "grad_norm": "4.934e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.438e+00", "anc_loss": "1.556e+00", "dlm_acc": "5.259e-01", "anc_acc": "4.982e-01", "epoch": 0.08968} {"step": 44845, "loss": 1.6114, "grad_norm": "3.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.697e+00", "anc_loss": "1.803e+00", "dlm_acc": "4.126e-01", "anc_acc": "3.870e-01", "epoch": 0.08969} {"step": 44850, "loss": 2.0159, "grad_norm": "3.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.863e+00", "anc_loss": "1.972e+00", "dlm_acc": "2.987e-01", "anc_acc": "2.716e-01", "epoch": 0.0897} {"step": 44855, "loss": 1.4626, "grad_norm": "3.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.481e+00", "anc_loss": "1.598e+00", "dlm_acc": "3.530e-01", "anc_acc": "3.250e-01", "epoch": 0.08971} {"step": 44860, "loss": 1.2181, "grad_norm": "2.408e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.259e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.209e-01", "anc_acc": "4.918e-01", "epoch": 0.08972} {"step": 44865, "loss": 1.2802, "grad_norm": "5.251e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.226e+00", "dlm_acc": "6.136e-01", "anc_acc": "5.887e-01", "epoch": 0.08973} {"step": 44870, "loss": 0.8642, "grad_norm": "2.750e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.072e+00", "anc_loss": "1.194e+00", "dlm_acc": "6.082e-01", "anc_acc": "5.784e-01", "epoch": 0.08974} {"step": 44875, "loss": 1.1771, "grad_norm": "2.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.211e+00", "dlm_acc": "5.893e-01", "anc_acc": "5.465e-01", "epoch": 0.08975} {"step": 44880, "loss": 1.3423, "grad_norm": "3.942e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.549e+00", "dlm_acc": "5.181e-01", "anc_acc": "4.903e-01", "epoch": 0.08976} {"step": 44885, "loss": 1.2716, "grad_norm": "2.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.192e+00", "anc_loss": "1.308e+00", "dlm_acc": "5.282e-01", "anc_acc": "5.006e-01", "epoch": 0.08977} {"step": 44890, "loss": 1.4882, "grad_norm": "4.051e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.372e+00", "anc_loss": "1.512e+00", "dlm_acc": "5.341e-01", "anc_acc": "4.971e-01", "epoch": 0.08978} {"step": 44895, "loss": 1.4937, "grad_norm": "3.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.602e-01", "anc_loss": "7.383e-01", "dlm_acc": "6.936e-01", "anc_acc": "6.647e-01", "epoch": 0.08979} {"step": 44900, "loss": 1.3285, "grad_norm": "4.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.741e+00", "dlm_acc": "4.631e-01", "anc_acc": "4.368e-01", "epoch": 0.0898} {"step": 44905, "loss": 1.6175, "grad_norm": "5.235e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.727e+00", "anc_loss": "1.848e+00", "dlm_acc": "4.399e-01", "anc_acc": "4.141e-01", "epoch": 0.08981} {"step": 44910, "loss": 1.294, "grad_norm": "4.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.243e-01", "anc_acc": "4.962e-01", "epoch": 0.08982} {"step": 44915, "loss": 0.7959, "grad_norm": "2.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.707e-01", "anc_loss": "6.133e-01", "dlm_acc": "4.873e-01", "anc_acc": "4.502e-01", "epoch": 0.08983} {"step": 44920, "loss": 1.1533, "grad_norm": "2.849e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.562e-01", "anc_loss": "9.008e-01", "dlm_acc": "4.270e-01", "anc_acc": "4.070e-01", "epoch": 0.08984} {"step": 44925, "loss": 1.2041, "grad_norm": "3.136e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.762e-01", "anc_loss": "7.562e-01", "dlm_acc": "5.931e-01", "anc_acc": "5.550e-01", "epoch": 0.08985} {"step": 44930, "loss": 1.342, "grad_norm": "4.407e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.477e-01", "anc_loss": "6.871e-01", "dlm_acc": "5.448e-01", "anc_acc": "5.206e-01", "epoch": 0.08986} {"step": 44935, "loss": 1.1864, "grad_norm": "3.718e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.125e-01", "anc_loss": "7.297e-01", "dlm_acc": "4.689e-01", "anc_acc": "4.564e-01", "epoch": 0.08987} {"step": 44940, "loss": 1.2712, "grad_norm": "2.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.391e-01", "anc_loss": "7.574e-01", "dlm_acc": "4.817e-01", "anc_acc": "4.732e-01", "epoch": 0.08988} {"step": 44945, "loss": 1.245, "grad_norm": "4.587e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.203e-01", "anc_loss": "7.383e-01", "dlm_acc": "4.586e-01", "anc_acc": "4.513e-01", "epoch": 0.08989} {"step": 44950, "loss": 1.0611, "grad_norm": "3.040e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.953e-01", "anc_loss": "6.039e-01", "dlm_acc": "4.881e-01", "anc_acc": "4.821e-01", "epoch": 0.0899} {"step": 44955, "loss": 1.2268, "grad_norm": "2.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.172e-01", "anc_loss": "9.922e-01", "dlm_acc": "5.050e-01", "anc_acc": "4.806e-01", "epoch": 0.08991} {"step": 44960, "loss": 1.1447, "grad_norm": "3.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.812e-01", "anc_loss": "1.036e+00", "dlm_acc": "5.736e-01", "anc_acc": "5.565e-01", "epoch": 0.08992} {"step": 44965, "loss": 1.2804, "grad_norm": "3.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.719e-01", "anc_loss": "6.816e-01", "dlm_acc": "5.800e-01", "anc_acc": "5.759e-01", "epoch": 0.08993} {"step": 44970, "loss": 1.4225, "grad_norm": "3.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.492e-01", "anc_loss": "7.555e-01", "dlm_acc": "5.641e-01", "anc_acc": "5.618e-01", "epoch": 0.08994} {"step": 44975, "loss": 1.0399, "grad_norm": "3.339e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.043e-01", "anc_loss": "6.098e-01", "dlm_acc": "5.928e-01", "anc_acc": "5.904e-01", "epoch": 0.08995} {"step": 44980, "loss": 1.328, "grad_norm": "3.324e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.602e-01", "anc_loss": "6.672e-01", "dlm_acc": "5.737e-01", "anc_acc": "5.706e-01", "epoch": 0.08996} {"step": 44985, "loss": 0.9443, "grad_norm": "2.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.646e-01", "anc_loss": "4.787e-01", "dlm_acc": "6.395e-01", "anc_acc": "6.298e-01", "epoch": 0.08997} {"step": 44990, "loss": 1.0358, "grad_norm": "2.611e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.971e-01", "anc_loss": "5.149e-01", "dlm_acc": "6.830e-01", "anc_acc": "6.702e-01", "epoch": 0.08998} {"step": 44995, "loss": 1.1364, "grad_norm": "1.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.645e-01", "anc_loss": "6.852e-01", "dlm_acc": "5.571e-01", "anc_acc": "5.465e-01", "epoch": 0.08999} {"step": 45000, "loss": 1.7992, "grad_norm": "5.486e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.086e+00", "anc_loss": "1.216e+00", "dlm_acc": "6.006e-01", "anc_acc": "5.636e-01", "epoch": 0.09} {"step": 45005, "loss": 1.452, "grad_norm": "3.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.171e+00", "dlm_acc": "5.707e-01", "anc_acc": "5.479e-01", "epoch": 0.09001} {"step": 45010, "loss": 1.2422, "grad_norm": "3.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.184e-01", "anc_loss": "9.852e-01", "dlm_acc": "5.572e-01", "anc_acc": "5.301e-01", "epoch": 0.09002} {"step": 45015, "loss": 1.352, "grad_norm": "4.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.093e+00", "anc_loss": "1.212e+00", "dlm_acc": "5.924e-01", "anc_acc": "5.647e-01", "epoch": 0.09003} {"step": 45020, "loss": 1.1117, "grad_norm": "4.254e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.862e-01", "anc_loss": "6.564e-01", "dlm_acc": "7.498e-01", "anc_acc": "7.280e-01", "epoch": 0.09004} {"step": 45025, "loss": 1.456, "grad_norm": "3.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.762e-01", "anc_loss": "7.910e-01", "dlm_acc": "6.496e-01", "anc_acc": "6.129e-01", "epoch": 0.09005} {"step": 45030, "loss": 1.3023, "grad_norm": "3.788e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.531e-01", "anc_loss": "6.687e-01", "dlm_acc": "4.896e-01", "anc_acc": "4.820e-01", "epoch": 0.09006} {"step": 45035, "loss": 1.3328, "grad_norm": "3.449e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.678e-01", "anc_loss": "6.327e-01", "dlm_acc": "7.197e-01", "anc_acc": "6.944e-01", "epoch": 0.09007} {"step": 45040, "loss": 0.96, "grad_norm": "3.682e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.037e-01", "anc_loss": "7.384e-01", "dlm_acc": "6.828e-01", "anc_acc": "6.721e-01", "epoch": 0.09008} {"step": 45045, "loss": 0.5974, "grad_norm": "2.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.034e-01", "anc_loss": "2.313e-01", "dlm_acc": "8.532e-01", "anc_acc": "8.367e-01", "epoch": 0.09009} {"step": 45050, "loss": 0.7445, "grad_norm": "4.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.289e-01", "anc_loss": "3.586e-01", "dlm_acc": "7.606e-01", "anc_acc": "7.427e-01", "epoch": 0.0901} {"step": 45055, "loss": 1.0167, "grad_norm": "2.478e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.275e-01", "anc_loss": "3.674e-01", "dlm_acc": "7.834e-01", "anc_acc": "7.618e-01", "epoch": 0.09011} {"step": 45060, "loss": 0.9125, "grad_norm": "2.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.363e-01", "anc_loss": "3.646e-01", "dlm_acc": "7.588e-01", "anc_acc": "7.406e-01", "epoch": 0.09012} {"step": 45065, "loss": 1.2137, "grad_norm": "3.827e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.535e-01", "anc_loss": "3.961e-01", "dlm_acc": "7.985e-01", "anc_acc": "7.742e-01", "epoch": 0.09013} {"step": 45070, "loss": 1.0014, "grad_norm": "2.312e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.171e-01", "anc_loss": "4.308e-01", "dlm_acc": "6.919e-01", "anc_acc": "6.850e-01", "epoch": 0.09014} {"step": 45075, "loss": 1.2286, "grad_norm": "4.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.602e-01", "anc_loss": "9.539e-01", "dlm_acc": "6.389e-01", "anc_acc": "6.127e-01", "epoch": 0.09015} {"step": 45080, "loss": 0.9765, "grad_norm": "3.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.355e-01", "anc_loss": "1.030e+00", "dlm_acc": "5.628e-01", "anc_acc": "5.331e-01", "epoch": 0.09016} {"step": 45085, "loss": 1.0624, "grad_norm": "2.733e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.092e+00", "anc_loss": "1.197e+00", "dlm_acc": "5.797e-01", "anc_acc": "5.500e-01", "epoch": 0.09017} {"step": 45090, "loss": 1.0826, "grad_norm": "3.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.542e+00", "dlm_acc": "5.637e-01", "anc_acc": "5.369e-01", "epoch": 0.09018} {"step": 45095, "loss": 0.8104, "grad_norm": "2.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.100e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.873e-01", "anc_acc": "5.581e-01", "epoch": 0.09019} {"step": 45100, "loss": 1.5951, "grad_norm": "4.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.131e+00", "dlm_acc": "5.017e-01", "anc_acc": "4.860e-01", "epoch": 0.0902} {"step": 45105, "loss": 1.1477, "grad_norm": "2.814e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.871e-01", "anc_acc": "5.575e-01", "epoch": 0.09021} {"step": 45110, "loss": 1.2074, "grad_norm": "3.744e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.758e-01", "anc_loss": "1.065e+00", "dlm_acc": "5.952e-01", "anc_acc": "5.722e-01", "epoch": 0.09022} {"step": 45115, "loss": 1.1615, "grad_norm": "3.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.110e+00", "anc_loss": "1.219e+00", "dlm_acc": "5.776e-01", "anc_acc": "5.470e-01", "epoch": 0.09023} {"step": 45120, "loss": 1.0639, "grad_norm": "5.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.249e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.654e-01", "anc_acc": "5.438e-01", "epoch": 0.09024} {"step": 45125, "loss": 1.145, "grad_norm": "3.907e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.059e-01", "anc_loss": "7.902e-01", "dlm_acc": "6.154e-01", "anc_acc": "5.843e-01", "epoch": 0.09025} {"step": 45130, "loss": 1.2005, "grad_norm": "4.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.098e+00", "anc_loss": "1.185e+00", "dlm_acc": "6.188e-01", "anc_acc": "5.899e-01", "epoch": 0.09026} {"step": 45135, "loss": 1.1235, "grad_norm": "4.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.266e-01", "anc_loss": "1.006e+00", "dlm_acc": "5.929e-01", "anc_acc": "5.695e-01", "epoch": 0.09027} {"step": 45140, "loss": 1.1488, "grad_norm": "2.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.313e-01", "anc_loss": "8.992e-01", "dlm_acc": "5.819e-01", "anc_acc": "5.587e-01", "epoch": 0.09028} {"step": 45145, "loss": 1.1513, "grad_norm": "3.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.043e-01", "anc_loss": "9.797e-01", "dlm_acc": "5.616e-01", "anc_acc": "5.322e-01", "epoch": 0.09029} {"step": 45150, "loss": 1.2341, "grad_norm": "5.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.922e-01", "anc_loss": "1.094e+00", "dlm_acc": "5.743e-01", "anc_acc": "5.479e-01", "epoch": 0.0903} {"step": 45155, "loss": 1.228, "grad_norm": "1.803e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.338e-01", "anc_loss": "5.532e-01", "dlm_acc": "6.152e-01", "anc_acc": "6.029e-01", "epoch": 0.09031} {"step": 45160, "loss": 1.6137, "grad_norm": "3.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.393e-01", "anc_loss": "7.086e-01", "dlm_acc": "6.887e-01", "anc_acc": "6.540e-01", "epoch": 0.09032} {"step": 45165, "loss": 1.2342, "grad_norm": "4.240e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.977e-01", "anc_loss": "9.379e-01", "dlm_acc": "5.708e-01", "anc_acc": "5.550e-01", "epoch": 0.09033} {"step": 45170, "loss": 0.9105, "grad_norm": "3.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.293e-01", "anc_loss": "7.340e-01", "dlm_acc": "5.440e-01", "anc_acc": "5.421e-01", "epoch": 0.09034} {"step": 45175, "loss": 0.7315, "grad_norm": "1.840e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.492e-01", "anc_loss": "6.523e-01", "dlm_acc": "5.573e-01", "anc_acc": "5.561e-01", "epoch": 0.09035} {"step": 45180, "loss": 0.7426, "grad_norm": "2.408e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.594e-01", "anc_loss": "6.609e-01", "dlm_acc": "5.597e-01", "anc_acc": "5.591e-01", "epoch": 0.09036} {"step": 45185, "loss": 0.8861, "grad_norm": "1.186e+00", "learning_rate": "1.000e-04", "dlm_loss": "5.871e-01", "anc_loss": "5.906e-01", "dlm_acc": "5.728e-01", "anc_acc": "5.710e-01", "epoch": 0.09037} {"step": 45190, "loss": 1.045, "grad_norm": "4.075e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.523e-01", "anc_loss": "6.578e-01", "dlm_acc": "5.498e-01", "anc_acc": "5.476e-01", "epoch": 0.09038} {"step": 45195, "loss": 0.8933, "grad_norm": "2.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.734e-01", "anc_loss": "6.961e-01", "dlm_acc": "5.726e-01", "anc_acc": "5.664e-01", "epoch": 0.09039} {"step": 45200, "loss": 1.226, "grad_norm": "7.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.211e-01", "anc_loss": "9.117e-01", "dlm_acc": "6.248e-01", "anc_acc": "5.969e-01", "epoch": 0.0904} {"step": 45205, "loss": 1.112, "grad_norm": "4.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.104e+00", "anc_loss": "1.203e+00", "dlm_acc": "5.500e-01", "anc_acc": "5.221e-01", "epoch": 0.09041} {"step": 45210, "loss": 1.1077, "grad_norm": "4.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.477e-01", "anc_loss": "8.109e-01", "dlm_acc": "6.575e-01", "anc_acc": "6.331e-01", "epoch": 0.09042} {"step": 45215, "loss": 0.9382, "grad_norm": "4.194e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.939e-01", "anc_loss": "3.408e-01", "dlm_acc": "7.760e-01", "anc_acc": "7.446e-01", "epoch": 0.09043} {"step": 45220, "loss": 1.1323, "grad_norm": "3.169e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.461e-01", "anc_loss": "5.996e-01", "dlm_acc": "6.866e-01", "anc_acc": "6.611e-01", "epoch": 0.09044} {"step": 45225, "loss": 0.8545, "grad_norm": "1.375e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.605e-01", "anc_loss": "8.253e-01", "dlm_acc": "6.660e-01", "anc_acc": "6.455e-01", "epoch": 0.09045} {"step": 45230, "loss": 1.1468, "grad_norm": "5.173e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.092e+00", "anc_loss": "1.184e+00", "dlm_acc": "5.913e-01", "anc_acc": "5.674e-01", "epoch": 0.09046} {"step": 45235, "loss": 1.1636, "grad_norm": "3.398e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.264e+00", "anc_loss": "1.409e+00", "dlm_acc": "5.833e-01", "anc_acc": "5.489e-01", "epoch": 0.09047} {"step": 45240, "loss": 0.7617, "grad_norm": "2.274e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.177e-01", "anc_loss": "3.783e-01", "dlm_acc": "8.069e-01", "anc_acc": "7.856e-01", "epoch": 0.09048} {"step": 45245, "loss": 1.1663, "grad_norm": "3.127e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.127e+00", "dlm_acc": "6.536e-01", "anc_acc": "6.233e-01", "epoch": 0.09049} {"step": 45250, "loss": 1.0107, "grad_norm": "3.565e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.117e-01", "anc_loss": "9.014e-01", "dlm_acc": "6.616e-01", "anc_acc": "6.384e-01", "epoch": 0.0905} {"step": 45255, "loss": 1.5704, "grad_norm": "4.134e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.693e+00", "anc_loss": "1.797e+00", "dlm_acc": "4.547e-01", "anc_acc": "4.339e-01", "epoch": 0.09051} {"step": 45260, "loss": 1.1102, "grad_norm": "6.623e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.158e-01", "anc_loss": "1.014e+00", "dlm_acc": "6.771e-01", "anc_acc": "6.486e-01", "epoch": 0.09052} {"step": 45265, "loss": 0.946, "grad_norm": "3.977e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.017e+00", "anc_loss": "1.098e+00", "dlm_acc": "5.066e-01", "anc_acc": "4.831e-01", "epoch": 0.09053} {"step": 45270, "loss": 0.8287, "grad_norm": "2.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.518e-01", "anc_loss": "5.902e-01", "dlm_acc": "7.240e-01", "anc_acc": "7.113e-01", "epoch": 0.09054} {"step": 45275, "loss": 0.8459, "grad_norm": "5.364e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.592e-01", "anc_loss": "2.709e-01", "dlm_acc": "8.124e-01", "anc_acc": "8.052e-01", "epoch": 0.09055} {"step": 45280, "loss": 1.2758, "grad_norm": "3.320e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.473e-01", "anc_loss": "3.617e-01", "dlm_acc": "7.504e-01", "anc_acc": "7.429e-01", "epoch": 0.09056} {"step": 45285, "loss": 0.6523, "grad_norm": "3.767e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.367e-01", "anc_loss": "5.512e-01", "dlm_acc": "5.658e-01", "anc_acc": "5.567e-01", "epoch": 0.09057} {"step": 45290, "loss": 0.7756, "grad_norm": "3.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.547e-01", "anc_loss": "5.723e-01", "dlm_acc": "5.532e-01", "anc_acc": "5.399e-01", "epoch": 0.09058} {"step": 45295, "loss": 1.0035, "grad_norm": "2.872e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.594e-01", "anc_loss": "8.055e-01", "dlm_acc": "5.496e-01", "anc_acc": "5.354e-01", "epoch": 0.09059} {"step": 45300, "loss": 1.0294, "grad_norm": "3.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.143e-01", "anc_loss": "9.926e-01", "dlm_acc": "6.544e-01", "anc_acc": "6.336e-01", "epoch": 0.0906} {"step": 45305, "loss": 1.0411, "grad_norm": "2.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.615e-01", "anc_loss": "9.738e-01", "dlm_acc": "6.707e-01", "anc_acc": "6.354e-01", "epoch": 0.09061} {"step": 45310, "loss": 1.2261, "grad_norm": "8.318e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.164e-01", "anc_loss": "5.797e-01", "dlm_acc": "7.913e-01", "anc_acc": "7.729e-01", "epoch": 0.09062} {"step": 45315, "loss": 1.3936, "grad_norm": "4.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.043e+00", "anc_loss": "1.123e+00", "dlm_acc": "5.521e-01", "anc_acc": "5.326e-01", "epoch": 0.09063} {"step": 45320, "loss": 1.2019, "grad_norm": "5.358e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.205e+00", "anc_loss": "1.203e+00", "dlm_acc": "1.040e-01", "anc_acc": "1.036e-01", "epoch": 0.09064} {"step": 45325, "loss": 0.8819, "grad_norm": "3.360e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.012e+00", "dlm_acc": "1.045e-01", "anc_acc": "1.040e-01", "epoch": 0.09065} {"step": 45330, "loss": 1.413, "grad_norm": "4.525e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.208e+00", "anc_loss": "1.209e+00", "dlm_acc": "1.132e-01", "anc_acc": "1.119e-01", "epoch": 0.09066} {"step": 45335, "loss": 1.2279, "grad_norm": "3.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.176e-01", "anc_loss": "9.617e-01", "dlm_acc": "3.638e-01", "anc_acc": "3.497e-01", "epoch": 0.09067} {"step": 45340, "loss": 1.262, "grad_norm": "2.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.621e-01", "anc_loss": "8.172e-01", "dlm_acc": "6.492e-01", "anc_acc": "6.318e-01", "epoch": 0.09068} {"step": 45345, "loss": 1.1468, "grad_norm": "4.073e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.019e-01", "anc_loss": "8.692e-01", "dlm_acc": "6.783e-01", "anc_acc": "6.555e-01", "epoch": 0.09069} {"step": 45350, "loss": 1.4657, "grad_norm": "4.432e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.217e+00", "anc_loss": "1.343e+00", "dlm_acc": "6.103e-01", "anc_acc": "5.819e-01", "epoch": 0.0907} {"step": 45355, "loss": 1.0261, "grad_norm": "2.517e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.900e-01", "anc_loss": "6.304e-01", "dlm_acc": "7.324e-01", "anc_acc": "7.161e-01", "epoch": 0.09071} {"step": 45360, "loss": 1.2713, "grad_norm": "3.629e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.875e-01", "anc_loss": "8.844e-01", "dlm_acc": "6.633e-01", "anc_acc": "6.357e-01", "epoch": 0.09072} {"step": 45365, "loss": 0.9489, "grad_norm": "3.231e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.208e-01", "anc_loss": "5.970e-01", "dlm_acc": "7.904e-01", "anc_acc": "7.715e-01", "epoch": 0.09073} {"step": 45370, "loss": 1.0805, "grad_norm": "3.343e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.103e+00", "anc_loss": "1.255e+00", "dlm_acc": "6.425e-01", "anc_acc": "6.082e-01", "epoch": 0.09074} {"step": 45375, "loss": 1.017, "grad_norm": "2.907e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.283e-01", "anc_loss": "3.414e-01", "dlm_acc": "7.876e-01", "anc_acc": "7.832e-01", "epoch": 0.09075} {"step": 45380, "loss": 0.9119, "grad_norm": "2.892e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.285e-01", "anc_loss": "3.375e-01", "dlm_acc": "7.564e-01", "anc_acc": "7.514e-01", "epoch": 0.09076} {"step": 45385, "loss": 0.9453, "grad_norm": "5.989e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.680e-01", "anc_loss": "1.090e+00", "dlm_acc": "6.679e-01", "anc_acc": "6.334e-01", "epoch": 0.09077} {"step": 45390, "loss": 0.7561, "grad_norm": "2.859e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.945e-01", "anc_loss": "5.475e-01", "dlm_acc": "7.920e-01", "anc_acc": "7.775e-01", "epoch": 0.09078} {"step": 45395, "loss": 0.8689, "grad_norm": "5.203e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.107e-01", "anc_loss": "2.381e-01", "dlm_acc": "8.645e-01", "anc_acc": "8.523e-01", "epoch": 0.09079} {"step": 45400, "loss": 0.8791, "grad_norm": "4.761e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.427e-01", "anc_loss": "5.979e-01", "dlm_acc": "7.967e-01", "anc_acc": "7.801e-01", "epoch": 0.0908} {"step": 45405, "loss": 1.0853, "grad_norm": "2.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.391e-01", "anc_loss": "8.297e-01", "dlm_acc": "6.857e-01", "anc_acc": "6.523e-01", "epoch": 0.09081} {"step": 45410, "loss": 1.3041, "grad_norm": "2.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.379e+00", "anc_loss": "1.498e+00", "dlm_acc": "5.824e-01", "anc_acc": "5.559e-01", "epoch": 0.09082} {"step": 45415, "loss": 1.1824, "grad_norm": "3.017e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.292e+00", "dlm_acc": "5.961e-01", "anc_acc": "5.649e-01", "epoch": 0.09083} {"step": 45420, "loss": 0.803, "grad_norm": "3.870e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.785e-01", "anc_loss": "9.836e-01", "dlm_acc": "6.166e-01", "anc_acc": "5.873e-01", "epoch": 0.09084} {"step": 45425, "loss": 0.929, "grad_norm": "2.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.277e-01", "anc_loss": "4.993e-01", "dlm_acc": "8.168e-01", "anc_acc": "7.898e-01", "epoch": 0.09085} {"step": 45430, "loss": 1.1563, "grad_norm": "3.826e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.763e-01", "anc_loss": "9.574e-01", "dlm_acc": "6.919e-01", "anc_acc": "6.696e-01", "epoch": 0.09086} {"step": 45435, "loss": 0.8544, "grad_norm": "4.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.703e-01", "anc_loss": "7.406e-01", "dlm_acc": "6.825e-01", "anc_acc": "6.575e-01", "epoch": 0.09087} {"step": 45440, "loss": 1.218, "grad_norm": "5.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.275e+00", "dlm_acc": "6.576e-01", "anc_acc": "6.156e-01", "epoch": 0.09088} {"step": 45445, "loss": 0.8633, "grad_norm": "4.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.185e-01", "anc_loss": "5.229e-01", "dlm_acc": "8.359e-01", "anc_acc": "7.949e-01", "epoch": 0.09089} {"step": 45450, "loss": 0.8728, "grad_norm": "3.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.433e-01", "anc_loss": "4.256e-01", "dlm_acc": "8.408e-01", "anc_acc": "8.094e-01", "epoch": 0.0909} {"step": 45455, "loss": 1.2194, "grad_norm": "3.176e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.674e-01", "anc_loss": "6.141e-01", "dlm_acc": "7.318e-01", "anc_acc": "7.177e-01", "epoch": 0.09091} {"step": 45460, "loss": 1.0857, "grad_norm": "2.411e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.969e-01", "anc_loss": "9.938e-01", "dlm_acc": "6.497e-01", "anc_acc": "6.250e-01", "epoch": 0.09092} {"step": 45465, "loss": 1.2242, "grad_norm": "4.760e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.129e+00", "anc_loss": "1.224e+00", "dlm_acc": "5.886e-01", "anc_acc": "5.628e-01", "epoch": 0.09093} {"step": 45470, "loss": 1.2186, "grad_norm": "2.585e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.257e+00", "dlm_acc": "5.885e-01", "anc_acc": "5.587e-01", "epoch": 0.09094} {"step": 45475, "loss": 1.6096, "grad_norm": "2.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.223e-01", "anc_loss": "9.980e-01", "dlm_acc": "6.904e-01", "anc_acc": "6.706e-01", "epoch": 0.09095} {"step": 45480, "loss": 1.0407, "grad_norm": "3.796e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.184e+00", "dlm_acc": "5.504e-01", "anc_acc": "5.409e-01", "epoch": 0.09096} {"step": 45485, "loss": 1.4069, "grad_norm": "4.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.957e-01", "anc_loss": "8.699e-01", "dlm_acc": "6.810e-01", "anc_acc": "6.584e-01", "epoch": 0.09097} {"step": 45490, "loss": 1.3786, "grad_norm": "2.931e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.623e+00", "dlm_acc": "5.388e-01", "anc_acc": "5.082e-01", "epoch": 0.09098} {"step": 45495, "loss": 1.0858, "grad_norm": "3.002e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.643e-01", "anc_loss": "1.080e+00", "dlm_acc": "6.609e-01", "anc_acc": "6.302e-01", "epoch": 0.09099} {"step": 45500, "loss": 1.1253, "grad_norm": "4.276e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.143e+00", "anc_loss": "1.263e+00", "dlm_acc": "6.373e-01", "anc_acc": "6.080e-01", "epoch": 0.091} {"step": 45505, "loss": 1.0802, "grad_norm": "2.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.205e+00", "dlm_acc": "6.366e-01", "anc_acc": "6.023e-01", "epoch": 0.09101} {"step": 45510, "loss": 1.2149, "grad_norm": "3.415e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.560e+00", "dlm_acc": "5.490e-01", "anc_acc": "5.199e-01", "epoch": 0.09102} {"step": 45515, "loss": 1.3845, "grad_norm": "3.812e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.312e+00", "anc_loss": "1.466e+00", "dlm_acc": "5.832e-01", "anc_acc": "5.477e-01", "epoch": 0.09103} {"step": 45520, "loss": 1.25, "grad_norm": "6.416e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.323e+00", "anc_loss": "1.452e+00", "dlm_acc": "6.068e-01", "anc_acc": "5.780e-01", "epoch": 0.09104} {"step": 45525, "loss": 1.2764, "grad_norm": "3.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.210e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.937e-01", "anc_acc": "5.588e-01", "epoch": 0.09105} {"step": 45530, "loss": 1.306, "grad_norm": "4.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.322e+00", "anc_loss": "1.442e+00", "dlm_acc": "5.696e-01", "anc_acc": "5.379e-01", "epoch": 0.09106} {"step": 45535, "loss": 1.0074, "grad_norm": "2.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.484e-01", "anc_loss": "1.073e+00", "dlm_acc": "6.491e-01", "anc_acc": "6.182e-01", "epoch": 0.09107} {"step": 45540, "loss": 1.108, "grad_norm": "4.279e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.241e+00", "dlm_acc": "6.230e-01", "anc_acc": "5.948e-01", "epoch": 0.09108} {"step": 45545, "loss": 0.9438, "grad_norm": "3.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.016e-01", "anc_loss": "9.930e-01", "dlm_acc": "6.536e-01", "anc_acc": "6.267e-01", "epoch": 0.09109} {"step": 45550, "loss": 1.6237, "grad_norm": "4.643e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.465e+00", "anc_loss": "1.611e+00", "dlm_acc": "5.524e-01", "anc_acc": "5.213e-01", "epoch": 0.0911} {"step": 45555, "loss": 1.3751, "grad_norm": "7.300e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.387e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.553e-01", "anc_acc": "5.185e-01", "epoch": 0.09111} {"step": 45560, "loss": 0.8007, "grad_norm": "8.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.633e-01", "anc_loss": "8.342e-01", "dlm_acc": "6.207e-01", "anc_acc": "5.995e-01", "epoch": 0.09112} {"step": 45565, "loss": 1.1044, "grad_norm": "1.368e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.852e-01", "anc_loss": "1.071e+00", "dlm_acc": "5.412e-01", "anc_acc": "5.188e-01", "epoch": 0.09113} {"step": 45570, "loss": 1.0963, "grad_norm": "3.150e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.684e-01", "anc_loss": "1.059e+00", "dlm_acc": "6.333e-01", "anc_acc": "6.084e-01", "epoch": 0.09114} {"step": 45575, "loss": 1.3427, "grad_norm": "1.043e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.016e+00", "anc_loss": "1.159e+00", "dlm_acc": "6.096e-01", "anc_acc": "5.663e-01", "epoch": 0.09115} {"step": 45580, "loss": 0.9127, "grad_norm": "2.757e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.891e-01", "anc_loss": "8.883e-01", "dlm_acc": "6.418e-01", "anc_acc": "6.109e-01", "epoch": 0.09116} {"step": 45585, "loss": 1.2754, "grad_norm": "3.544e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.203e+00", "anc_loss": "1.344e+00", "dlm_acc": "5.734e-01", "anc_acc": "5.327e-01", "epoch": 0.09117} {"step": 45590, "loss": 1.4701, "grad_norm": "2.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.258e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.775e-01", "anc_acc": "5.507e-01", "epoch": 0.09118} {"step": 45595, "loss": 1.4908, "grad_norm": "3.749e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.182e-01", "epoch": 0.09119} {"step": 45600, "loss": 1.3152, "grad_norm": "3.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.522e-01", "anc_acc": "5.174e-01", "epoch": 0.0912} {"step": 45605, "loss": 1.095, "grad_norm": "3.197e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.570e-01", "anc_loss": "9.914e-01", "dlm_acc": "6.437e-01", "anc_acc": "6.049e-01", "epoch": 0.09121} {"step": 45610, "loss": 1.3454, "grad_norm": "3.080e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.153e+00", "anc_loss": "1.295e+00", "dlm_acc": "6.146e-01", "anc_acc": "5.691e-01", "epoch": 0.09122} {"step": 45615, "loss": 1.2402, "grad_norm": "3.455e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.565e+00", "dlm_acc": "5.399e-01", "anc_acc": "5.069e-01", "epoch": 0.09123} {"step": 45620, "loss": 1.0683, "grad_norm": "2.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.107e+00", "dlm_acc": "5.705e-01", "anc_acc": "5.449e-01", "epoch": 0.09124} {"step": 45625, "loss": 1.3863, "grad_norm": "3.123e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.623e+00", "anc_loss": "1.728e+00", "dlm_acc": "4.608e-01", "anc_acc": "4.377e-01", "epoch": 0.09125} {"step": 45630, "loss": 0.9559, "grad_norm": "4.401e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.840e-01", "anc_loss": "9.945e-01", "dlm_acc": "6.352e-01", "anc_acc": "6.017e-01", "epoch": 0.09126} {"step": 45635, "loss": 1.2725, "grad_norm": "2.154e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.024e+00", "anc_loss": "1.195e+00", "dlm_acc": "6.559e-01", "anc_acc": "6.110e-01", "epoch": 0.09127} {"step": 45640, "loss": 1.6963, "grad_norm": "9.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.441e+00", "anc_loss": "1.577e+00", "dlm_acc": "5.369e-01", "anc_acc": "5.046e-01", "epoch": 0.09128} {"step": 45645, "loss": 1.3797, "grad_norm": "3.172e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.151e+00", "dlm_acc": "5.968e-01", "anc_acc": "5.659e-01", "epoch": 0.09129} {"step": 45650, "loss": 1.1777, "grad_norm": "5.784e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.816e-01", "anc_loss": "5.945e-01", "dlm_acc": "5.751e-01", "anc_acc": "5.702e-01", "epoch": 0.0913} {"step": 45655, "loss": 1.2711, "grad_norm": "2.478e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.770e-01", "anc_loss": "1.061e+00", "dlm_acc": "5.792e-01", "anc_acc": "5.589e-01", "epoch": 0.09131} {"step": 45660, "loss": 1.5445, "grad_norm": "3.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.606e+00", "dlm_acc": "5.346e-01", "anc_acc": "4.887e-01", "epoch": 0.09132} {"step": 45665, "loss": 1.2983, "grad_norm": "4.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.574e-01", "anc_loss": "1.112e+00", "dlm_acc": "6.562e-01", "anc_acc": "6.142e-01", "epoch": 0.09133} {"step": 45670, "loss": 1.6034, "grad_norm": "3.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.077e+00", "anc_loss": "1.209e+00", "dlm_acc": "6.633e-01", "anc_acc": "6.284e-01", "epoch": 0.09134} {"step": 45675, "loss": 1.8094, "grad_norm": "1.753e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.463e+00", "anc_loss": "1.560e+00", "dlm_acc": "5.676e-01", "anc_acc": "5.447e-01", "epoch": 0.09135} {"step": 45680, "loss": 1.8467, "grad_norm": "3.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.506e+00", "anc_loss": "2.544e+00", "dlm_acc": "1.618e-01", "anc_acc": "1.519e-01", "epoch": 0.09136} {"step": 45685, "loss": 1.7901, "grad_norm": "4.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.741e+00", "anc_loss": "2.756e+00", "dlm_acc": "5.080e-02", "anc_acc": "4.626e-02", "epoch": 0.09137} {"step": 45690, "loss": 1.2139, "grad_norm": "2.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.453e+00", "dlm_acc": "4.225e-01", "anc_acc": "3.978e-01", "epoch": 0.09138} {"step": 45695, "loss": 1.1512, "grad_norm": "2.293e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.840e-01", "anc_loss": "1.116e+00", "dlm_acc": "6.169e-01", "anc_acc": "5.711e-01", "epoch": 0.09139} {"step": 45700, "loss": 0.9949, "grad_norm": "2.837e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.703e-01", "anc_loss": "7.937e-01", "dlm_acc": "6.680e-01", "anc_acc": "6.106e-01", "epoch": 0.0914} {"step": 45705, "loss": 1.3854, "grad_norm": "3.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.228e+00", "dlm_acc": "6.028e-01", "anc_acc": "5.590e-01", "epoch": 0.09141} {"step": 45710, "loss": 1.4087, "grad_norm": "4.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.358e+00", "anc_loss": "1.480e+00", "dlm_acc": "5.222e-01", "anc_acc": "4.929e-01", "epoch": 0.09142} {"step": 45715, "loss": 1.786, "grad_norm": "3.699e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.641e+00", "anc_loss": "1.777e+00", "dlm_acc": "4.817e-01", "anc_acc": "4.514e-01", "epoch": 0.09143} {"step": 45720, "loss": 1.3185, "grad_norm": "2.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.070e+00", "anc_loss": "1.191e+00", "dlm_acc": "5.873e-01", "anc_acc": "5.557e-01", "epoch": 0.09144} {"step": 45725, "loss": 0.7734, "grad_norm": "1.862e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.887e-01", "anc_loss": "7.441e-01", "dlm_acc": "6.434e-01", "anc_acc": "6.274e-01", "epoch": 0.09145} {"step": 45730, "loss": 0.8513, "grad_norm": "1.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.013e+00", "anc_loss": "1.139e+00", "dlm_acc": "5.958e-01", "anc_acc": "5.601e-01", "epoch": 0.09146} {"step": 45735, "loss": 1.0169, "grad_norm": "8.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.310e+00", "anc_loss": "1.424e+00", "dlm_acc": "5.356e-01", "anc_acc": "5.050e-01", "epoch": 0.09147} {"step": 45740, "loss": 1.3382, "grad_norm": "3.274e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.671e+00", "dlm_acc": "5.415e-01", "anc_acc": "5.113e-01", "epoch": 0.09148} {"step": 45745, "loss": 1.7081, "grad_norm": "7.982e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.609e+00", "anc_loss": "1.756e+00", "dlm_acc": "5.123e-01", "anc_acc": "4.788e-01", "epoch": 0.09149} {"step": 45750, "loss": 1.2687, "grad_norm": "4.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.357e+00", "anc_loss": "1.457e+00", "dlm_acc": "4.741e-01", "anc_acc": "4.510e-01", "epoch": 0.0915} {"step": 45755, "loss": 1.305, "grad_norm": "4.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.123e+00", "dlm_acc": "6.098e-01", "anc_acc": "5.882e-01", "epoch": 0.09151} {"step": 45760, "loss": 0.8724, "grad_norm": "3.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.629e-01", "anc_loss": "4.977e-01", "dlm_acc": "6.782e-01", "anc_acc": "6.656e-01", "epoch": 0.09152} {"step": 45765, "loss": 1.0563, "grad_norm": "3.624e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.539e-01", "anc_loss": "6.086e-01", "dlm_acc": "6.527e-01", "anc_acc": "6.325e-01", "epoch": 0.09153} {"step": 45770, "loss": 1.0026, "grad_norm": "3.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.004e-01", "anc_loss": "5.613e-01", "dlm_acc": "6.639e-01", "anc_acc": "6.370e-01", "epoch": 0.09154} {"step": 45775, "loss": 1.0903, "grad_norm": "2.768e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.305e-01", "anc_loss": "5.973e-01", "dlm_acc": "6.481e-01", "anc_acc": "6.185e-01", "epoch": 0.09155} {"step": 45780, "loss": 1.0002, "grad_norm": "2.631e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.902e-01", "anc_loss": "5.414e-01", "dlm_acc": "6.593e-01", "anc_acc": "6.331e-01", "epoch": 0.09156} {"step": 45785, "loss": 1.418, "grad_norm": "2.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.620e+00", "dlm_acc": "5.226e-01", "anc_acc": "4.944e-01", "epoch": 0.09157} {"step": 45790, "loss": 1.264, "grad_norm": "2.728e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.337e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.604e-01", "anc_acc": "5.314e-01", "epoch": 0.09158} {"step": 45795, "loss": 0.8298, "grad_norm": "2.998e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.191e+00", "dlm_acc": "5.939e-01", "anc_acc": "5.646e-01", "epoch": 0.09159} {"step": 45800, "loss": 1.5077, "grad_norm": "5.802e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.483e+00", "anc_loss": "1.609e+00", "dlm_acc": "5.424e-01", "anc_acc": "5.159e-01", "epoch": 0.0916} {"step": 45805, "loss": 1.707, "grad_norm": "2.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.319e+00", "anc_loss": "2.397e+00", "dlm_acc": "2.412e-01", "anc_acc": "2.264e-01", "epoch": 0.09161} {"step": 45810, "loss": 0.8872, "grad_norm": "2.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.620e-02", "anc_loss": "3.559e-02", "dlm_acc": "9.799e-01", "anc_acc": "9.784e-01", "epoch": 0.09162} {"step": 45815, "loss": 1.3508, "grad_norm": "2.616e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.374e-02", "anc_loss": "4.048e-02", "dlm_acc": "9.799e-01", "anc_acc": "9.757e-01", "epoch": 0.09163} {"step": 45820, "loss": 0.8821, "grad_norm": "4.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.379e-02", "anc_loss": "5.718e-02", "dlm_acc": "9.689e-01", "anc_acc": "9.598e-01", "epoch": 0.09164} {"step": 45825, "loss": 0.9283, "grad_norm": "5.236e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.448e-02", "anc_loss": "2.771e-02", "dlm_acc": "9.836e-01", "anc_acc": "9.823e-01", "epoch": 0.09165} {"step": 45830, "loss": 1.4544, "grad_norm": "6.953e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.235e+00", "anc_loss": "1.351e+00", "dlm_acc": "6.020e-01", "anc_acc": "5.768e-01", "epoch": 0.09166} {"step": 45835, "loss": 1.4044, "grad_norm": "5.677e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.321e+00", "anc_loss": "1.435e+00", "dlm_acc": "5.434e-01", "anc_acc": "5.146e-01", "epoch": 0.09167} {"step": 45840, "loss": 1.3615, "grad_norm": "5.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.351e+00", "dlm_acc": "5.699e-01", "anc_acc": "5.451e-01", "epoch": 0.09168} {"step": 45845, "loss": 1.2643, "grad_norm": "3.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.406e-01", "anc_acc": "5.121e-01", "epoch": 0.09169} {"step": 45850, "loss": 1.7345, "grad_norm": "2.931e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.942e+00", "anc_loss": "2.084e+00", "dlm_acc": "4.570e-01", "anc_acc": "4.290e-01", "epoch": 0.0917} {"step": 45855, "loss": 1.4682, "grad_norm": "3.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.521e+00", "dlm_acc": "5.731e-01", "anc_acc": "5.468e-01", "epoch": 0.09171} {"step": 45860, "loss": 0.946, "grad_norm": "4.306e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.793e-01", "anc_acc": "5.519e-01", "epoch": 0.09172} {"step": 45865, "loss": 1.1302, "grad_norm": "4.083e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.675e+00", "anc_loss": "1.822e+00", "dlm_acc": "4.985e-01", "anc_acc": "4.648e-01", "epoch": 0.09173} {"step": 45870, "loss": 1.2115, "grad_norm": "4.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.381e+00", "dlm_acc": "6.343e-01", "anc_acc": "6.093e-01", "epoch": 0.09174} {"step": 45875, "loss": 1.0016, "grad_norm": "3.202e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.413e+00", "dlm_acc": "5.939e-01", "anc_acc": "5.621e-01", "epoch": 0.09175} {"step": 45880, "loss": 0.9394, "grad_norm": "4.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.195e+00", "anc_loss": "1.335e+00", "dlm_acc": "5.807e-01", "anc_acc": "5.446e-01", "epoch": 0.09176} {"step": 45885, "loss": 1.1503, "grad_norm": "4.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.357e+00", "dlm_acc": "5.920e-01", "anc_acc": "5.596e-01", "epoch": 0.09177} {"step": 45890, "loss": 1.021, "grad_norm": "3.238e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.290e+00", "anc_loss": "1.401e+00", "dlm_acc": "5.607e-01", "anc_acc": "5.327e-01", "epoch": 0.09178} {"step": 45895, "loss": 0.7469, "grad_norm": "5.133e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.143e+00", "dlm_acc": "6.412e-01", "anc_acc": "6.091e-01", "epoch": 0.09179} {"step": 45900, "loss": 0.8649, "grad_norm": "2.867e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.169e+00", "anc_loss": "1.282e+00", "dlm_acc": "5.822e-01", "anc_acc": "5.494e-01", "epoch": 0.0918} {"step": 45905, "loss": 1.1464, "grad_norm": "3.534e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.514e+00", "anc_loss": "1.645e+00", "dlm_acc": "5.500e-01", "anc_acc": "5.202e-01", "epoch": 0.09181} {"step": 45910, "loss": 1.5252, "grad_norm": "3.964e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.588e+00", "anc_loss": "1.725e+00", "dlm_acc": "5.409e-01", "anc_acc": "5.129e-01", "epoch": 0.09182} {"step": 45915, "loss": 1.1894, "grad_norm": "3.503e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.151e+00", "anc_loss": "1.278e+00", "dlm_acc": "6.088e-01", "anc_acc": "5.783e-01", "epoch": 0.09183} {"step": 45920, "loss": 1.1773, "grad_norm": "2.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.398e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.636e-01", "anc_acc": "5.329e-01", "epoch": 0.09184} {"step": 45925, "loss": 1.1358, "grad_norm": "4.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.644e-01", "anc_acc": "5.317e-01", "epoch": 0.09185} {"step": 45930, "loss": 1.4295, "grad_norm": "3.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.363e+00", "anc_loss": "1.499e+00", "dlm_acc": "5.773e-01", "anc_acc": "5.505e-01", "epoch": 0.09186} {"step": 45935, "loss": 1.1511, "grad_norm": "3.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.517e+00", "dlm_acc": "5.052e-01", "anc_acc": "4.755e-01", "epoch": 0.09187} {"step": 45940, "loss": 1.2023, "grad_norm": "4.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.684e+00", "anc_loss": "1.812e+00", "dlm_acc": "4.780e-01", "anc_acc": "4.508e-01", "epoch": 0.09188} {"step": 45945, "loss": 1.3181, "grad_norm": "2.452e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.308e+00", "anc_loss": "1.425e+00", "dlm_acc": "5.846e-01", "anc_acc": "5.578e-01", "epoch": 0.09189} {"step": 45950, "loss": 0.8945, "grad_norm": "2.706e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.035e+00", "anc_loss": "1.152e+00", "dlm_acc": "5.725e-01", "anc_acc": "5.401e-01", "epoch": 0.0919} {"step": 45955, "loss": 1.3254, "grad_norm": "4.238e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.419e+00", "anc_loss": "1.559e+00", "dlm_acc": "5.649e-01", "anc_acc": "5.330e-01", "epoch": 0.09191} {"step": 45960, "loss": 1.0605, "grad_norm": "4.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.545e-01", "anc_acc": "5.236e-01", "epoch": 0.09192} {"step": 45965, "loss": 0.9718, "grad_norm": "5.897e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.299e+00", "dlm_acc": "5.961e-01", "anc_acc": "5.598e-01", "epoch": 0.09193} {"step": 45970, "loss": 1.4044, "grad_norm": "6.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.418e+00", "anc_loss": "1.537e+00", "dlm_acc": "5.571e-01", "anc_acc": "5.303e-01", "epoch": 0.09194} {"step": 45975, "loss": 1.0988, "grad_norm": "3.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.595e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.192e-01", "epoch": 0.09195} {"step": 45980, "loss": 1.1407, "grad_norm": "5.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.095e+00", "anc_loss": "1.230e+00", "dlm_acc": "6.217e-01", "anc_acc": "5.863e-01", "epoch": 0.09196} {"step": 45985, "loss": 0.9675, "grad_norm": "3.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.142e+00", "anc_loss": "1.244e+00", "dlm_acc": "5.831e-01", "anc_acc": "5.610e-01", "epoch": 0.09197} {"step": 45990, "loss": 1.2326, "grad_norm": "3.078e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.603e+00", "anc_loss": "1.786e+00", "dlm_acc": "5.000e-01", "anc_acc": "4.731e-01", "epoch": 0.09198} {"step": 45995, "loss": 1.3359, "grad_norm": "4.464e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.457e+00", "anc_loss": "1.588e+00", "dlm_acc": "5.298e-01", "anc_acc": "4.984e-01", "epoch": 0.09199} {"step": 46000, "loss": 0.992, "grad_norm": "4.257e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.272e+00", "anc_loss": "1.400e+00", "dlm_acc": "5.822e-01", "anc_acc": "5.543e-01", "epoch": 0.092} {"step": 46005, "loss": 1.4671, "grad_norm": "1.267e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.317e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.974e-01", "anc_acc": "5.680e-01", "epoch": 0.09201} {"step": 46010, "loss": 1.4107, "grad_norm": "3.830e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.533e+00", "anc_loss": "1.706e+00", "dlm_acc": "5.489e-01", "anc_acc": "5.178e-01", "epoch": 0.09202} {"step": 46015, "loss": 1.0851, "grad_norm": "2.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.263e+00", "anc_loss": "1.398e+00", "dlm_acc": "5.807e-01", "anc_acc": "5.461e-01", "epoch": 0.09203} {"step": 46020, "loss": 1.0556, "grad_norm": "4.313e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.297e-01", "anc_loss": "7.641e-01", "dlm_acc": "5.401e-01", "anc_acc": "5.306e-01", "epoch": 0.09204} {"step": 46025, "loss": 0.8158, "grad_norm": "1.907e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.789e-01", "anc_loss": "7.293e-01", "dlm_acc": "5.773e-01", "anc_acc": "5.606e-01", "epoch": 0.09205} {"step": 46030, "loss": 1.0629, "grad_norm": "2.820e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.411e+00", "anc_loss": "1.564e+00", "dlm_acc": "5.483e-01", "anc_acc": "5.156e-01", "epoch": 0.09206} {"step": 46035, "loss": 1.5313, "grad_norm": "4.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.402e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.412e-01", "anc_acc": "5.091e-01", "epoch": 0.09207} {"step": 46040, "loss": 1.1262, "grad_norm": "3.004e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.266e+00", "anc_loss": "1.405e+00", "dlm_acc": "5.739e-01", "anc_acc": "5.442e-01", "epoch": 0.09208} {"step": 46045, "loss": 1.2301, "grad_norm": "2.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.172e-01", "anc_acc": "4.896e-01", "epoch": 0.09209} {"step": 46050, "loss": 1.1044, "grad_norm": "4.697e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.255e+00", "dlm_acc": "6.158e-01", "anc_acc": "5.879e-01", "epoch": 0.0921} {"step": 46055, "loss": 1.0341, "grad_norm": "2.047e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.179e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.893e-01", "anc_acc": "5.632e-01", "epoch": 0.09211} {"step": 46060, "loss": 1.6727, "grad_norm": "3.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.496e+00", "anc_loss": "1.652e+00", "dlm_acc": "5.469e-01", "anc_acc": "5.090e-01", "epoch": 0.09212} {"step": 46065, "loss": 1.5688, "grad_norm": "2.848e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.695e+00", "anc_loss": "1.841e+00", "dlm_acc": "5.153e-01", "anc_acc": "4.835e-01", "epoch": 0.09213} {"step": 46070, "loss": 0.986, "grad_norm": "1.953e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.233e+00", "dlm_acc": "5.816e-01", "anc_acc": "5.489e-01", "epoch": 0.09214} {"step": 46075, "loss": 1.4124, "grad_norm": "3.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.768e+00", "anc_loss": "1.909e+00", "dlm_acc": "4.766e-01", "anc_acc": "4.447e-01", "epoch": 0.09215} {"step": 46080, "loss": 1.1736, "grad_norm": "2.650e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.239e+00", "anc_loss": "1.358e+00", "dlm_acc": "5.989e-01", "anc_acc": "5.691e-01", "epoch": 0.09216} {"step": 46085, "loss": 1.3466, "grad_norm": "4.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.284e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.667e-01", "anc_acc": "5.406e-01", "epoch": 0.09217} {"step": 46090, "loss": 1.5405, "grad_norm": "3.544e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.292e+00", "dlm_acc": "5.912e-01", "anc_acc": "5.604e-01", "epoch": 0.09218} {"step": 46095, "loss": 1.2315, "grad_norm": "1.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.243e+00", "anc_loss": "1.346e+00", "dlm_acc": "5.979e-01", "anc_acc": "5.677e-01", "epoch": 0.09219} {"step": 46100, "loss": 1.4879, "grad_norm": "8.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.655e+00", "dlm_acc": "3.124e-01", "anc_acc": "2.901e-01", "epoch": 0.0922} {"step": 46105, "loss": 1.4592, "grad_norm": "2.341e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.438e+00", "anc_loss": "1.530e+00", "dlm_acc": "4.372e-01", "anc_acc": "4.126e-01", "epoch": 0.09221} {"step": 46110, "loss": 1.4725, "grad_norm": "7.577e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.565e+00", "anc_loss": "1.681e+00", "dlm_acc": "5.341e-01", "anc_acc": "5.089e-01", "epoch": 0.09222} {"step": 46115, "loss": 1.3316, "grad_norm": "4.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.446e+00", "anc_loss": "1.570e+00", "dlm_acc": "5.222e-01", "anc_acc": "4.929e-01", "epoch": 0.09223} {"step": 46120, "loss": 1.155, "grad_norm": "3.569e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.300e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.537e-01", "anc_acc": "5.214e-01", "epoch": 0.09224} {"step": 46125, "loss": 1.5405, "grad_norm": "3.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.394e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.642e-01", "anc_acc": "5.337e-01", "epoch": 0.09225} {"step": 46130, "loss": 1.513, "grad_norm": "2.394e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.688e+00", "dlm_acc": "5.439e-01", "anc_acc": "5.107e-01", "epoch": 0.09226} {"step": 46135, "loss": 1.5349, "grad_norm": "7.779e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.557e+00", "anc_loss": "1.708e+00", "dlm_acc": "5.237e-01", "anc_acc": "4.903e-01", "epoch": 0.09227} {"step": 46140, "loss": 1.4642, "grad_norm": "3.034e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.492e+00", "anc_loss": "1.655e+00", "dlm_acc": "5.612e-01", "anc_acc": "5.268e-01", "epoch": 0.09228} {"step": 46145, "loss": 0.7319, "grad_norm": "2.951e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.742e-01", "anc_loss": "8.805e-01", "dlm_acc": "6.646e-01", "anc_acc": "6.316e-01", "epoch": 0.09229} {"step": 46150, "loss": 0.8384, "grad_norm": "2.931e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.523e-01", "anc_loss": "7.793e-01", "dlm_acc": "6.963e-01", "anc_acc": "6.552e-01", "epoch": 0.0923} {"step": 46155, "loss": 1.0425, "grad_norm": "1.125e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.512e-01", "anc_loss": "9.625e-01", "dlm_acc": "6.508e-01", "anc_acc": "6.169e-01", "epoch": 0.09231} {"step": 46160, "loss": 1.0636, "grad_norm": "2.723e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.313e-01", "anc_loss": "1.033e+00", "dlm_acc": "6.581e-01", "anc_acc": "6.311e-01", "epoch": 0.09232} {"step": 46165, "loss": 1.2191, "grad_norm": "2.353e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.028e+00", "anc_loss": "1.126e+00", "dlm_acc": "6.088e-01", "anc_acc": "5.809e-01", "epoch": 0.09233} {"step": 46170, "loss": 1.5174, "grad_norm": "6.386e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.080e+00", "anc_loss": "2.175e+00", "dlm_acc": "3.167e-01", "anc_acc": "2.952e-01", "epoch": 0.09234} {"step": 46175, "loss": 1.6496, "grad_norm": "3.686e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.355e+00", "anc_loss": "1.488e+00", "dlm_acc": "5.767e-01", "anc_acc": "5.466e-01", "epoch": 0.09235} {"step": 46180, "loss": 1.2637, "grad_norm": "4.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.419e-01", "anc_loss": "8.259e-01", "dlm_acc": "6.708e-01", "anc_acc": "6.367e-01", "epoch": 0.09236} {"step": 46185, "loss": 1.051, "grad_norm": "2.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.809e-01", "anc_loss": "9.187e-01", "dlm_acc": "6.995e-01", "anc_acc": "6.422e-01", "epoch": 0.09237} {"step": 46190, "loss": 1.1258, "grad_norm": "1.972e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.331e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.483e-01", "anc_acc": "5.171e-01", "epoch": 0.09238} {"step": 46195, "loss": 1.0286, "grad_norm": "3.776e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.921e-01", "anc_loss": "8.603e-01", "dlm_acc": "7.070e-01", "anc_acc": "6.529e-01", "epoch": 0.09239} {"step": 46200, "loss": 1.572, "grad_norm": "3.559e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.663e+00", "anc_loss": "1.766e+00", "dlm_acc": "3.843e-01", "anc_acc": "3.584e-01", "epoch": 0.0924} {"step": 46205, "loss": 1.066, "grad_norm": "3.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.109e+00", "anc_loss": "1.188e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.118e-01", "epoch": 0.09241} {"step": 46210, "loss": 1.5977, "grad_norm": "3.099e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.127e+00", "anc_loss": "2.163e+00", "dlm_acc": "2.830e-01", "anc_acc": "2.743e-01", "epoch": 0.09242} {"step": 46215, "loss": 1.3914, "grad_norm": "2.245e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.552e+00", "anc_loss": "1.680e+00", "dlm_acc": "4.632e-01", "anc_acc": "4.294e-01", "epoch": 0.09243} {"step": 46220, "loss": 1.253, "grad_norm": "2.034e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.300e+00", "anc_loss": "1.439e+00", "dlm_acc": "5.294e-01", "anc_acc": "4.907e-01", "epoch": 0.09244} {"step": 46225, "loss": 1.2682, "grad_norm": "5.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.441e+00", "dlm_acc": "5.708e-01", "anc_acc": "5.449e-01", "epoch": 0.09245} {"step": 46230, "loss": 1.39, "grad_norm": "6.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.652e+00", "anc_loss": "1.780e+00", "dlm_acc": "4.378e-01", "anc_acc": "4.028e-01", "epoch": 0.09246} {"step": 46235, "loss": 1.5996, "grad_norm": "5.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.906e+00", "anc_loss": "2.925e+00", "dlm_acc": "3.686e-02", "anc_acc": "3.424e-02", "epoch": 0.09247} {"step": 46240, "loss": 1.4426, "grad_norm": "3.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.461e+00", "anc_loss": "2.500e+00", "dlm_acc": "1.441e-01", "anc_acc": "1.366e-01", "epoch": 0.09248} {"step": 46245, "loss": 1.2523, "grad_norm": "2.990e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.074e+00", "anc_loss": "1.182e+00", "dlm_acc": "6.713e-01", "anc_acc": "6.405e-01", "epoch": 0.09249} {"step": 46250, "loss": 0.7519, "grad_norm": "3.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.789e-01", "anc_loss": "1.892e-01", "dlm_acc": "8.648e-01", "anc_acc": "8.613e-01", "epoch": 0.0925} {"step": 46255, "loss": 1.2204, "grad_norm": "7.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.273e+00", "dlm_acc": "6.211e-01", "anc_acc": "5.791e-01", "epoch": 0.09251} {"step": 46260, "loss": 1.2286, "grad_norm": "2.746e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.221e+00", "anc_loss": "1.346e+00", "dlm_acc": "5.768e-01", "anc_acc": "5.433e-01", "epoch": 0.09252} {"step": 46265, "loss": 1.4094, "grad_norm": "4.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.407e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.431e-01", "anc_acc": "5.062e-01", "epoch": 0.09253} {"step": 46270, "loss": 1.0935, "grad_norm": "4.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.388e+00", "anc_loss": "1.530e+00", "dlm_acc": "5.197e-01", "anc_acc": "4.814e-01", "epoch": 0.09254} {"step": 46275, "loss": 1.3947, "grad_norm": "3.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.450e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.102e-01", "anc_acc": "4.830e-01", "epoch": 0.09255} {"step": 46280, "loss": 1.5225, "grad_norm": "2.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.666e+00", "anc_loss": "1.806e+00", "dlm_acc": "4.443e-01", "anc_acc": "4.153e-01", "epoch": 0.09256} {"step": 46285, "loss": 0.9278, "grad_norm": "1.854e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.052e-01", "anc_acc": "4.454e-01", "epoch": 0.09257} {"step": 46290, "loss": 1.0813, "grad_norm": "2.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.145e+00", "anc_loss": "1.307e+00", "dlm_acc": "6.058e-01", "anc_acc": "5.621e-01", "epoch": 0.09258} {"step": 46295, "loss": 1.6282, "grad_norm": "2.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.343e+00", "anc_loss": "1.458e+00", "dlm_acc": "5.761e-01", "anc_acc": "5.495e-01", "epoch": 0.09259} {"step": 46300, "loss": 1.3072, "grad_norm": "3.108e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.140e+00", "anc_loss": "1.278e+00", "dlm_acc": "5.627e-01", "anc_acc": "5.258e-01", "epoch": 0.0926} {"step": 46305, "loss": 1.322, "grad_norm": "2.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.238e-01", "anc_loss": "1.047e+00", "dlm_acc": "6.259e-01", "anc_acc": "5.863e-01", "epoch": 0.09261} {"step": 46310, "loss": 1.1708, "grad_norm": "3.190e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.411e-01", "anc_loss": "8.375e-01", "dlm_acc": "7.004e-01", "anc_acc": "6.682e-01", "epoch": 0.09262} {"step": 46315, "loss": 1.4777, "grad_norm": "3.993e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.538e+00", "anc_loss": "1.695e+00", "dlm_acc": "5.086e-01", "anc_acc": "4.779e-01", "epoch": 0.09263} {"step": 46320, "loss": 1.1392, "grad_norm": "3.907e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.188e+00", "anc_loss": "1.314e+00", "dlm_acc": "5.755e-01", "anc_acc": "5.460e-01", "epoch": 0.09264} {"step": 46325, "loss": 1.2181, "grad_norm": "2.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.164e+00", "anc_loss": "1.269e+00", "dlm_acc": "5.670e-01", "anc_acc": "5.392e-01", "epoch": 0.09265} {"step": 46330, "loss": 1.1276, "grad_norm": "3.187e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.114e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.953e-01", "anc_acc": "5.638e-01", "epoch": 0.09266} {"step": 46335, "loss": 2.015, "grad_norm": "4.351e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.834e+00", "anc_loss": "1.959e+00", "dlm_acc": "4.464e-01", "anc_acc": "4.213e-01", "epoch": 0.09267} {"step": 46340, "loss": 1.3836, "grad_norm": "3.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.529e-01", "anc_acc": "5.247e-01", "epoch": 0.09268} {"step": 46345, "loss": 1.5548, "grad_norm": "2.167e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.569e+00", "anc_loss": "1.682e+00", "dlm_acc": "4.901e-01", "anc_acc": "4.633e-01", "epoch": 0.09269} {"step": 46350, "loss": 1.1864, "grad_norm": "3.332e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.071e+00", "anc_loss": "1.173e+00", "dlm_acc": "5.977e-01", "anc_acc": "5.679e-01", "epoch": 0.0927} {"step": 46355, "loss": 1.6505, "grad_norm": "2.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.541e+00", "anc_loss": "1.673e+00", "dlm_acc": "5.471e-01", "anc_acc": "5.130e-01", "epoch": 0.09271} {"step": 46360, "loss": 1.2658, "grad_norm": "2.581e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.363e+00", "dlm_acc": "5.741e-01", "anc_acc": "5.468e-01", "epoch": 0.09272} {"step": 46365, "loss": 1.3015, "grad_norm": "2.810e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.127e-01", "anc_acc": "4.858e-01", "epoch": 0.09273} {"step": 46370, "loss": 1.3096, "grad_norm": "4.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.561e+00", "dlm_acc": "5.400e-01", "anc_acc": "5.062e-01", "epoch": 0.09274} {"step": 46375, "loss": 1.2606, "grad_norm": "2.756e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.346e+00", "anc_loss": "1.469e+00", "dlm_acc": "5.521e-01", "anc_acc": "5.184e-01", "epoch": 0.09275} {"step": 46380, "loss": 1.0257, "grad_norm": "3.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.206e+00", "anc_loss": "1.303e+00", "dlm_acc": "5.408e-01", "anc_acc": "5.181e-01", "epoch": 0.09276} {"step": 46385, "loss": 0.9181, "grad_norm": "2.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.111e+00", "anc_loss": "1.234e+00", "dlm_acc": "5.844e-01", "anc_acc": "5.548e-01", "epoch": 0.09277} {"step": 46390, "loss": 0.8904, "grad_norm": "3.405e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.273e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.510e-01", "anc_acc": "5.220e-01", "epoch": 0.09278} {"step": 46395, "loss": 1.1381, "grad_norm": "2.172e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.733e-01", "anc_acc": "5.402e-01", "epoch": 0.09279} {"step": 46400, "loss": 1.0178, "grad_norm": "1.909e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.655e+00", "anc_loss": "1.787e+00", "dlm_acc": "5.046e-01", "anc_acc": "4.761e-01", "epoch": 0.0928} {"step": 46405, "loss": 1.1948, "grad_norm": "4.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.527e+00", "anc_loss": "1.636e+00", "dlm_acc": "5.102e-01", "anc_acc": "4.860e-01", "epoch": 0.09281} {"step": 46410, "loss": 1.7292, "grad_norm": "3.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.677e+00", "anc_loss": "1.837e+00", "dlm_acc": "5.302e-01", "anc_acc": "4.956e-01", "epoch": 0.09282} {"step": 46415, "loss": 1.2421, "grad_norm": "2.570e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.198e+00", "anc_loss": "1.310e+00", "dlm_acc": "6.031e-01", "anc_acc": "5.781e-01", "epoch": 0.09283} {"step": 46420, "loss": 1.2631, "grad_norm": "3.963e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.547e+00", "dlm_acc": "5.262e-01", "anc_acc": "4.953e-01", "epoch": 0.09284} {"step": 46425, "loss": 1.1786, "grad_norm": "3.023e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.170e+00", "anc_loss": "1.286e+00", "dlm_acc": "5.856e-01", "anc_acc": "5.576e-01", "epoch": 0.09285} {"step": 46430, "loss": 1.2649, "grad_norm": "5.472e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.547e+00", "anc_loss": "1.677e+00", "dlm_acc": "4.961e-01", "anc_acc": "4.667e-01", "epoch": 0.09286} {"step": 46435, "loss": 0.7844, "grad_norm": "2.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.010e+00", "anc_loss": "1.114e+00", "dlm_acc": "5.993e-01", "anc_acc": "5.707e-01", "epoch": 0.09287} {"step": 46440, "loss": 1.4643, "grad_norm": "3.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.475e+00", "anc_loss": "1.628e+00", "dlm_acc": "5.596e-01", "anc_acc": "5.247e-01", "epoch": 0.09288} {"step": 46445, "loss": 1.1093, "grad_norm": "3.649e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.344e-01", "anc_loss": "1.029e+00", "dlm_acc": "6.545e-01", "anc_acc": "6.272e-01", "epoch": 0.09289} {"step": 46450, "loss": 0.9996, "grad_norm": "8.578e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.105e-01", "anc_loss": "8.691e-01", "dlm_acc": "6.050e-01", "anc_acc": "5.871e-01", "epoch": 0.0929} {"step": 46455, "loss": 1.1413, "grad_norm": "2.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.021e+00", "anc_loss": "1.141e+00", "dlm_acc": "6.045e-01", "anc_acc": "5.693e-01", "epoch": 0.09291} {"step": 46460, "loss": 1.1564, "grad_norm": "3.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.238e+00", "dlm_acc": "5.006e-01", "anc_acc": "4.795e-01", "epoch": 0.09292} {"step": 46465, "loss": 0.8399, "grad_norm": "1.909e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.586e-01", "anc_loss": "9.422e-01", "dlm_acc": "5.671e-01", "anc_acc": "5.483e-01", "epoch": 0.09293} {"step": 46470, "loss": 1.0934, "grad_norm": "4.056e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.148e-01", "anc_loss": "7.434e-01", "dlm_acc": "7.263e-01", "anc_acc": "6.859e-01", "epoch": 0.09294} {"step": 46475, "loss": 1.0498, "grad_norm": "1.086e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.535e-01", "anc_loss": "8.438e-01", "dlm_acc": "6.550e-01", "anc_acc": "6.267e-01", "epoch": 0.09295} {"step": 46480, "loss": 1.3666, "grad_norm": "4.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.258e-01", "anc_loss": "7.727e-01", "dlm_acc": "5.571e-01", "anc_acc": "5.360e-01", "epoch": 0.09296} {"step": 46485, "loss": 1.1969, "grad_norm": "3.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.086e-01", "anc_loss": "8.172e-01", "dlm_acc": "3.714e-01", "anc_acc": "3.663e-01", "epoch": 0.09297} {"step": 46490, "loss": 1.0889, "grad_norm": "2.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.875e-01", "anc_loss": "1.038e+00", "dlm_acc": "4.506e-01", "anc_acc": "4.354e-01", "epoch": 0.09298} {"step": 46495, "loss": 1.4525, "grad_norm": "3.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.502e+00", "anc_loss": "1.613e+00", "dlm_acc": "4.916e-01", "anc_acc": "4.636e-01", "epoch": 0.09299} {"step": 46500, "loss": 1.1701, "grad_norm": "3.027e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.328e-01", "anc_loss": "7.578e-01", "dlm_acc": "4.696e-01", "anc_acc": "4.551e-01", "epoch": 0.093} {"step": 46505, "loss": 0.9196, "grad_norm": "3.710e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.074e-01", "anc_loss": "7.973e-01", "dlm_acc": "5.924e-01", "anc_acc": "5.561e-01", "epoch": 0.09301} {"step": 46510, "loss": 1.1007, "grad_norm": "3.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.641e-01", "anc_loss": "9.723e-01", "dlm_acc": "6.407e-01", "anc_acc": "6.000e-01", "epoch": 0.09302} {"step": 46515, "loss": 1.1856, "grad_norm": "4.140e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.281e-01", "anc_loss": "9.227e-01", "dlm_acc": "5.407e-01", "anc_acc": "5.165e-01", "epoch": 0.09303} {"step": 46520, "loss": 1.1049, "grad_norm": "2.928e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.453e-01", "anc_loss": "9.102e-01", "dlm_acc": "5.866e-01", "anc_acc": "5.612e-01", "epoch": 0.09304} {"step": 46525, "loss": 0.9126, "grad_norm": "2.751e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.129e-01", "anc_loss": "5.344e-01", "dlm_acc": "6.633e-01", "anc_acc": "6.550e-01", "epoch": 0.09305} {"step": 46530, "loss": 0.8524, "grad_norm": "2.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.662e-01", "anc_loss": "7.664e-01", "dlm_acc": "7.013e-01", "anc_acc": "6.706e-01", "epoch": 0.09306} {"step": 46535, "loss": 1.2848, "grad_norm": "5.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.632e-01", "anc_acc": "5.303e-01", "epoch": 0.09307} {"step": 46540, "loss": 1.0305, "grad_norm": "7.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.418e-01", "anc_loss": "1.013e+00", "dlm_acc": "7.011e-01", "anc_acc": "6.828e-01", "epoch": 0.09308} {"step": 46545, "loss": 1.3409, "grad_norm": "4.649e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.498e+00", "anc_loss": "1.623e+00", "dlm_acc": "5.276e-01", "anc_acc": "5.010e-01", "epoch": 0.09309} {"step": 46550, "loss": 1.0721, "grad_norm": "3.399e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.602e-01", "anc_loss": "1.077e+00", "dlm_acc": "5.950e-01", "anc_acc": "5.581e-01", "epoch": 0.0931} {"step": 46555, "loss": 1.1317, "grad_norm": "2.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.942e-01", "anc_loss": "6.998e-01", "dlm_acc": "7.712e-01", "anc_acc": "7.378e-01", "epoch": 0.09311} {"step": 46560, "loss": 1.2477, "grad_norm": "4.149e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.225e+00", "dlm_acc": "5.377e-01", "anc_acc": "5.087e-01", "epoch": 0.09312} {"step": 46565, "loss": 1.0402, "grad_norm": "1.506e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.441e-01", "anc_loss": "1.038e+00", "dlm_acc": "5.872e-01", "anc_acc": "5.640e-01", "epoch": 0.09313} {"step": 46570, "loss": 1.418, "grad_norm": "4.492e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.664e-01", "anc_loss": "1.061e+00", "dlm_acc": "6.194e-01", "anc_acc": "5.997e-01", "epoch": 0.09314} {"step": 46575, "loss": 1.3792, "grad_norm": "3.727e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.371e-01", "anc_loss": "7.715e-01", "dlm_acc": "7.676e-01", "anc_acc": "7.306e-01", "epoch": 0.09315} {"step": 46580, "loss": 1.0327, "grad_norm": "4.459e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.672e-01", "anc_loss": "1.113e+00", "dlm_acc": "6.690e-01", "anc_acc": "6.342e-01", "epoch": 0.09316} {"step": 46585, "loss": 1.3979, "grad_norm": "3.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.812e-01", "anc_loss": "9.773e-01", "dlm_acc": "5.633e-01", "anc_acc": "5.340e-01", "epoch": 0.09317} {"step": 46590, "loss": 1.3429, "grad_norm": "4.786e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.157e+00", "dlm_acc": "6.269e-01", "anc_acc": "6.029e-01", "epoch": 0.09318} {"step": 46595, "loss": 0.844, "grad_norm": "7.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.893e-01", "anc_loss": "7.920e-01", "dlm_acc": "7.094e-01", "anc_acc": "6.753e-01", "epoch": 0.09319} {"step": 46600, "loss": 1.0573, "grad_norm": "4.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.186e+00", "anc_loss": "1.261e+00", "dlm_acc": "5.602e-01", "anc_acc": "5.378e-01", "epoch": 0.0932} {"step": 46605, "loss": 1.5216, "grad_norm": "2.488e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.560e-01", "anc_loss": "7.020e-01", "dlm_acc": "8.289e-01", "anc_acc": "7.810e-01", "epoch": 0.09321} {"step": 46610, "loss": 1.1516, "grad_norm": "3.224e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.840e-01", "anc_loss": "9.875e-01", "dlm_acc": "6.320e-01", "anc_acc": "6.033e-01", "epoch": 0.09322} {"step": 46615, "loss": 0.9016, "grad_norm": "1.584e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.945e-01", "anc_loss": "9.988e-01", "dlm_acc": "6.550e-01", "anc_acc": "6.237e-01", "epoch": 0.09323} {"step": 46620, "loss": 1.1513, "grad_norm": "1.741e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.279e+00", "dlm_acc": "5.840e-01", "anc_acc": "5.569e-01", "epoch": 0.09324} {"step": 46625, "loss": 1.0326, "grad_norm": "1.404e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.768e-01", "anc_loss": "8.875e-01", "dlm_acc": "6.756e-01", "anc_acc": "6.422e-01", "epoch": 0.09325} {"step": 46630, "loss": 1.1568, "grad_norm": "2.518e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.163e+00", "dlm_acc": "6.206e-01", "anc_acc": "5.878e-01", "epoch": 0.09326} {"step": 46635, "loss": 1.0301, "grad_norm": "3.019e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.165e+00", "dlm_acc": "6.327e-01", "anc_acc": "5.991e-01", "epoch": 0.09327} {"step": 46640, "loss": 1.1752, "grad_norm": "2.248e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.405e+00", "anc_loss": "1.523e+00", "dlm_acc": "5.250e-01", "anc_acc": "4.974e-01", "epoch": 0.09328} {"step": 46645, "loss": 1.2227, "grad_norm": "4.335e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.088e+00", "anc_loss": "1.230e+00", "dlm_acc": "6.363e-01", "anc_acc": "6.030e-01", "epoch": 0.09329} {"step": 46650, "loss": 1.2424, "grad_norm": "3.162e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.372e+00", "dlm_acc": "5.675e-01", "anc_acc": "5.388e-01", "epoch": 0.0933} {"step": 46655, "loss": 1.1858, "grad_norm": "4.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.141e+00", "anc_loss": "1.251e+00", "dlm_acc": "6.143e-01", "anc_acc": "5.877e-01", "epoch": 0.09331} {"step": 46660, "loss": 1.3038, "grad_norm": "3.151e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.304e+00", "anc_loss": "1.431e+00", "dlm_acc": "6.001e-01", "anc_acc": "5.691e-01", "epoch": 0.09332} {"step": 46665, "loss": 1.795, "grad_norm": "3.656e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.577e+00", "anc_loss": "1.722e+00", "dlm_acc": "5.173e-01", "anc_acc": "4.840e-01", "epoch": 0.09333} {"step": 46670, "loss": 1.0345, "grad_norm": "1.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.262e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.524e-01", "anc_acc": "5.227e-01", "epoch": 0.09334} {"step": 46675, "loss": 1.3123, "grad_norm": "2.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.410e+00", "anc_loss": "1.552e+00", "dlm_acc": "5.414e-01", "anc_acc": "5.062e-01", "epoch": 0.09335} {"step": 46680, "loss": 1.3206, "grad_norm": "5.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.354e+00", "anc_loss": "1.463e+00", "dlm_acc": "5.343e-01", "anc_acc": "5.080e-01", "epoch": 0.09336} {"step": 46685, "loss": 1.2846, "grad_norm": "1.725e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.267e+00", "dlm_acc": "6.034e-01", "anc_acc": "5.631e-01", "epoch": 0.09337} {"step": 46690, "loss": 1.1229, "grad_norm": "3.702e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.339e-01", "anc_loss": "7.002e-01", "dlm_acc": "6.352e-01", "anc_acc": "6.089e-01", "epoch": 0.09338} {"step": 46695, "loss": 1.1012, "grad_norm": "2.658e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.523e-02", "anc_loss": "5.190e-02", "dlm_acc": "9.805e-01", "anc_acc": "9.703e-01", "epoch": 0.09339} {"step": 46700, "loss": 1.1226, "grad_norm": "2.901e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.524e-01", "anc_loss": "5.031e-01", "dlm_acc": "8.087e-01", "anc_acc": "7.840e-01", "epoch": 0.0934} {"step": 46705, "loss": 1.1025, "grad_norm": "5.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.859e-01", "anc_loss": "8.578e-01", "dlm_acc": "6.216e-01", "anc_acc": "5.963e-01", "epoch": 0.09341} {"step": 46710, "loss": 1.124, "grad_norm": "2.001e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.288e+00", "anc_loss": "1.393e+00", "dlm_acc": "5.355e-01", "anc_acc": "5.135e-01", "epoch": 0.09342} {"step": 46715, "loss": 1.0212, "grad_norm": "4.494e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.836e-01", "anc_loss": "9.148e-01", "dlm_acc": "5.024e-01", "anc_acc": "4.933e-01", "epoch": 0.09343} {"step": 46720, "loss": 1.0739, "grad_norm": "2.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.805e-01", "anc_loss": "7.078e-01", "dlm_acc": "5.408e-01", "anc_acc": "5.276e-01", "epoch": 0.09344} {"step": 46725, "loss": 1.089, "grad_norm": "4.282e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.734e-01", "anc_loss": "9.078e-01", "dlm_acc": "5.206e-01", "anc_acc": "5.095e-01", "epoch": 0.09345} {"step": 46730, "loss": 1.0804, "grad_norm": "2.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.805e-01", "anc_loss": "8.352e-01", "dlm_acc": "6.297e-01", "anc_acc": "6.137e-01", "epoch": 0.09346} {"step": 46735, "loss": 0.8985, "grad_norm": "5.939e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.735e-01", "anc_loss": "3.016e-01", "dlm_acc": "8.531e-01", "anc_acc": "8.434e-01", "epoch": 0.09347} {"step": 46740, "loss": 1.0606, "grad_norm": "4.703e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.145e-01", "anc_loss": "6.297e-01", "dlm_acc": "5.514e-01", "anc_acc": "5.448e-01", "epoch": 0.09348} {"step": 46745, "loss": 1.0737, "grad_norm": "3.113e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.922e-01", "anc_loss": "8.766e-01", "dlm_acc": "6.373e-01", "anc_acc": "6.128e-01", "epoch": 0.09349} {"step": 46750, "loss": 1.2163, "grad_norm": "2.906e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.855e-01", "anc_loss": "7.527e-01", "dlm_acc": "5.960e-01", "anc_acc": "5.696e-01", "epoch": 0.0935} {"step": 46755, "loss": 1.4419, "grad_norm": "5.068e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.050e+00", "anc_loss": "1.115e+00", "dlm_acc": "5.633e-01", "anc_acc": "5.456e-01", "epoch": 0.09351} {"step": 46760, "loss": 1.035, "grad_norm": "2.809e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.164e-01", "anc_loss": "9.930e-01", "dlm_acc": "5.652e-01", "anc_acc": "5.482e-01", "epoch": 0.09352} {"step": 46765, "loss": 1.0867, "grad_norm": "4.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.212e+00", "dlm_acc": "4.963e-01", "anc_acc": "4.720e-01", "epoch": 0.09353} {"step": 46770, "loss": 0.7425, "grad_norm": "2.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.770e-01", "anc_loss": "7.910e-01", "dlm_acc": "7.744e-01", "anc_acc": "7.469e-01", "epoch": 0.09354} {"step": 46775, "loss": 1.1072, "grad_norm": "1.906e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.406e-01", "anc_loss": "7.512e-01", "dlm_acc": "7.429e-01", "anc_acc": "7.096e-01", "epoch": 0.09355} {"step": 46780, "loss": 1.3433, "grad_norm": "4.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.221e+00", "anc_loss": "1.354e+00", "dlm_acc": "5.760e-01", "anc_acc": "5.426e-01", "epoch": 0.09356} {"step": 46785, "loss": 1.4958, "grad_norm": "6.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.526e+00", "anc_loss": "1.640e+00", "dlm_acc": "4.996e-01", "anc_acc": "4.739e-01", "epoch": 0.09357} {"step": 46790, "loss": 1.2765, "grad_norm": "3.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.054e+00", "anc_loss": "1.159e+00", "dlm_acc": "6.179e-01", "anc_acc": "5.885e-01", "epoch": 0.09358} {"step": 46795, "loss": 0.9672, "grad_norm": "3.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.352e-01", "anc_loss": "1.027e+00", "dlm_acc": "5.734e-01", "anc_acc": "5.462e-01", "epoch": 0.09359} {"step": 46800, "loss": 1.0526, "grad_norm": "2.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.680e-01", "anc_loss": "9.336e-01", "dlm_acc": "5.561e-01", "anc_acc": "5.386e-01", "epoch": 0.0936} {"step": 46805, "loss": 1.0285, "grad_norm": "3.521e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.484e-01", "anc_loss": "6.004e-01", "dlm_acc": "6.590e-01", "anc_acc": "6.418e-01", "epoch": 0.09361} {"step": 46810, "loss": 1.0756, "grad_norm": "3.053e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.313e-01", "anc_loss": "9.836e-01", "dlm_acc": "5.132e-01", "anc_acc": "4.965e-01", "epoch": 0.09362} {"step": 46815, "loss": 1.2608, "grad_norm": "1.214e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.030e+00", "anc_loss": "1.055e+00", "dlm_acc": "3.561e-01", "anc_acc": "3.486e-01", "epoch": 0.09363} {"step": 46820, "loss": 0.8535, "grad_norm": "3.665e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.488e-01", "anc_loss": "4.906e-01", "dlm_acc": "6.733e-01", "anc_acc": "6.470e-01", "epoch": 0.09364} {"step": 46825, "loss": 0.8955, "grad_norm": "3.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.891e-01", "anc_loss": "6.078e-01", "dlm_acc": "5.463e-01", "anc_acc": "5.357e-01", "epoch": 0.09365} {"step": 46830, "loss": 1.1182, "grad_norm": "2.939e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.305e-01", "anc_loss": "7.445e-01", "dlm_acc": "4.543e-01", "anc_acc": "4.478e-01", "epoch": 0.09366} {"step": 46835, "loss": 1.1897, "grad_norm": "3.288e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.453e-01", "anc_loss": "8.602e-01", "dlm_acc": "4.597e-01", "anc_acc": "4.544e-01", "epoch": 0.09367} {"step": 46840, "loss": 0.9447, "grad_norm": "3.558e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.516e-01", "anc_loss": "6.633e-01", "dlm_acc": "4.541e-01", "anc_acc": "4.464e-01", "epoch": 0.09368} {"step": 46845, "loss": 1.3423, "grad_norm": "3.913e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.445e-01", "anc_loss": "7.602e-01", "dlm_acc": "4.650e-01", "anc_acc": "4.556e-01", "epoch": 0.09369} {"step": 46850, "loss": 1.1606, "grad_norm": "3.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.836e-01", "anc_loss": "7.965e-01", "dlm_acc": "4.685e-01", "anc_acc": "4.639e-01", "epoch": 0.0937} {"step": 46855, "loss": 0.8366, "grad_norm": "2.992e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.318e-01", "anc_loss": "7.934e-01", "dlm_acc": "6.478e-01", "anc_acc": "6.301e-01", "epoch": 0.09371} {"step": 46860, "loss": 0.8934, "grad_norm": "5.152e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.262e-01", "anc_loss": "9.223e-01", "dlm_acc": "6.291e-01", "anc_acc": "5.963e-01", "epoch": 0.09372} {"step": 46865, "loss": 0.8204, "grad_norm": "5.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.512e-01", "anc_loss": "6.789e-01", "dlm_acc": "5.343e-01", "anc_acc": "5.149e-01", "epoch": 0.09373} {"step": 46870, "loss": 1.0793, "grad_norm": "3.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.797e-01", "anc_loss": "7.117e-01", "dlm_acc": "5.249e-01", "anc_acc": "5.084e-01", "epoch": 0.09374} {"step": 46875, "loss": 0.8603, "grad_norm": "3.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.867e-01", "anc_loss": "6.266e-01", "dlm_acc": "5.621e-01", "anc_acc": "5.380e-01", "epoch": 0.09375} {"step": 46880, "loss": 1.079, "grad_norm": "3.182e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.492e-01", "anc_loss": "7.039e-01", "dlm_acc": "5.764e-01", "anc_acc": "5.463e-01", "epoch": 0.09376} {"step": 46885, "loss": 1.1467, "grad_norm": "2.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.562e-01", "anc_loss": "5.109e-01", "dlm_acc": "6.237e-01", "anc_acc": "5.792e-01", "epoch": 0.09377} {"step": 46890, "loss": 1.071, "grad_norm": "1.915e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.883e-01", "anc_loss": "5.684e-01", "dlm_acc": "6.382e-01", "anc_acc": "5.778e-01", "epoch": 0.09378} {"step": 46895, "loss": 1.3096, "grad_norm": "2.164e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.286e+00", "dlm_acc": "5.578e-01", "anc_acc": "5.236e-01", "epoch": 0.09379} {"step": 46900, "loss": 1.2585, "grad_norm": "3.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.009e+00", "anc_loss": "1.117e+00", "dlm_acc": "6.195e-01", "anc_acc": "5.915e-01", "epoch": 0.0938} {"step": 46905, "loss": 1.1205, "grad_norm": "5.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.703e-01", "anc_loss": "1.068e+00", "dlm_acc": "5.802e-01", "anc_acc": "5.517e-01", "epoch": 0.09381} {"step": 46910, "loss": 1.6414, "grad_norm": "5.187e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.138e+00", "dlm_acc": "7.264e-01", "anc_acc": "7.027e-01", "epoch": 0.09382} {"step": 46915, "loss": 1.1703, "grad_norm": "1.270e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.711e-01", "anc_loss": "7.324e-01", "dlm_acc": "6.547e-01", "anc_acc": "6.334e-01", "epoch": 0.09383} {"step": 46920, "loss": 1.3891, "grad_norm": "2.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.420e+00", "anc_loss": "1.543e+00", "dlm_acc": "5.051e-01", "anc_acc": "4.764e-01", "epoch": 0.09384} {"step": 46925, "loss": 1.0669, "grad_norm": "3.971e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.617e-01", "anc_loss": "8.538e-01", "dlm_acc": "7.424e-01", "anc_acc": "7.183e-01", "epoch": 0.09385} {"step": 46930, "loss": 1.109, "grad_norm": "2.593e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.512e-01", "anc_loss": "4.758e-01", "dlm_acc": "6.668e-01", "anc_acc": "6.528e-01", "epoch": 0.09386} {"step": 46935, "loss": 1.1331, "grad_norm": "2.831e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.437e-01", "anc_loss": "4.699e-01", "dlm_acc": "6.923e-01", "anc_acc": "6.777e-01", "epoch": 0.09387} {"step": 46940, "loss": 1.2071, "grad_norm": "3.949e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.047e-01", "anc_loss": "7.375e-01", "dlm_acc": "4.943e-01", "anc_acc": "4.746e-01", "epoch": 0.09388} {"step": 46945, "loss": 1.0, "grad_norm": "2.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.934e-01", "anc_loss": "6.168e-01", "dlm_acc": "5.133e-01", "anc_acc": "4.938e-01", "epoch": 0.09389} {"step": 46950, "loss": 1.1292, "grad_norm": "2.848e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.125e-01", "anc_loss": "7.328e-01", "dlm_acc": "4.863e-01", "anc_acc": "4.734e-01", "epoch": 0.0939} {"step": 46955, "loss": 1.1503, "grad_norm": "6.838e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.320e-01", "anc_loss": "8.770e-01", "dlm_acc": "7.039e-01", "anc_acc": "6.596e-01", "epoch": 0.09391} {"step": 46960, "loss": 0.6875, "grad_norm": "2.071e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.703e-01", "anc_loss": "7.658e-01", "dlm_acc": "7.384e-01", "anc_acc": "7.103e-01", "epoch": 0.09392} {"step": 46965, "loss": 1.0709, "grad_norm": "2.460e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.242e-01", "anc_loss": "1.021e+00", "dlm_acc": "5.987e-01", "anc_acc": "5.673e-01", "epoch": 0.09393} {"step": 46970, "loss": 1.4865, "grad_norm": "6.844e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.859e-01", "anc_loss": "1.054e+00", "dlm_acc": "5.024e-01", "anc_acc": "4.755e-01", "epoch": 0.09394} {"step": 46975, "loss": 0.9128, "grad_norm": "7.925e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.005e-01", "anc_loss": "8.760e-01", "dlm_acc": "7.347e-01", "anc_acc": "7.151e-01", "epoch": 0.09395} {"step": 46980, "loss": 0.8138, "grad_norm": "4.647e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.880e-02", "anc_loss": "8.303e-02", "dlm_acc": "9.688e-01", "anc_acc": "9.638e-01", "epoch": 0.09396} {"step": 46985, "loss": 1.2111, "grad_norm": "3.625e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.042e+00", "anc_loss": "1.148e+00", "dlm_acc": "5.478e-01", "anc_acc": "5.149e-01", "epoch": 0.09397} {"step": 46990, "loss": 1.1341, "grad_norm": "3.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.881e-01", "anc_loss": "5.781e-01", "dlm_acc": "7.047e-01", "anc_acc": "6.672e-01", "epoch": 0.09398} {"step": 46995, "loss": 1.2189, "grad_norm": "2.985e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.945e-01", "anc_loss": "8.453e-01", "dlm_acc": "5.822e-01", "anc_acc": "5.597e-01", "epoch": 0.09399} {"step": 47000, "loss": 1.1602, "grad_norm": "3.489e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.242e-01", "anc_loss": "7.840e-01", "dlm_acc": "6.262e-01", "anc_acc": "6.053e-01", "epoch": 0.094} {"step": 47005, "loss": 0.9231, "grad_norm": "4.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.012e-01", "anc_loss": "1.003e+00", "dlm_acc": "6.228e-01", "anc_acc": "5.946e-01", "epoch": 0.09401} {"step": 47010, "loss": 1.1795, "grad_norm": "3.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.813e-01", "anc_loss": "5.371e-01", "dlm_acc": "6.935e-01", "anc_acc": "6.619e-01", "epoch": 0.09402} {"step": 47015, "loss": 0.8964, "grad_norm": "5.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.381e-01", "anc_loss": "1.029e+00", "dlm_acc": "5.887e-01", "anc_acc": "5.618e-01", "epoch": 0.09403} {"step": 47020, "loss": 1.0611, "grad_norm": "4.117e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.006e+00", "anc_loss": "1.077e+00", "dlm_acc": "6.508e-01", "anc_acc": "6.337e-01", "epoch": 0.09404} {"step": 47025, "loss": 0.4806, "grad_norm": "3.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.953e-01", "anc_loss": "6.418e-01", "dlm_acc": "4.611e-01", "anc_acc": "4.267e-01", "epoch": 0.09405} {"step": 47030, "loss": 1.085, "grad_norm": "3.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.805e-01", "anc_loss": "9.297e-01", "dlm_acc": "4.003e-01", "anc_acc": "3.686e-01", "epoch": 0.09406} {"step": 47035, "loss": 0.8724, "grad_norm": "3.890e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.656e-01", "anc_loss": "8.219e-01", "dlm_acc": "4.363e-01", "anc_acc": "3.983e-01", "epoch": 0.09407} {"step": 47040, "loss": 0.8369, "grad_norm": "2.758e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.602e-01", "anc_loss": "8.289e-01", "dlm_acc": "4.607e-01", "anc_acc": "4.164e-01", "epoch": 0.09408} {"step": 47045, "loss": 0.8139, "grad_norm": "2.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.547e-01", "anc_loss": "8.359e-01", "dlm_acc": "4.999e-01", "anc_acc": "4.585e-01", "epoch": 0.09409} {"step": 47050, "loss": 0.7608, "grad_norm": "4.562e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.101e+00", "anc_loss": "1.218e+00", "dlm_acc": "6.023e-01", "anc_acc": "5.797e-01", "epoch": 0.0941} {"step": 47055, "loss": 0.9186, "grad_norm": "4.866e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.379e-01", "anc_loss": "7.602e-01", "dlm_acc": "7.124e-01", "anc_acc": "6.704e-01", "epoch": 0.09411} {"step": 47060, "loss": 0.8703, "grad_norm": "3.533e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.184e-01", "anc_loss": "1.042e+00", "dlm_acc": "6.194e-01", "anc_acc": "5.796e-01", "epoch": 0.09412} {"step": 47065, "loss": 1.0958, "grad_norm": "5.861e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.174e-01", "anc_loss": "7.937e-01", "dlm_acc": "7.246e-01", "anc_acc": "7.015e-01", "epoch": 0.09413} {"step": 47070, "loss": 1.4058, "grad_norm": "4.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.055e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.341e-01", "anc_acc": "6.034e-01", "epoch": 0.09414} {"step": 47075, "loss": 0.8943, "grad_norm": "2.798e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.013e+00", "anc_loss": "1.130e+00", "dlm_acc": "6.534e-01", "anc_acc": "6.239e-01", "epoch": 0.09415} {"step": 47080, "loss": 1.4053, "grad_norm": "9.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.374e+00", "dlm_acc": "5.726e-01", "anc_acc": "5.432e-01", "epoch": 0.09416} {"step": 47085, "loss": 1.1318, "grad_norm": "3.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.893e-01", "anc_loss": "2.083e-01", "dlm_acc": "8.840e-01", "anc_acc": "8.735e-01", "epoch": 0.09417} {"step": 47090, "loss": 1.0251, "grad_norm": "3.141e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.959e-02", "anc_loss": "7.595e-02", "dlm_acc": "9.511e-01", "anc_acc": "9.489e-01", "epoch": 0.09418} {"step": 47095, "loss": 0.9799, "grad_norm": "4.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.866e-02", "anc_loss": "5.552e-02", "dlm_acc": "9.839e-01", "anc_acc": "9.825e-01", "epoch": 0.09419} {"step": 47100, "loss": 1.3412, "grad_norm": "3.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.151e+00", "anc_loss": "1.250e+00", "dlm_acc": "5.988e-01", "anc_acc": "5.745e-01", "epoch": 0.0942} {"step": 47105, "loss": 0.997, "grad_norm": "2.187e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.996e-01", "anc_loss": "9.023e-01", "dlm_acc": "6.497e-01", "anc_acc": "6.085e-01", "epoch": 0.09421} {"step": 47110, "loss": 1.09, "grad_norm": "2.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e+00", "anc_loss": "1.243e+00", "dlm_acc": "6.140e-01", "anc_acc": "5.883e-01", "epoch": 0.09422} {"step": 47115, "loss": 0.9719, "grad_norm": "4.669e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.202e+00", "anc_loss": "1.336e+00", "dlm_acc": "5.910e-01", "anc_acc": "5.589e-01", "epoch": 0.09423} {"step": 47120, "loss": 1.2105, "grad_norm": "1.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.653e+00", "anc_loss": "1.783e+00", "dlm_acc": "4.717e-01", "anc_acc": "4.435e-01", "epoch": 0.09424} {"step": 47125, "loss": 0.8332, "grad_norm": "2.664e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.313e-01", "anc_loss": "9.047e-01", "dlm_acc": "6.164e-01", "anc_acc": "5.964e-01", "epoch": 0.09425} {"step": 47130, "loss": 1.1281, "grad_norm": "7.165e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.812e-01", "anc_loss": "7.875e-01", "dlm_acc": "5.511e-01", "anc_acc": "5.489e-01", "epoch": 0.09426} {"step": 47135, "loss": 0.7645, "grad_norm": "2.095e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.469e-01", "anc_loss": "7.527e-01", "dlm_acc": "5.526e-01", "anc_acc": "5.512e-01", "epoch": 0.09427} {"step": 47140, "loss": 0.6166, "grad_norm": "1.742e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.508e-01", "anc_loss": "6.570e-01", "dlm_acc": "5.679e-01", "anc_acc": "5.645e-01", "epoch": 0.09428} {"step": 47145, "loss": 1.114, "grad_norm": "1.090e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.309e+00", "dlm_acc": "4.773e-01", "anc_acc": "4.662e-01", "epoch": 0.09429} {"step": 47150, "loss": 0.9239, "grad_norm": "1.116e+00", "learning_rate": "1.000e-04", "dlm_loss": "7.406e-01", "anc_loss": "7.586e-01", "dlm_acc": "5.160e-01", "anc_acc": "5.089e-01", "epoch": 0.0943} {"step": 47155, "loss": 0.9639, "grad_norm": "3.099e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.145e-01", "anc_loss": "6.285e-01", "dlm_acc": "5.464e-01", "anc_acc": "5.374e-01", "epoch": 0.09431} {"step": 47160, "loss": 0.93, "grad_norm": "3.848e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.465e-01", "anc_loss": "5.609e-01", "dlm_acc": "5.664e-01", "anc_acc": "5.576e-01", "epoch": 0.09432} {"step": 47165, "loss": 0.73, "grad_norm": "3.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.555e-01", "anc_loss": "5.684e-01", "dlm_acc": "5.679e-01", "anc_acc": "5.630e-01", "epoch": 0.09433} {"step": 47170, "loss": 0.8652, "grad_norm": "3.501e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.797e-01", "anc_loss": "5.926e-01", "dlm_acc": "5.659e-01", "anc_acc": "5.588e-01", "epoch": 0.09434} {"step": 47175, "loss": 0.7585, "grad_norm": "3.035e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.145e-01", "anc_loss": "7.504e-01", "dlm_acc": "5.571e-01", "anc_acc": "5.460e-01", "epoch": 0.09435} {"step": 47180, "loss": 1.1852, "grad_norm": "2.781e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.032e+00", "anc_loss": "1.132e+00", "dlm_acc": "5.372e-01", "anc_acc": "5.110e-01", "epoch": 0.09436} {"step": 47185, "loss": 1.0129, "grad_norm": "3.290e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.133e-01", "anc_loss": "1.034e+00", "dlm_acc": "6.584e-01", "anc_acc": "6.274e-01", "epoch": 0.09437} {"step": 47190, "loss": 1.2603, "grad_norm": "2.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.081e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.760e-01", "anc_acc": "6.515e-01", "epoch": 0.09438} {"step": 47195, "loss": 0.9756, "grad_norm": "2.678e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.355e-01", "anc_loss": "7.348e-01", "dlm_acc": "7.399e-01", "anc_acc": "7.031e-01", "epoch": 0.09439} {"step": 47200, "loss": 0.8341, "grad_norm": "2.148e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.258e-01", "anc_loss": "4.789e-01", "dlm_acc": "7.098e-01", "anc_acc": "6.836e-01", "epoch": 0.0944} {"step": 47205, "loss": 1.3062, "grad_norm": "3.476e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.389e+00", "dlm_acc": "5.333e-01", "anc_acc": "5.019e-01", "epoch": 0.09441} {"step": 47210, "loss": 1.3441, "grad_norm": "3.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.123e-01", "anc_loss": "9.109e-01", "dlm_acc": "7.210e-01", "anc_acc": "6.961e-01", "epoch": 0.09442} {"step": 47215, "loss": 0.7751, "grad_norm": "1.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.339e-02", "anc_loss": "2.848e-02", "dlm_acc": "9.851e-01", "anc_acc": "9.831e-01", "epoch": 0.09443} {"step": 47220, "loss": 1.1259, "grad_norm": "3.851e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.295e+00", "dlm_acc": "6.283e-01", "anc_acc": "5.931e-01", "epoch": 0.09444} {"step": 47225, "loss": 1.2157, "grad_norm": "5.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.146e+00", "dlm_acc": "5.450e-01", "anc_acc": "5.170e-01", "epoch": 0.09445} {"step": 47230, "loss": 1.5618, "grad_norm": "3.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.321e+00", "dlm_acc": "5.493e-01", "anc_acc": "5.242e-01", "epoch": 0.09446} {"step": 47235, "loss": 1.2561, "grad_norm": "2.595e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.307e+00", "anc_loss": "1.422e+00", "dlm_acc": "5.456e-01", "anc_acc": "5.202e-01", "epoch": 0.09447} {"step": 47240, "loss": 1.4894, "grad_norm": "4.797e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.345e+00", "anc_loss": "1.455e+00", "dlm_acc": "5.442e-01", "anc_acc": "5.179e-01", "epoch": 0.09448} {"step": 47245, "loss": 1.0036, "grad_norm": "2.074e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.658e-01", "anc_loss": "8.626e-01", "dlm_acc": "7.266e-01", "anc_acc": "7.004e-01", "epoch": 0.09449} {"step": 47250, "loss": 1.3551, "grad_norm": "5.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.598e-01", "anc_loss": "4.488e-01", "dlm_acc": "8.103e-01", "anc_acc": "7.709e-01", "epoch": 0.0945} {"step": 47255, "loss": 1.2395, "grad_norm": "2.863e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.017e+00", "anc_loss": "1.135e+00", "dlm_acc": "6.580e-01", "anc_acc": "6.322e-01", "epoch": 0.09451} {"step": 47260, "loss": 0.8064, "grad_norm": "2.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.746e-01", "anc_loss": "4.193e-01", "dlm_acc": "8.489e-01", "anc_acc": "8.361e-01", "epoch": 0.09452} {"step": 47265, "loss": 1.0311, "grad_norm": "2.701e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.905e-01", "anc_loss": "1.109e+00", "dlm_acc": "6.860e-01", "anc_acc": "6.579e-01", "epoch": 0.09453} {"step": 47270, "loss": 0.6697, "grad_norm": "9.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e-01", "anc_loss": "1.219e-01", "dlm_acc": "9.545e-01", "anc_acc": "9.489e-01", "epoch": 0.09454} {"step": 47275, "loss": 0.8385, "grad_norm": "1.688e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.594e-01", "anc_loss": "2.058e-01", "dlm_acc": "9.345e-01", "anc_acc": "9.142e-01", "epoch": 0.09455} {"step": 47280, "loss": 1.0054, "grad_norm": "3.929e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.524e-01", "anc_loss": "1.043e+00", "dlm_acc": "6.818e-01", "anc_acc": "6.597e-01", "epoch": 0.09456} {"step": 47285, "loss": 0.98, "grad_norm": "2.678e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.829e-01", "anc_loss": "7.936e-01", "dlm_acc": "7.641e-01", "anc_acc": "7.365e-01", "epoch": 0.09457} {"step": 47290, "loss": 0.9064, "grad_norm": "3.413e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.973e-01", "anc_loss": "8.887e-01", "dlm_acc": "6.724e-01", "anc_acc": "6.455e-01", "epoch": 0.09458} {"step": 47295, "loss": 1.0558, "grad_norm": "3.064e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.042e-01", "anc_loss": "7.744e-01", "dlm_acc": "7.205e-01", "anc_acc": "7.027e-01", "epoch": 0.09459} {"step": 47300, "loss": 1.1745, "grad_norm": "2.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.296e+00", "dlm_acc": "5.926e-01", "anc_acc": "5.640e-01", "epoch": 0.0946} {"step": 47305, "loss": 0.8628, "grad_norm": "2.663e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.567e-01", "anc_loss": "6.168e-01", "dlm_acc": "7.499e-01", "anc_acc": "7.301e-01", "epoch": 0.09461} {"step": 47310, "loss": 1.4592, "grad_norm": "5.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.665e-01", "anc_loss": "2.996e-01", "dlm_acc": "8.881e-01", "anc_acc": "8.790e-01", "epoch": 0.09462} {"step": 47315, "loss": 1.3627, "grad_norm": "4.115e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.182e+00", "anc_loss": "1.284e+00", "dlm_acc": "5.881e-01", "anc_acc": "5.671e-01", "epoch": 0.09463} {"step": 47320, "loss": 1.1592, "grad_norm": "1.588e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.758e-01", "anc_loss": "7.391e-01", "dlm_acc": "7.153e-01", "anc_acc": "6.908e-01", "epoch": 0.09464} {"step": 47325, "loss": 0.8359, "grad_norm": "2.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.736e-01", "anc_loss": "5.621e-01", "dlm_acc": "7.529e-01", "anc_acc": "7.192e-01", "epoch": 0.09465} {"step": 47330, "loss": 1.003, "grad_norm": "2.089e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.438e-01", "anc_loss": "7.250e-01", "dlm_acc": "7.006e-01", "anc_acc": "6.812e-01", "epoch": 0.09466} {"step": 47335, "loss": 1.3996, "grad_norm": "5.953e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.572e+00", "anc_loss": "1.714e+00", "dlm_acc": "4.951e-01", "anc_acc": "4.655e-01", "epoch": 0.09467} {"step": 47340, "loss": 0.823, "grad_norm": "2.174e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.891e-01", "anc_loss": "5.293e-01", "dlm_acc": "7.451e-01", "anc_acc": "7.334e-01", "epoch": 0.09468} {"step": 47345, "loss": 1.3139, "grad_norm": "5.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.971e-01", "anc_loss": "1.095e+00", "dlm_acc": "6.373e-01", "anc_acc": "6.151e-01", "epoch": 0.09469} {"step": 47350, "loss": 1.2718, "grad_norm": "2.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.895e-01", "anc_loss": "6.438e-01", "dlm_acc": "7.419e-01", "anc_acc": "7.267e-01", "epoch": 0.0947} {"step": 47355, "loss": 0.8427, "grad_norm": "2.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.472e-01", "anc_loss": "2.929e-01", "dlm_acc": "8.605e-01", "anc_acc": "8.378e-01", "epoch": 0.09471} {"step": 47360, "loss": 1.0958, "grad_norm": "2.441e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.072e+00", "dlm_acc": "4.880e-01", "anc_acc": "4.716e-01", "epoch": 0.09472} {"step": 47365, "loss": 1.3226, "grad_norm": "6.817e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.052e+00", "anc_loss": "1.110e+00", "dlm_acc": "4.859e-01", "anc_acc": "4.719e-01", "epoch": 0.09473} {"step": 47370, "loss": 0.9854, "grad_norm": "2.075e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.570e-01", "anc_loss": "3.785e-01", "dlm_acc": "7.689e-01", "anc_acc": "7.598e-01", "epoch": 0.09474} {"step": 47375, "loss": 1.4946, "grad_norm": "2.367e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.078e+00", "anc_loss": "1.183e+00", "dlm_acc": "6.456e-01", "anc_acc": "6.248e-01", "epoch": 0.09475} {"step": 47380, "loss": 1.3569, "grad_norm": "5.046e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.813e-01", "anc_loss": "1.105e+00", "dlm_acc": "6.690e-01", "anc_acc": "6.398e-01", "epoch": 0.09476} {"step": 47385, "loss": 0.6621, "grad_norm": "1.875e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.187e-01", "anc_loss": "1.341e-01", "dlm_acc": "9.384e-01", "anc_acc": "9.319e-01", "epoch": 0.09477} {"step": 47390, "loss": 0.8167, "grad_norm": "3.965e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e-01", "anc_loss": "1.213e-01", "dlm_acc": "9.423e-01", "anc_acc": "9.350e-01", "epoch": 0.09478} {"step": 47395, "loss": 0.7268, "grad_norm": "2.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.301e-01", "anc_loss": "2.549e-01", "dlm_acc": "8.655e-01", "anc_acc": "8.530e-01", "epoch": 0.09479} {"step": 47400, "loss": 0.9225, "grad_norm": "2.435e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.020e-01", "anc_loss": "6.680e-01", "dlm_acc": "7.500e-01", "anc_acc": "7.331e-01", "epoch": 0.0948} {"step": 47405, "loss": 0.9587, "grad_norm": "3.651e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.477e-01", "anc_loss": "7.117e-01", "dlm_acc": "7.755e-01", "anc_acc": "7.246e-01", "epoch": 0.09481} {"step": 47410, "loss": 1.0627, "grad_norm": "2.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.132e+00", "anc_loss": "1.262e+00", "dlm_acc": "5.402e-01", "anc_acc": "5.247e-01", "epoch": 0.09482} {"step": 47415, "loss": 1.0262, "grad_norm": "2.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.586e-01", "anc_loss": "1.064e+00", "dlm_acc": "6.278e-01", "anc_acc": "5.993e-01", "epoch": 0.09483} {"step": 47420, "loss": 1.1048, "grad_norm": "2.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.033e-01", "anc_loss": "9.916e-01", "dlm_acc": "6.607e-01", "anc_acc": "6.355e-01", "epoch": 0.09484} {"step": 47425, "loss": 1.1999, "grad_norm": "2.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.484e+00", "anc_loss": "1.616e+00", "dlm_acc": "5.094e-01", "anc_acc": "4.805e-01", "epoch": 0.09485} {"step": 47430, "loss": 0.9279, "grad_norm": "2.230e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.123e+00", "anc_loss": "1.232e+00", "dlm_acc": "5.532e-01", "anc_acc": "5.210e-01", "epoch": 0.09486} {"step": 47435, "loss": 1.164, "grad_norm": "2.304e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.429e+00", "dlm_acc": "5.660e-01", "anc_acc": "5.336e-01", "epoch": 0.09487} {"step": 47440, "loss": 1.0144, "grad_norm": "2.422e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.120e+00", "anc_loss": "1.234e+00", "dlm_acc": "6.184e-01", "anc_acc": "5.960e-01", "epoch": 0.09488} {"step": 47445, "loss": 1.1375, "grad_norm": "3.988e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.382e+00", "anc_loss": "1.506e+00", "dlm_acc": "5.578e-01", "anc_acc": "5.335e-01", "epoch": 0.09489} {"step": 47450, "loss": 1.289, "grad_norm": "3.672e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.373e+00", "anc_loss": "1.497e+00", "dlm_acc": "5.436e-01", "anc_acc": "5.111e-01", "epoch": 0.0949} {"step": 47455, "loss": 1.2984, "grad_norm": "5.615e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.426e+00", "anc_loss": "1.572e+00", "dlm_acc": "5.388e-01", "anc_acc": "5.055e-01", "epoch": 0.09491} {"step": 47460, "loss": 1.0987, "grad_norm": "3.446e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.396e-01", "anc_acc": "5.059e-01", "epoch": 0.09492} {"step": 47465, "loss": 1.2756, "grad_norm": "5.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.455e+00", "anc_loss": "1.578e+00", "dlm_acc": "5.079e-01", "anc_acc": "4.775e-01", "epoch": 0.09493} {"step": 47470, "loss": 1.3238, "grad_norm": "3.676e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.426e-01", "anc_acc": "5.155e-01", "epoch": 0.09494} {"step": 47475, "loss": 1.1094, "grad_norm": "4.198e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.556e+00", "dlm_acc": "5.088e-01", "anc_acc": "4.788e-01", "epoch": 0.09495} {"step": 47480, "loss": 1.7008, "grad_norm": "3.433e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.567e+00", "anc_loss": "1.705e+00", "dlm_acc": "5.264e-01", "anc_acc": "4.972e-01", "epoch": 0.09496} {"step": 47485, "loss": 1.4594, "grad_norm": "2.705e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.620e+00", "anc_loss": "1.755e+00", "dlm_acc": "4.702e-01", "anc_acc": "4.399e-01", "epoch": 0.09497} {"step": 47490, "loss": 1.2866, "grad_norm": "9.522e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.452e+00", "anc_loss": "1.595e+00", "dlm_acc": "5.544e-01", "anc_acc": "5.198e-01", "epoch": 0.09498} {"step": 47495, "loss": 0.9464, "grad_norm": "8.945e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.822e-01", "anc_loss": "9.910e-01", "dlm_acc": "6.497e-01", "anc_acc": "6.216e-01", "epoch": 0.09499} {"step": 47500, "loss": 0.7834, "grad_norm": "1.213e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.778e-01", "anc_loss": "6.430e-01", "dlm_acc": "7.866e-01", "anc_acc": "7.718e-01", "epoch": 0.095} {"step": 47505, "loss": 0.7191, "grad_norm": "2.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.679e-01", "anc_loss": "7.795e-01", "dlm_acc": "7.459e-01", "anc_acc": "7.141e-01", "epoch": 0.09501} {"step": 47510, "loss": 1.1591, "grad_norm": "3.299e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.945e-01", "anc_loss": "8.656e-01", "dlm_acc": "5.950e-01", "anc_acc": "5.731e-01", "epoch": 0.09502} {"step": 47515, "loss": 1.2645, "grad_norm": "3.795e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.284e+00", "dlm_acc": "6.241e-01", "anc_acc": "5.963e-01", "epoch": 0.09503} {"step": 47520, "loss": 0.9468, "grad_norm": "5.830e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.118e-01", "anc_loss": "5.704e-01", "dlm_acc": "8.201e-01", "anc_acc": "7.996e-01", "epoch": 0.09504} {"step": 47525, "loss": 1.3373, "grad_norm": "5.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.941e-01", "anc_loss": "1.091e+00", "dlm_acc": "6.689e-01", "anc_acc": "6.492e-01", "epoch": 0.09505} {"step": 47530, "loss": 0.8913, "grad_norm": "3.276e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.652e-01", "anc_loss": "6.523e-01", "dlm_acc": "7.489e-01", "anc_acc": "7.223e-01", "epoch": 0.09506} {"step": 47535, "loss": 1.0888, "grad_norm": "2.145e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.352e-01", "anc_loss": "8.102e-01", "dlm_acc": "6.736e-01", "anc_acc": "6.575e-01", "epoch": 0.09507} {"step": 47540, "loss": 0.8226, "grad_norm": "7.376e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.156e-01", "anc_loss": "8.332e-01", "dlm_acc": "5.691e-01", "anc_acc": "5.591e-01", "epoch": 0.09508} {"step": 47545, "loss": 1.0987, "grad_norm": "7.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.551e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.464e-01", "anc_acc": "6.202e-01", "epoch": 0.09509} {"step": 47550, "loss": 1.2536, "grad_norm": "2.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.106e+00", "anc_loss": "1.227e+00", "dlm_acc": "6.644e-01", "anc_acc": "6.407e-01", "epoch": 0.0951} {"step": 47555, "loss": 1.0528, "grad_norm": "2.891e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.389e-01", "anc_loss": "4.890e-01", "dlm_acc": "8.406e-01", "anc_acc": "8.258e-01", "epoch": 0.09511} {"step": 47560, "loss": 1.1507, "grad_norm": "2.513e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.354e-01", "anc_loss": "9.123e-01", "dlm_acc": "6.831e-01", "anc_acc": "6.605e-01", "epoch": 0.09512} {"step": 47565, "loss": 0.9721, "grad_norm": "3.013e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.547e-01", "anc_loss": "7.073e-01", "dlm_acc": "6.864e-01", "anc_acc": "6.702e-01", "epoch": 0.09513} {"step": 47570, "loss": 0.8845, "grad_norm": "3.058e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.499e-01", "anc_loss": "2.650e-01", "dlm_acc": "8.349e-01", "anc_acc": "8.274e-01", "epoch": 0.09514} {"step": 47575, "loss": 1.2016, "grad_norm": "4.108e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.916e-01", "anc_loss": "7.773e-01", "dlm_acc": "7.390e-01", "anc_acc": "7.136e-01", "epoch": 0.09515} {"step": 47580, "loss": 0.8912, "grad_norm": "3.207e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.264e-01", "anc_loss": "5.699e-01", "dlm_acc": "7.780e-01", "anc_acc": "7.648e-01", "epoch": 0.09516} {"step": 47585, "loss": 0.9757, "grad_norm": "1.832e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.721e-01", "anc_loss": "8.268e-01", "dlm_acc": "7.230e-01", "anc_acc": "7.101e-01", "epoch": 0.09517} {"step": 47590, "loss": 0.6988, "grad_norm": "2.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.686e-01", "anc_loss": "2.042e-01", "dlm_acc": "9.322e-01", "anc_acc": "9.174e-01", "epoch": 0.09518} {"step": 47595, "loss": 1.1127, "grad_norm": "4.996e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.060e-02", "anc_loss": "1.053e-01", "dlm_acc": "9.628e-01", "anc_acc": "9.563e-01", "epoch": 0.09519} {"step": 47600, "loss": 1.0998, "grad_norm": "3.126e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.300e-01", "anc_loss": "6.769e-01", "dlm_acc": "7.218e-01", "anc_acc": "7.072e-01", "epoch": 0.0952} {"step": 47605, "loss": 1.0717, "grad_norm": "2.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.744e-01", "anc_loss": "9.654e-01", "dlm_acc": "6.384e-01", "anc_acc": "6.085e-01", "epoch": 0.09521} {"step": 47610, "loss": 1.1319, "grad_norm": "2.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.910e-01", "anc_loss": "1.115e+00", "dlm_acc": "6.561e-01", "anc_acc": "6.232e-01", "epoch": 0.09522} {"step": 47615, "loss": 0.9103, "grad_norm": "2.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.805e-01", "anc_loss": "9.625e-01", "dlm_acc": "6.073e-01", "anc_acc": "5.880e-01", "epoch": 0.09523} {"step": 47620, "loss": 1.0788, "grad_norm": "3.740e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.228e+00", "anc_loss": "1.371e+00", "dlm_acc": "6.102e-01", "anc_acc": "5.770e-01", "epoch": 0.09524} {"step": 47625, "loss": 1.6858, "grad_norm": "4.228e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.492e-01", "anc_loss": "1.056e+00", "dlm_acc": "6.945e-01", "anc_acc": "6.676e-01", "epoch": 0.09525} {"step": 47630, "loss": 1.0087, "grad_norm": "3.484e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.086e-01", "anc_loss": "1.027e+00", "dlm_acc": "6.582e-01", "anc_acc": "6.259e-01", "epoch": 0.09526} {"step": 47635, "loss": 1.0755, "grad_norm": "4.241e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.175e+00", "anc_loss": "1.288e+00", "dlm_acc": "6.008e-01", "anc_acc": "5.714e-01", "epoch": 0.09527} {"step": 47640, "loss": 0.8392, "grad_norm": "3.143e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.031e-01", "anc_loss": "8.762e-01", "dlm_acc": "6.352e-01", "anc_acc": "6.131e-01", "epoch": 0.09528} {"step": 47645, "loss": 0.9656, "grad_norm": "3.825e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.901e-01", "anc_loss": "4.363e-01", "dlm_acc": "8.294e-01", "anc_acc": "8.117e-01", "epoch": 0.09529} {"step": 47650, "loss": 0.8391, "grad_norm": "1.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.440e-01", "anc_loss": "4.967e-01", "dlm_acc": "7.904e-01", "anc_acc": "7.710e-01", "epoch": 0.0953} {"step": 47655, "loss": 0.7534, "grad_norm": "1.536e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.323e-01", "anc_loss": "2.502e-01", "dlm_acc": "8.334e-01", "anc_acc": "8.259e-01", "epoch": 0.09531} {"step": 47660, "loss": 0.7354, "grad_norm": "2.303e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.967e-01", "anc_loss": "4.245e-01", "dlm_acc": "7.801e-01", "anc_acc": "7.739e-01", "epoch": 0.09532} {"step": 47665, "loss": 1.6238, "grad_norm": "4.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.591e-01", "anc_loss": "9.547e-01", "dlm_acc": "7.057e-01", "anc_acc": "6.823e-01", "epoch": 0.09533} {"step": 47670, "loss": 1.4724, "grad_norm": "4.909e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.285e-01", "anc_loss": "1.020e+00", "dlm_acc": "6.618e-01", "anc_acc": "6.369e-01", "epoch": 0.09534} {"step": 47675, "loss": 1.1572, "grad_norm": "8.453e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.707e-01", "anc_loss": "1.061e+00", "dlm_acc": "6.524e-01", "anc_acc": "6.319e-01", "epoch": 0.09535} {"step": 47680, "loss": 0.9494, "grad_norm": "3.457e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.816e-01", "anc_loss": "8.666e-01", "dlm_acc": "6.712e-01", "anc_acc": "6.466e-01", "epoch": 0.09536} {"step": 47685, "loss": 1.0403, "grad_norm": "1.758e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.707e-01", "anc_loss": "1.066e+00", "dlm_acc": "6.210e-01", "anc_acc": "5.946e-01", "epoch": 0.09537} {"step": 47690, "loss": 0.8707, "grad_norm": "5.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.271e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.387e-01", "anc_acc": "5.141e-01", "epoch": 0.09538} {"step": 47695, "loss": 0.8819, "grad_norm": "3.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.083e+00", "anc_loss": "1.191e+00", "dlm_acc": "6.022e-01", "anc_acc": "5.738e-01", "epoch": 0.09539} {"step": 47700, "loss": 1.2515, "grad_norm": "8.619e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.062e+00", "anc_loss": "1.191e+00", "dlm_acc": "6.236e-01", "anc_acc": "5.900e-01", "epoch": 0.0954} {"step": 47705, "loss": 1.47, "grad_norm": "8.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.605e+00", "anc_loss": "1.728e+00", "dlm_acc": "5.057e-01", "anc_acc": "4.782e-01", "epoch": 0.09541} {"step": 47710, "loss": 1.1839, "grad_norm": "5.006e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.360e+00", "anc_loss": "1.490e+00", "dlm_acc": "5.885e-01", "anc_acc": "5.601e-01", "epoch": 0.09542} {"step": 47715, "loss": 1.0792, "grad_norm": "4.689e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.216e+00", "anc_loss": "1.345e+00", "dlm_acc": "5.767e-01", "anc_acc": "5.444e-01", "epoch": 0.09543} {"step": 47720, "loss": 1.1388, "grad_norm": "4.321e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.176e+00", "anc_loss": "1.306e+00", "dlm_acc": "5.969e-01", "anc_acc": "5.659e-01", "epoch": 0.09544} {"step": 47725, "loss": 0.9479, "grad_norm": "3.255e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.105e+00", "anc_loss": "1.259e+00", "dlm_acc": "6.044e-01", "anc_acc": "5.667e-01", "epoch": 0.09545} {"step": 47730, "loss": 0.7812, "grad_norm": "2.858e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.441e-01", "anc_loss": "8.582e-01", "dlm_acc": "7.007e-01", "anc_acc": "6.635e-01", "epoch": 0.09546} {"step": 47735, "loss": 0.8729, "grad_norm": "3.196e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.919e-01", "anc_loss": "4.859e-01", "dlm_acc": "8.165e-01", "anc_acc": "7.847e-01", "epoch": 0.09547} {"step": 47740, "loss": 1.0229, "grad_norm": "2.289e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.291e+00", "anc_loss": "1.425e+00", "dlm_acc": "5.404e-01", "anc_acc": "5.068e-01", "epoch": 0.09548} {"step": 47745, "loss": 0.8408, "grad_norm": "3.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.065e+00", "anc_loss": "1.190e+00", "dlm_acc": "5.870e-01", "anc_acc": "5.528e-01", "epoch": 0.09549} {"step": 47750, "loss": 0.8627, "grad_norm": "1.500e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.922e-01", "anc_loss": "1.108e+00", "dlm_acc": "6.161e-01", "anc_acc": "5.812e-01", "epoch": 0.0955} {"step": 47755, "loss": 1.2125, "grad_norm": "3.077e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.347e+00", "anc_loss": "1.491e+00", "dlm_acc": "5.440e-01", "anc_acc": "5.118e-01", "epoch": 0.09551} {"step": 47760, "loss": 1.063, "grad_norm": "1.925e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.138e+00", "dlm_acc": "6.366e-01", "anc_acc": "6.033e-01", "epoch": 0.09552} {"step": 47765, "loss": 1.2303, "grad_norm": "3.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.302e+00", "dlm_acc": "5.739e-01", "anc_acc": "5.439e-01", "epoch": 0.09553} {"step": 47770, "loss": 1.3287, "grad_norm": "2.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.154e+00", "anc_loss": "1.286e+00", "dlm_acc": "5.852e-01", "anc_acc": "5.528e-01", "epoch": 0.09554} {"step": 47775, "loss": 1.1475, "grad_norm": "1.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.124e+00", "dlm_acc": "6.216e-01", "anc_acc": "5.895e-01", "epoch": 0.09555} {"step": 47780, "loss": 0.9753, "grad_norm": "3.962e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.121e+00", "anc_loss": "1.226e+00", "dlm_acc": "5.805e-01", "anc_acc": "5.555e-01", "epoch": 0.09556} {"step": 47785, "loss": 2.1516, "grad_norm": "5.369e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.078e+00", "anc_loss": "2.237e+00", "dlm_acc": "4.474e-01", "anc_acc": "4.149e-01", "epoch": 0.09557} {"step": 47790, "loss": 1.1815, "grad_norm": "5.312e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.277e-01", "anc_loss": "1.029e+00", "dlm_acc": "6.202e-01", "anc_acc": "5.862e-01", "epoch": 0.09558} {"step": 47795, "loss": 1.3073, "grad_norm": "3.161e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.655e+00", "anc_loss": "1.783e+00", "dlm_acc": "4.401e-01", "anc_acc": "4.170e-01", "epoch": 0.09559} {"step": 47800, "loss": 1.3374, "grad_norm": "5.504e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.510e+00", "anc_loss": "1.598e+00", "dlm_acc": "4.530e-01", "anc_acc": "4.304e-01", "epoch": 0.0956} {"step": 47805, "loss": 1.4945, "grad_norm": "3.801e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.391e+00", "anc_loss": "1.542e+00", "dlm_acc": "5.463e-01", "anc_acc": "5.107e-01", "epoch": 0.09561} {"step": 47810, "loss": 1.6511, "grad_norm": "2.022e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.600e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.205e-01", "epoch": 0.09562} {"step": 47815, "loss": 1.2401, "grad_norm": "3.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.149e+00", "anc_loss": "1.331e+00", "dlm_acc": "5.728e-01", "anc_acc": "5.169e-01", "epoch": 0.09563} {"step": 47820, "loss": 1.2056, "grad_norm": "4.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.566e-01", "anc_loss": "7.879e-01", "dlm_acc": "4.829e-01", "anc_acc": "4.713e-01", "epoch": 0.09564} {"step": 47825, "loss": 1.4684, "grad_norm": "6.681e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.168e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.832e-01", "anc_acc": "5.549e-01", "epoch": 0.09565} {"step": 47830, "loss": 1.4097, "grad_norm": "3.206e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.875e-01", "anc_loss": "1.112e+00", "dlm_acc": "6.616e-01", "anc_acc": "6.312e-01", "epoch": 0.09566} {"step": 47835, "loss": 1.0417, "grad_norm": "6.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.387e-01", "anc_loss": "8.652e-01", "dlm_acc": "7.166e-01", "anc_acc": "6.784e-01", "epoch": 0.09567} {"step": 47840, "loss": 0.8734, "grad_norm": "3.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.828e-01", "anc_loss": "5.066e-01", "dlm_acc": "8.392e-01", "anc_acc": "8.018e-01", "epoch": 0.09568} {"step": 47845, "loss": 1.4285, "grad_norm": "3.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.296e+00", "anc_loss": "1.431e+00", "dlm_acc": "5.593e-01", "anc_acc": "5.257e-01", "epoch": 0.09569} {"step": 47850, "loss": 1.0806, "grad_norm": "2.937e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.613e-01", "anc_loss": "9.867e-01", "dlm_acc": "6.108e-01", "anc_acc": "5.667e-01", "epoch": 0.0957} {"step": 47855, "loss": 0.893, "grad_norm": "4.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.910e-01", "anc_loss": "9.199e-01", "dlm_acc": "6.889e-01", "anc_acc": "6.403e-01", "epoch": 0.09571} {"step": 47860, "loss": 1.0206, "grad_norm": "2.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.539e-01", "anc_loss": "9.602e-01", "dlm_acc": "6.316e-01", "anc_acc": "6.005e-01", "epoch": 0.09572} {"step": 47865, "loss": 1.1219, "grad_norm": "2.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.648e-01", "anc_loss": "8.812e-01", "dlm_acc": "7.014e-01", "anc_acc": "6.680e-01", "epoch": 0.09573} {"step": 47870, "loss": 1.431, "grad_norm": "3.081e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.410e+00", "anc_loss": "1.564e+00", "dlm_acc": "5.458e-01", "anc_acc": "5.100e-01", "epoch": 0.09574} {"step": 47875, "loss": 1.1077, "grad_norm": "4.354e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.106e+00", "anc_loss": "1.233e+00", "dlm_acc": "5.837e-01", "anc_acc": "5.487e-01", "epoch": 0.09575} {"step": 47880, "loss": 1.1731, "grad_norm": "3.953e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.181e+00", "anc_loss": "1.316e+00", "dlm_acc": "5.824e-01", "anc_acc": "5.513e-01", "epoch": 0.09576} {"step": 47885, "loss": 1.1847, "grad_norm": "3.172e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.941e-01", "anc_loss": "7.000e-01", "dlm_acc": "7.759e-01", "anc_acc": "7.464e-01", "epoch": 0.09577} {"step": 47890, "loss": 1.0776, "grad_norm": "7.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.863e-01", "anc_loss": "9.008e-01", "dlm_acc": "6.902e-01", "anc_acc": "6.574e-01", "epoch": 0.09578} {"step": 47895, "loss": 1.1935, "grad_norm": "3.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.007e+00", "anc_loss": "1.103e+00", "dlm_acc": "6.085e-01", "anc_acc": "5.813e-01", "epoch": 0.09579} {"step": 47900, "loss": 1.0414, "grad_norm": "2.538e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.672e-01", "anc_loss": "7.949e-01", "dlm_acc": "7.272e-01", "anc_acc": "6.776e-01", "epoch": 0.0958} {"step": 47905, "loss": 1.1955, "grad_norm": "1.932e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.117e-01", "anc_loss": "1.067e+00", "dlm_acc": "6.766e-01", "anc_acc": "6.180e-01", "epoch": 0.09581} {"step": 47910, "loss": 1.3086, "grad_norm": "1.049e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.211e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.751e-01", "anc_acc": "5.431e-01", "epoch": 0.09582} {"step": 47915, "loss": 1.229, "grad_norm": "4.655e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.820e-01", "anc_loss": "1.179e+00", "dlm_acc": "6.335e-01", "anc_acc": "5.746e-01", "epoch": 0.09583} {"step": 47920, "loss": 1.4315, "grad_norm": "5.044e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.974e+00", "anc_loss": "2.039e+00", "dlm_acc": "3.432e-01", "anc_acc": "3.138e-01", "epoch": 0.09584} {"step": 47925, "loss": 1.041, "grad_norm": "2.556e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.158e+00", "dlm_acc": "5.927e-01", "anc_acc": "5.396e-01", "epoch": 0.09585} {"step": 47930, "loss": 1.3278, "grad_norm": "3.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.746e-01", "anc_loss": "1.120e+00", "dlm_acc": "6.147e-01", "anc_acc": "5.607e-01", "epoch": 0.09586} {"step": 47935, "loss": 1.0649, "grad_norm": "5.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.434e-01", "anc_loss": "9.504e-01", "dlm_acc": "6.605e-01", "anc_acc": "6.197e-01", "epoch": 0.09587} {"step": 47940, "loss": 1.5293, "grad_norm": "2.847e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.587e+00", "anc_loss": "1.711e+00", "dlm_acc": "4.827e-01", "anc_acc": "4.492e-01", "epoch": 0.09588} {"step": 47945, "loss": 1.2837, "grad_norm": "3.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.017e+00", "anc_loss": "1.164e+00", "dlm_acc": "6.176e-01", "anc_acc": "5.753e-01", "epoch": 0.09589} {"step": 47950, "loss": 1.1335, "grad_norm": "5.361e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.249e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.655e-01", "anc_acc": "5.230e-01", "epoch": 0.0959} {"step": 47955, "loss": 1.0502, "grad_norm": "2.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.084e+00", "anc_loss": "1.239e+00", "dlm_acc": "6.016e-01", "anc_acc": "5.563e-01", "epoch": 0.09591} {"step": 47960, "loss": 1.1172, "grad_norm": "2.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.750e-01", "anc_loss": "9.539e-01", "dlm_acc": "6.298e-01", "anc_acc": "5.951e-01", "epoch": 0.09592} {"step": 47965, "loss": 0.8532, "grad_norm": "2.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.050e+00", "anc_loss": "1.164e+00", "dlm_acc": "6.285e-01", "anc_acc": "5.972e-01", "epoch": 0.09593} {"step": 47970, "loss": 1.1092, "grad_norm": "4.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.559e+00", "anc_loss": "1.692e+00", "dlm_acc": "5.264e-01", "anc_acc": "4.963e-01", "epoch": 0.09594} {"step": 47975, "loss": 1.067, "grad_norm": "4.316e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.313e-01", "anc_loss": "1.027e+00", "dlm_acc": "5.871e-01", "anc_acc": "5.592e-01", "epoch": 0.09595} {"step": 47980, "loss": 0.6155, "grad_norm": "2.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.574e-01", "anc_loss": "4.996e-01", "dlm_acc": "6.267e-01", "anc_acc": "5.944e-01", "epoch": 0.09596} {"step": 47985, "loss": 0.987, "grad_norm": "2.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.676e-01", "anc_loss": "1.088e+00", "dlm_acc": "6.138e-01", "anc_acc": "5.829e-01", "epoch": 0.09597} {"step": 47990, "loss": 1.2807, "grad_norm": "3.483e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.003e+00", "anc_loss": "1.180e+00", "dlm_acc": "6.561e-01", "anc_acc": "6.001e-01", "epoch": 0.09598} {"step": 47995, "loss": 1.0133, "grad_norm": "2.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.495e-01", "anc_loss": "1.036e+00", "dlm_acc": "6.450e-01", "anc_acc": "6.225e-01", "epoch": 0.09599} {"step": 48000, "loss": 1.1737, "grad_norm": "4.093e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.055e-01", "anc_loss": "7.074e-01", "dlm_acc": "7.354e-01", "anc_acc": "7.025e-01", "epoch": 0.096} {"step": 48005, "loss": 1.2895, "grad_norm": "6.061e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.145e-01", "anc_loss": "1.005e+00", "dlm_acc": "6.296e-01", "anc_acc": "6.051e-01", "epoch": 0.09601} {"step": 48010, "loss": 0.7042, "grad_norm": "2.263e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.366e-01", "anc_loss": "3.703e-01", "dlm_acc": "7.801e-01", "anc_acc": "7.647e-01", "epoch": 0.09602} {"step": 48015, "loss": 0.9493, "grad_norm": "5.290e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.472e-01", "anc_loss": "6.374e-01", "dlm_acc": "7.939e-01", "anc_acc": "7.576e-01", "epoch": 0.09603} {"step": 48020, "loss": 0.6269, "grad_norm": "1.852e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.715e-01", "anc_loss": "6.789e-01", "dlm_acc": "6.858e-01", "anc_acc": "6.354e-01", "epoch": 0.09604} {"step": 48025, "loss": 1.3587, "grad_norm": "4.233e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.158e+00", "anc_loss": "1.279e+00", "dlm_acc": "5.580e-01", "anc_acc": "5.265e-01", "epoch": 0.09605} {"step": 48030, "loss": 1.0883, "grad_norm": "4.062e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.403e+00", "anc_loss": "1.531e+00", "dlm_acc": "5.491e-01", "anc_acc": "5.165e-01", "epoch": 0.09606} {"step": 48035, "loss": 1.7839, "grad_norm": "3.628e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.068e-01", "anc_loss": "7.750e-01", "dlm_acc": "6.365e-01", "anc_acc": "6.150e-01", "epoch": 0.09607} {"step": 48040, "loss": 1.2063, "grad_norm": "3.573e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.230e-01", "anc_loss": "6.734e-01", "dlm_acc": "5.654e-01", "anc_acc": "5.350e-01", "epoch": 0.09608} {"step": 48045, "loss": 1.2311, "grad_norm": "4.045e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.300e-01", "anc_loss": "9.482e-01", "dlm_acc": "6.836e-01", "anc_acc": "6.474e-01", "epoch": 0.09609} {"step": 48050, "loss": 1.1984, "grad_norm": "4.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.436e+00", "anc_loss": "1.518e+00", "dlm_acc": "4.131e-01", "anc_acc": "3.941e-01", "epoch": 0.0961} {"step": 48055, "loss": 0.8056, "grad_norm": "3.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.535e-01", "anc_loss": "2.719e-01", "dlm_acc": "8.654e-01", "anc_acc": "8.578e-01", "epoch": 0.09611} {"step": 48060, "loss": 0.6924, "grad_norm": "2.185e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.982e-01", "anc_loss": "2.137e-01", "dlm_acc": "8.905e-01", "anc_acc": "8.835e-01", "epoch": 0.09612} {"step": 48065, "loss": 0.8902, "grad_norm": "2.981e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.645e-01", "anc_loss": "2.846e-01", "dlm_acc": "8.640e-01", "anc_acc": "8.547e-01", "epoch": 0.09613} {"step": 48070, "loss": 1.0291, "grad_norm": "8.178e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.190e+00", "anc_loss": "1.280e+00", "dlm_acc": "5.419e-01", "anc_acc": "5.170e-01", "epoch": 0.09614} {"step": 48075, "loss": 0.7295, "grad_norm": "3.268e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.293e-01", "anc_loss": "4.551e-01", "dlm_acc": "6.469e-01", "anc_acc": "6.274e-01", "epoch": 0.09615} {"step": 48080, "loss": 1.2688, "grad_norm": "3.434e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.754e-01", "anc_loss": "6.188e-01", "dlm_acc": "6.204e-01", "anc_acc": "5.951e-01", "epoch": 0.09616} {"step": 48085, "loss": 1.0547, "grad_norm": "5.324e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.484e-01", "anc_loss": "4.820e-01", "dlm_acc": "6.483e-01", "anc_acc": "6.246e-01", "epoch": 0.09617} {"step": 48090, "loss": 1.1275, "grad_norm": "2.715e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.234e-01", "anc_loss": "4.500e-01", "dlm_acc": "6.906e-01", "anc_acc": "6.726e-01", "epoch": 0.09618} {"step": 48095, "loss": 1.4067, "grad_norm": "4.987e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.301e-01", "anc_loss": "9.119e-01", "dlm_acc": "6.366e-01", "anc_acc": "6.136e-01", "epoch": 0.09619} {"step": 48100, "loss": 1.3253, "grad_norm": "3.160e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.627e+00", "dlm_acc": "5.172e-01", "anc_acc": "4.878e-01", "epoch": 0.0962} {"step": 48105, "loss": 0.934, "grad_norm": "1.490e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.438e-01", "anc_loss": "6.574e-01", "dlm_acc": "5.915e-01", "anc_acc": "5.837e-01", "epoch": 0.09621} {"step": 48110, "loss": 1.1894, "grad_norm": "4.244e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.430e-01", "anc_loss": "8.016e-01", "dlm_acc": "5.604e-01", "anc_acc": "5.480e-01", "epoch": 0.09622} {"step": 48115, "loss": 1.0307, "grad_norm": "2.255e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.113e-01", "anc_loss": "6.180e-01", "dlm_acc": "5.886e-01", "anc_acc": "5.853e-01", "epoch": 0.09623} {"step": 48120, "loss": 1.1903, "grad_norm": "6.951e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.996e-01", "anc_loss": "6.328e-01", "dlm_acc": "7.077e-01", "anc_acc": "6.983e-01", "epoch": 0.09624} {"step": 48125, "loss": 1.0505, "grad_norm": "2.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.871e-01", "anc_loss": "9.484e-01", "dlm_acc": "5.721e-01", "anc_acc": "5.531e-01", "epoch": 0.09625} {"step": 48130, "loss": 1.0598, "grad_norm": "2.463e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.154e+00", "dlm_acc": "5.841e-01", "anc_acc": "5.549e-01", "epoch": 0.09626} {"step": 48135, "loss": 1.0078, "grad_norm": "2.657e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.748e-01", "anc_loss": "3.459e-01", "dlm_acc": "8.671e-01", "anc_acc": "8.449e-01", "epoch": 0.09627} {"step": 48140, "loss": 1.3127, "grad_norm": "4.583e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.413e+00", "anc_loss": "1.550e+00", "dlm_acc": "5.274e-01", "anc_acc": "4.975e-01", "epoch": 0.09628} {"step": 48145, "loss": 1.1958, "grad_norm": "2.391e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.165e-01", "anc_loss": "1.029e+00", "dlm_acc": "6.978e-01", "anc_acc": "6.712e-01", "epoch": 0.09629} {"step": 48150, "loss": 1.2807, "grad_norm": "1.935e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e+00", "anc_loss": "1.272e+00", "dlm_acc": "5.710e-01", "anc_acc": "5.492e-01", "epoch": 0.0963} {"step": 48155, "loss": 1.2674, "grad_norm": "8.645e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.079e-01", "anc_loss": "8.802e-01", "dlm_acc": "6.381e-01", "anc_acc": "6.196e-01", "epoch": 0.09631} {"step": 48160, "loss": 0.9622, "grad_norm": "2.215e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.937e-01", "anc_loss": "7.586e-01", "dlm_acc": "6.203e-01", "anc_acc": "5.985e-01", "epoch": 0.09632} {"step": 48165, "loss": 1.1308, "grad_norm": "2.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.246e-01", "anc_loss": "4.500e-01", "dlm_acc": "6.805e-01", "anc_acc": "6.625e-01", "epoch": 0.09633} {"step": 48170, "loss": 1.3474, "grad_norm": "4.087e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.301e-01", "anc_loss": "4.953e-01", "dlm_acc": "8.135e-01", "anc_acc": "7.913e-01", "epoch": 0.09634} {"step": 48175, "loss": 1.2125, "grad_norm": "3.899e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.354e-01", "anc_loss": "8.016e-01", "dlm_acc": "6.219e-01", "anc_acc": "6.059e-01", "epoch": 0.09635} {"step": 48180, "loss": 1.2653, "grad_norm": "5.136e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.570e-01", "anc_loss": "1.014e+00", "dlm_acc": "4.591e-01", "anc_acc": "4.409e-01", "epoch": 0.09636} {"step": 48185, "loss": 0.9335, "grad_norm": "6.718e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.016e-02", "anc_loss": "5.136e-02", "dlm_acc": "9.822e-01", "anc_acc": "9.719e-01", "epoch": 0.09637} {"step": 48190, "loss": 1.4202, "grad_norm": "7.963e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.427e-01", "anc_loss": "6.381e-01", "dlm_acc": "7.695e-01", "anc_acc": "7.280e-01", "epoch": 0.09638} {"step": 48195, "loss": 1.1459, "grad_norm": "2.515e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.824e-01", "anc_loss": "6.580e-01", "dlm_acc": "7.161e-01", "anc_acc": "6.920e-01", "epoch": 0.09639} {"step": 48200, "loss": 1.1839, "grad_norm": "2.357e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.773e-01", "anc_loss": "1.086e+00", "dlm_acc": "6.825e-01", "anc_acc": "6.558e-01", "epoch": 0.0964} {"step": 48205, "loss": 1.2283, "grad_norm": "4.031e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.488e+00", "anc_loss": "1.583e+00", "dlm_acc": "4.987e-01", "anc_acc": "4.766e-01", "epoch": 0.09641} {"step": 48210, "loss": 1.1028, "grad_norm": "3.086e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.155e+00", "anc_loss": "1.266e+00", "dlm_acc": "6.297e-01", "anc_acc": "6.039e-01", "epoch": 0.09642} {"step": 48215, "loss": 1.0923, "grad_norm": "2.409e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.708e-01", "anc_loss": "6.514e-01", "dlm_acc": "7.883e-01", "anc_acc": "7.632e-01", "epoch": 0.09643} {"step": 48220, "loss": 1.3314, "grad_norm": "8.495e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.059e+00", "anc_loss": "1.190e+00", "dlm_acc": "6.315e-01", "anc_acc": "6.003e-01", "epoch": 0.09644} {"step": 48225, "loss": 1.4491, "grad_norm": "3.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.648e-01", "anc_loss": "1.094e+00", "dlm_acc": "6.406e-01", "anc_acc": "6.060e-01", "epoch": 0.09645} {"step": 48230, "loss": 1.5831, "grad_norm": "2.780e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.263e+00", "dlm_acc": "6.252e-01", "anc_acc": "5.987e-01", "epoch": 0.09646} {"step": 48235, "loss": 1.2903, "grad_norm": "2.612e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.687e-01", "anc_loss": "5.093e-01", "dlm_acc": "7.347e-01", "anc_acc": "7.121e-01", "epoch": 0.09647} {"step": 48240, "loss": 1.3805, "grad_norm": "2.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.945e-01", "anc_loss": "1.075e+00", "dlm_acc": "6.674e-01", "anc_acc": "6.448e-01", "epoch": 0.09648} {"step": 48245, "loss": 0.9555, "grad_norm": "3.084e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.840e-01", "anc_loss": "6.738e-01", "dlm_acc": "7.725e-01", "anc_acc": "7.470e-01", "epoch": 0.09649} {"step": 48250, "loss": 1.1914, "grad_norm": "2.443e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.640e-01", "anc_loss": "4.214e-01", "dlm_acc": "8.617e-01", "anc_acc": "8.402e-01", "epoch": 0.0965} {"step": 48255, "loss": 1.2233, "grad_norm": "3.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.824e-01", "anc_loss": "7.979e-01", "dlm_acc": "7.432e-01", "anc_acc": "7.087e-01", "epoch": 0.09651} {"step": 48260, "loss": 1.0375, "grad_norm": "1.195e+00", "learning_rate": "1.000e-04", "dlm_loss": "6.215e-01", "anc_loss": "6.875e-01", "dlm_acc": "7.188e-01", "anc_acc": "6.944e-01", "epoch": 0.09652} {"step": 48265, "loss": 1.2103, "grad_norm": "1.062e+00", "learning_rate": "1.000e-04", "dlm_loss": "5.474e-01", "anc_loss": "6.252e-01", "dlm_acc": "8.038e-01", "anc_acc": "7.722e-01", "epoch": 0.09653} {"step": 48270, "loss": 0.9811, "grad_norm": "3.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.547e-01", "anc_loss": "4.953e-01", "dlm_acc": "7.427e-01", "anc_acc": "7.239e-01", "epoch": 0.09654} {"step": 48275, "loss": 0.8488, "grad_norm": "3.425e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.798e-01", "anc_loss": "6.426e-01", "dlm_acc": "7.754e-01", "anc_acc": "7.537e-01", "epoch": 0.09655} {"step": 48280, "loss": 0.8785, "grad_norm": "2.090e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.608e-01", "anc_loss": "4.112e-01", "dlm_acc": "8.722e-01", "anc_acc": "8.581e-01", "epoch": 0.09656} {"step": 48285, "loss": 1.1836, "grad_norm": "2.967e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.441e-01", "anc_loss": "1.089e+00", "dlm_acc": "6.444e-01", "anc_acc": "6.019e-01", "epoch": 0.09657} {"step": 48290, "loss": 1.1575, "grad_norm": "3.270e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.893e-01", "anc_loss": "4.451e-01", "dlm_acc": "8.430e-01", "anc_acc": "8.189e-01", "epoch": 0.09658} {"step": 48295, "loss": 1.3173, "grad_norm": "4.811e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.906e-01", "anc_loss": "1.014e+00", "dlm_acc": "6.328e-01", "anc_acc": "5.902e-01", "epoch": 0.09659} {"step": 48300, "loss": 1.3344, "grad_norm": "6.382e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.630e-01", "anc_loss": "1.037e+00", "dlm_acc": "6.977e-01", "anc_acc": "6.812e-01", "epoch": 0.0966} {"step": 48305, "loss": 1.1857, "grad_norm": "3.927e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.805e-01", "anc_loss": "8.250e-01", "dlm_acc": "6.256e-01", "anc_acc": "6.148e-01", "epoch": 0.09661} {"step": 48310, "loss": 1.1668, "grad_norm": "3.641e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.336e-01", "anc_loss": "8.867e-01", "dlm_acc": "6.496e-01", "anc_acc": "6.340e-01", "epoch": 0.09662} {"step": 48315, "loss": 1.5525, "grad_norm": "3.738e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.293e+00", "anc_loss": "1.407e+00", "dlm_acc": "5.187e-01", "anc_acc": "4.968e-01", "epoch": 0.09663} {"step": 48320, "loss": 1.7965, "grad_norm": "7.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.267e+00", "anc_loss": "1.402e+00", "dlm_acc": "5.947e-01", "anc_acc": "5.677e-01", "epoch": 0.09664} {"step": 48325, "loss": 1.0428, "grad_norm": "4.157e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.719e-01", "anc_loss": "7.656e-01", "dlm_acc": "7.511e-01", "anc_acc": "7.286e-01", "epoch": 0.09665} {"step": 48330, "loss": 1.0239, "grad_norm": "3.118e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.261e-01", "anc_loss": "4.896e-01", "dlm_acc": "8.140e-01", "anc_acc": "7.924e-01", "epoch": 0.09666} {"step": 48335, "loss": 1.2002, "grad_norm": "2.736e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.241e+00", "anc_loss": "1.387e+00", "dlm_acc": "6.221e-01", "anc_acc": "5.931e-01", "epoch": 0.09667} {"step": 48340, "loss": 1.0215, "grad_norm": "4.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.094e-01", "anc_loss": "6.925e-01", "dlm_acc": "7.490e-01", "anc_acc": "7.249e-01", "epoch": 0.09668} {"step": 48345, "loss": 0.9072, "grad_norm": "2.936e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.467e-01", "anc_loss": "6.203e-01", "dlm_acc": "7.139e-01", "anc_acc": "6.797e-01", "epoch": 0.09669} {"step": 48350, "loss": 1.1286, "grad_norm": "2.499e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.539e-01", "anc_loss": "1.063e+00", "dlm_acc": "6.283e-01", "anc_acc": "6.005e-01", "epoch": 0.0967} {"step": 48355, "loss": 0.9376, "grad_norm": "1.159e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.678e-01", "anc_loss": "8.359e-01", "dlm_acc": "6.666e-01", "anc_acc": "6.468e-01", "epoch": 0.09671} {"step": 48360, "loss": 1.1297, "grad_norm": "2.475e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.705e-01", "anc_loss": "5.239e-01", "dlm_acc": "7.634e-01", "anc_acc": "7.462e-01", "epoch": 0.09672} {"step": 48365, "loss": 1.0066, "grad_norm": "4.020e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.844e-01", "anc_loss": "1.009e+00", "dlm_acc": "6.744e-01", "anc_acc": "6.429e-01", "epoch": 0.09673} {"step": 48370, "loss": 1.2688, "grad_norm": "5.266e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.633e-01", "anc_loss": "8.293e-01", "dlm_acc": "7.784e-01", "anc_acc": "7.439e-01", "epoch": 0.09674} {"step": 48375, "loss": 1.0592, "grad_norm": "4.281e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.693e-01", "anc_loss": "1.045e+00", "dlm_acc": "5.665e-01", "anc_acc": "5.441e-01", "epoch": 0.09675} {"step": 48380, "loss": 0.7846, "grad_norm": "3.021e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.483e-01", "anc_loss": "7.436e-01", "dlm_acc": "7.096e-01", "anc_acc": "6.760e-01", "epoch": 0.09676} {"step": 48385, "loss": 1.1884, "grad_norm": "4.060e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.495e+00", "anc_loss": "1.603e+00", "dlm_acc": "5.273e-01", "anc_acc": "5.032e-01", "epoch": 0.09677} {"step": 48390, "loss": 1.4517, "grad_norm": "5.105e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.762e+00", "anc_loss": "1.878e+00", "dlm_acc": "4.448e-01", "anc_acc": "4.179e-01", "epoch": 0.09678} {"step": 48395, "loss": 1.2293, "grad_norm": "2.512e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.102e+00", "anc_loss": "1.217e+00", "dlm_acc": "5.949e-01", "anc_acc": "5.663e-01", "epoch": 0.09679} {"step": 48400, "loss": 1.3099, "grad_norm": "4.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.381e+00", "dlm_acc": "5.939e-01", "anc_acc": "5.651e-01", "epoch": 0.0968} {"step": 48405, "loss": 1.0722, "grad_norm": "3.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.008e+00", "anc_loss": "1.109e+00", "dlm_acc": "5.516e-01", "anc_acc": "5.217e-01", "epoch": 0.09681} {"step": 48410, "loss": 1.6149, "grad_norm": "4.888e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.579e+00", "anc_loss": "1.688e+00", "dlm_acc": "5.398e-01", "anc_acc": "5.152e-01", "epoch": 0.09682} {"step": 48415, "loss": 1.2353, "grad_norm": "2.403e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.412e+00", "anc_loss": "1.538e+00", "dlm_acc": "5.384e-01", "anc_acc": "5.082e-01", "epoch": 0.09683} {"step": 48420, "loss": 0.9913, "grad_norm": "6.793e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.414e+00", "anc_loss": "1.536e+00", "dlm_acc": "4.802e-01", "anc_acc": "4.510e-01", "epoch": 0.09684} {"step": 48425, "loss": 0.8761, "grad_norm": "5.018e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.584e+00", "anc_loss": "1.716e+00", "dlm_acc": "4.916e-01", "anc_acc": "4.660e-01", "epoch": 0.09685} {"step": 48430, "loss": 1.2006, "grad_norm": "3.722e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.578e-01", "anc_loss": "1.075e+00", "dlm_acc": "6.351e-01", "anc_acc": "5.977e-01", "epoch": 0.09686} {"step": 48435, "loss": 1.2865, "grad_norm": "2.918e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.394e+00", "anc_loss": "1.523e+00", "dlm_acc": "5.347e-01", "anc_acc": "5.033e-01", "epoch": 0.09687} {"step": 48440, "loss": 1.1932, "grad_norm": "3.201e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.647e+00", "anc_loss": "1.775e+00", "dlm_acc": "5.099e-01", "anc_acc": "4.813e-01", "epoch": 0.09688} {"step": 48445, "loss": 1.3289, "grad_norm": "3.606e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.683e+00", "anc_loss": "1.803e+00", "dlm_acc": "4.827e-01", "anc_acc": "4.585e-01", "epoch": 0.09689} {"step": 48450, "loss": 1.4039, "grad_norm": "6.210e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.670e+00", "dlm_acc": "4.504e-01", "anc_acc": "4.236e-01", "epoch": 0.0969} {"step": 48455, "loss": 1.0036, "grad_norm": "3.821e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.462e+00", "dlm_acc": "5.587e-01", "anc_acc": "5.254e-01", "epoch": 0.09691} {"step": 48460, "loss": 0.9832, "grad_norm": "3.440e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.285e+00", "dlm_acc": "5.754e-01", "anc_acc": "5.398e-01", "epoch": 0.09692} {"step": 48465, "loss": 1.042, "grad_norm": "1.390e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.510e+00", "dlm_acc": "5.564e-01", "anc_acc": "5.255e-01", "epoch": 0.09693} {"step": 48470, "loss": 1.5696, "grad_norm": "2.243e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.692e+00", "dlm_acc": "5.432e-01", "anc_acc": "5.076e-01", "epoch": 0.09694} {"step": 48475, "loss": 0.728, "grad_norm": "9.244e-02", "learning_rate": "1.000e-04", "dlm_loss": "9.996e-01", "anc_loss": "1.117e+00", "dlm_acc": "6.032e-01", "anc_acc": "5.707e-01", "epoch": 0.09695} {"step": 48480, "loss": 1.3103, "grad_norm": "2.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.328e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.543e-01", "anc_acc": "5.205e-01", "epoch": 0.09696} {"step": 48485, "loss": 0.9957, "grad_norm": "3.286e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.645e-01", "anc_loss": "1.095e+00", "dlm_acc": "6.451e-01", "anc_acc": "6.097e-01", "epoch": 0.09697} {"step": 48490, "loss": 1.4422, "grad_norm": "2.627e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.586e+00", "anc_loss": "1.713e+00", "dlm_acc": "5.484e-01", "anc_acc": "5.213e-01", "epoch": 0.09698} {"step": 48495, "loss": 0.9788, "grad_norm": "3.747e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.426e+00", "dlm_acc": "5.520e-01", "anc_acc": "5.212e-01", "epoch": 0.09699} {"step": 48500, "loss": 1.3324, "grad_norm": "2.373e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.430e+00", "anc_loss": "1.570e+00", "dlm_acc": "5.643e-01", "anc_acc": "5.328e-01", "epoch": 0.097} {"step": 48505, "loss": 0.7977, "grad_norm": "5.030e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.152e-01", "anc_loss": "9.305e-01", "dlm_acc": "6.640e-01", "anc_acc": "6.335e-01", "epoch": 0.09701} {"step": 48510, "loss": 0.9159, "grad_norm": "1.853e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.523e-01", "anc_loss": "1.070e+00", "dlm_acc": "6.107e-01", "anc_acc": "5.752e-01", "epoch": 0.09702} {"step": 48515, "loss": 1.499, "grad_norm": "3.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.617e+00", "anc_loss": "1.773e+00", "dlm_acc": "5.336e-01", "anc_acc": "5.006e-01", "epoch": 0.09703} {"step": 48520, "loss": 1.5863, "grad_norm": "4.401e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.675e+00", "anc_loss": "1.794e+00", "dlm_acc": "4.806e-01", "anc_acc": "4.534e-01", "epoch": 0.09704} {"step": 48525, "loss": 1.4283, "grad_norm": "4.378e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.476e+00", "anc_loss": "1.618e+00", "dlm_acc": "5.718e-01", "anc_acc": "5.398e-01", "epoch": 0.09705} {"step": 48530, "loss": 1.7105, "grad_norm": "3.995e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.653e+00", "anc_loss": "1.816e+00", "dlm_acc": "4.381e-01", "anc_acc": "3.971e-01", "epoch": 0.09706} {"step": 48535, "loss": 1.2447, "grad_norm": "3.724e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.485e+00", "dlm_acc": "5.329e-01", "anc_acc": "4.801e-01", "epoch": 0.09707} {"step": 48540, "loss": 1.0948, "grad_norm": "2.621e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.166e+00", "dlm_acc": "6.135e-01", "anc_acc": "5.823e-01", "epoch": 0.09708} {"step": 48545, "loss": 1.3382, "grad_norm": "3.657e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.169e-01", "anc_loss": "8.123e-01", "dlm_acc": "7.415e-01", "anc_acc": "7.198e-01", "epoch": 0.09709} {"step": 48550, "loss": 1.1898, "grad_norm": "2.928e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.173e+00", "anc_loss": "1.361e+00", "dlm_acc": "5.694e-01", "anc_acc": "5.136e-01", "epoch": 0.0971} {"step": 48555, "loss": 1.4449, "grad_norm": "3.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.734e+00", "anc_loss": "1.849e+00", "dlm_acc": "4.177e-01", "anc_acc": "3.907e-01", "epoch": 0.09711} {"step": 48560, "loss": 1.0112, "grad_norm": "3.063e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.555e-01", "anc_loss": "9.504e-01", "dlm_acc": "6.087e-01", "anc_acc": "5.792e-01", "epoch": 0.09712} {"step": 48565, "loss": 1.2729, "grad_norm": "4.974e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.096e+00", "anc_loss": "1.229e+00", "dlm_acc": "6.067e-01", "anc_acc": "5.713e-01", "epoch": 0.09713} {"step": 48570, "loss": 0.8918, "grad_norm": "2.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.684e-01", "anc_loss": "1.064e+00", "dlm_acc": "6.130e-01", "anc_acc": "5.855e-01", "epoch": 0.09714} {"step": 48575, "loss": 0.9057, "grad_norm": "2.885e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.848e-01", "anc_loss": "6.633e-01", "dlm_acc": "7.483e-01", "anc_acc": "7.266e-01", "epoch": 0.09715} {"step": 48580, "loss": 1.3839, "grad_norm": "3.283e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.432e+00", "anc_loss": "1.520e+00", "dlm_acc": "4.935e-01", "anc_acc": "4.676e-01", "epoch": 0.09716} {"step": 48585, "loss": 1.4431, "grad_norm": "7.783e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.095e+00", "anc_loss": "2.164e+00", "dlm_acc": "2.505e-01", "anc_acc": "2.321e-01", "epoch": 0.09717} {"step": 48590, "loss": 1.1555, "grad_norm": "1.242e+00", "learning_rate": "1.000e-04", "dlm_loss": "8.295e-01", "anc_loss": "9.071e-01", "dlm_acc": "6.726e-01", "anc_acc": "6.534e-01", "epoch": 0.09718} {"step": 48595, "loss": 1.0543, "grad_norm": "2.674e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.306e+00", "dlm_acc": "5.951e-01", "anc_acc": "5.552e-01", "epoch": 0.09719} {"step": 48600, "loss": 1.4011, "grad_norm": "9.439e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.380e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.405e-01", "epoch": 0.0972} {"step": 48605, "loss": 1.2441, "grad_norm": "2.298e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.244e+00", "anc_loss": "1.430e+00", "dlm_acc": "5.844e-01", "anc_acc": "5.332e-01", "epoch": 0.09721} {"step": 48610, "loss": 1.1452, "grad_norm": "2.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.304e+00", "dlm_acc": "5.781e-01", "anc_acc": "5.364e-01", "epoch": 0.09722} {"step": 48615, "loss": 1.2451, "grad_norm": "4.539e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.727e-01", "anc_loss": "9.383e-01", "dlm_acc": "6.978e-01", "anc_acc": "6.482e-01", "epoch": 0.09723} {"step": 48620, "loss": 1.3047, "grad_norm": "4.493e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.048e+00", "anc_loss": "1.208e+00", "dlm_acc": "5.701e-01", "anc_acc": "5.229e-01", "epoch": 0.09724} {"step": 48625, "loss": 1.4465, "grad_norm": "5.755e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.308e+00", "anc_loss": "2.331e+00", "dlm_acc": "1.003e-01", "anc_acc": "9.193e-02", "epoch": 0.09725} {"step": 48630, "loss": 0.825, "grad_norm": "3.540e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.273e-01", "anc_loss": "7.742e-01", "dlm_acc": "3.820e-01", "anc_acc": "3.361e-01", "epoch": 0.09726} {"step": 48635, "loss": 1.4381, "grad_norm": "2.899e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.103e+00", "anc_loss": "1.194e+00", "dlm_acc": "5.243e-01", "anc_acc": "4.960e-01", "epoch": 0.09727} {"step": 48640, "loss": 1.7545, "grad_norm": "4.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.528e+00", "dlm_acc": "5.309e-01", "anc_acc": "4.746e-01", "epoch": 0.09728} {"step": 48645, "loss": 1.1652, "grad_norm": "4.024e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.633e-01", "anc_loss": "9.609e-01", "dlm_acc": "5.419e-01", "anc_acc": "5.004e-01", "epoch": 0.09729} {"step": 48650, "loss": 1.1531, "grad_norm": "3.542e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.274e+00", "anc_loss": "1.435e+00", "dlm_acc": "5.261e-01", "anc_acc": "4.800e-01", "epoch": 0.0973} {"step": 48655, "loss": 1.1735, "grad_norm": "6.472e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.258e-01", "anc_loss": "9.789e-01", "dlm_acc": "6.606e-01", "anc_acc": "6.091e-01", "epoch": 0.09731} {"step": 48660, "loss": 1.3011, "grad_norm": "4.824e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.080e+00", "anc_loss": "1.221e+00", "dlm_acc": "5.763e-01", "anc_acc": "5.288e-01", "epoch": 0.09732} {"step": 48665, "loss": 1.0194, "grad_norm": "4.919e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.516e-01", "anc_loss": "1.001e+00", "dlm_acc": "6.770e-01", "anc_acc": "6.308e-01", "epoch": 0.09733} {"step": 48670, "loss": 0.8252, "grad_norm": "1.421e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.576e-01", "anc_loss": "2.221e-01", "dlm_acc": "9.014e-01", "anc_acc": "8.770e-01", "epoch": 0.09734} {"step": 48675, "loss": 0.9433, "grad_norm": "3.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.055e-01", "anc_loss": "2.717e-01", "dlm_acc": "8.912e-01", "anc_acc": "8.634e-01", "epoch": 0.09735} {"step": 48680, "loss": 1.2585, "grad_norm": "3.025e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.391e-01", "anc_loss": "1.106e+00", "dlm_acc": "6.364e-01", "anc_acc": "5.809e-01", "epoch": 0.09736} {"step": 48685, "loss": 1.1134, "grad_norm": "1.926e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.871e-01", "anc_loss": "9.297e-01", "dlm_acc": "6.769e-01", "anc_acc": "6.227e-01", "epoch": 0.09737} {"step": 48690, "loss": 0.9917, "grad_norm": "2.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.578e-01", "anc_loss": "8.641e-01", "dlm_acc": "6.599e-01", "anc_acc": "6.246e-01", "epoch": 0.09738} {"step": 48695, "loss": 1.276, "grad_norm": "2.465e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.330e+00", "anc_loss": "1.457e+00", "dlm_acc": "5.257e-01", "anc_acc": "4.932e-01", "epoch": 0.09739} {"step": 48700, "loss": 1.1579, "grad_norm": "2.850e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.516e+00", "anc_loss": "1.609e+00", "dlm_acc": "4.163e-01", "anc_acc": "3.916e-01", "epoch": 0.0974} {"step": 48705, "loss": 0.9646, "grad_norm": "3.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.809e-01", "anc_loss": "8.719e-01", "dlm_acc": "6.834e-01", "anc_acc": "6.499e-01", "epoch": 0.09741} {"step": 48710, "loss": 1.7579, "grad_norm": "6.012e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.923e+00", "anc_loss": "2.019e+00", "dlm_acc": "3.459e-01", "anc_acc": "3.281e-01", "epoch": 0.09742} {"step": 48715, "loss": 1.3779, "grad_norm": "3.846e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.247e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.530e-01", "anc_acc": "5.165e-01", "epoch": 0.09743} {"step": 48720, "loss": 1.208, "grad_norm": "4.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.133e+00", "anc_loss": "1.308e+00", "dlm_acc": "6.374e-01", "anc_acc": "5.973e-01", "epoch": 0.09744} {"step": 48725, "loss": 1.046, "grad_norm": "4.184e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.057e+00", "anc_loss": "1.155e+00", "dlm_acc": "5.776e-01", "anc_acc": "5.481e-01", "epoch": 0.09745} {"step": 48730, "loss": 1.088, "grad_norm": "2.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.038e+00", "anc_loss": "1.193e+00", "dlm_acc": "6.034e-01", "anc_acc": "5.576e-01", "epoch": 0.09746} {"step": 48735, "loss": 1.027, "grad_norm": "4.348e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.006e+00", "anc_loss": "1.153e+00", "dlm_acc": "6.271e-01", "anc_acc": "5.877e-01", "epoch": 0.09747} {"step": 48740, "loss": 1.426, "grad_norm": "3.255e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.014e+00", "anc_loss": "1.132e+00", "dlm_acc": "6.463e-01", "anc_acc": "6.150e-01", "epoch": 0.09748} {"step": 48745, "loss": 0.8761, "grad_norm": "2.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.166e-01", "anc_loss": "7.013e-01", "dlm_acc": "7.443e-01", "anc_acc": "7.181e-01", "epoch": 0.09749} {"step": 48750, "loss": 1.0771, "grad_norm": "1.574e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.500e-01", "anc_loss": "1.081e+00", "dlm_acc": "6.595e-01", "anc_acc": "6.254e-01", "epoch": 0.0975} {"step": 48755, "loss": 0.8779, "grad_norm": "8.209e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.613e-01", "anc_loss": "7.340e-01", "dlm_acc": "6.836e-01", "anc_acc": "6.632e-01", "epoch": 0.09751} {"step": 48760, "loss": 0.9795, "grad_norm": "3.880e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.768e-01", "anc_loss": "4.945e-01", "dlm_acc": "7.096e-01", "anc_acc": "7.032e-01", "epoch": 0.09752} {"step": 48765, "loss": 1.0056, "grad_norm": "2.188e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.543e-01", "anc_loss": "4.691e-01", "dlm_acc": "6.613e-01", "anc_acc": "6.555e-01", "epoch": 0.09753} {"step": 48770, "loss": 1.0698, "grad_norm": "2.613e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.447e-01", "anc_loss": "3.605e-01", "dlm_acc": "7.763e-01", "anc_acc": "7.697e-01", "epoch": 0.09754} {"step": 48775, "loss": 1.2077, "grad_norm": "3.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.461e-01", "anc_loss": "1.018e+00", "dlm_acc": "6.244e-01", "anc_acc": "6.087e-01", "epoch": 0.09755} {"step": 48780, "loss": 1.15, "grad_norm": "2.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.144e+00", "anc_loss": "1.233e+00", "dlm_acc": "5.755e-01", "anc_acc": "5.516e-01", "epoch": 0.09756} {"step": 48785, "loss": 0.8299, "grad_norm": "1.410e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.934e-01", "anc_loss": "6.594e-01", "dlm_acc": "7.679e-01", "anc_acc": "7.471e-01", "epoch": 0.09757} {"step": 48790, "loss": 0.965, "grad_norm": "3.445e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.274e-01", "anc_loss": "5.674e-01", "dlm_acc": "7.766e-01", "anc_acc": "7.628e-01", "epoch": 0.09758} {"step": 48795, "loss": 1.003, "grad_norm": "3.129e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.685e-01", "anc_loss": "5.358e-01", "dlm_acc": "7.986e-01", "anc_acc": "7.800e-01", "epoch": 0.09759} {"step": 48800, "loss": 1.239, "grad_norm": "2.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.781e-01", "anc_loss": "7.430e-01", "dlm_acc": "6.459e-01", "anc_acc": "6.259e-01", "epoch": 0.0976} {"step": 48805, "loss": 1.2312, "grad_norm": "1.128e+00", "learning_rate": "1.000e-04", "dlm_loss": "4.710e-01", "anc_loss": "4.886e-01", "dlm_acc": "7.475e-01", "anc_acc": "7.498e-01", "epoch": 0.09761} {"step": 48810, "loss": 1.0448, "grad_norm": "2.771e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.711e-01", "anc_loss": "7.305e-01", "dlm_acc": "6.349e-01", "anc_acc": "6.205e-01", "epoch": 0.09762} {"step": 48815, "loss": 0.9791, "grad_norm": "3.238e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.746e-01", "anc_loss": "1.086e+00", "dlm_acc": "6.060e-01", "anc_acc": "5.738e-01", "epoch": 0.09763} {"step": 48820, "loss": 1.229, "grad_norm": "5.892e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.117e-01", "anc_loss": "9.828e-01", "dlm_acc": "6.530e-01", "anc_acc": "6.379e-01", "epoch": 0.09764} {"step": 48825, "loss": 0.9789, "grad_norm": "2.280e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.281e-01", "anc_loss": "8.621e-01", "dlm_acc": "5.853e-01", "anc_acc": "5.791e-01", "epoch": 0.09765} {"step": 48830, "loss": 1.0004, "grad_norm": "2.026e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.754e-01", "anc_loss": "4.865e-01", "dlm_acc": "6.875e-01", "anc_acc": "6.842e-01", "epoch": 0.09766} {"step": 48835, "loss": 1.0852, "grad_norm": "2.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.033e+00", "anc_loss": "1.168e+00", "dlm_acc": "6.503e-01", "anc_acc": "6.162e-01", "epoch": 0.09767} {"step": 48840, "loss": 1.4489, "grad_norm": "6.197e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.239e-01", "anc_loss": "6.743e-01", "dlm_acc": "7.613e-01", "anc_acc": "7.384e-01", "epoch": 0.09768} {"step": 48845, "loss": 1.4932, "grad_norm": "3.287e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.507e+00", "anc_loss": "1.633e+00", "dlm_acc": "5.171e-01", "anc_acc": "4.879e-01", "epoch": 0.09769} {"step": 48850, "loss": 1.1208, "grad_norm": "7.016e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.430e-01", "anc_loss": "8.180e-01", "dlm_acc": "6.900e-01", "anc_acc": "6.661e-01", "epoch": 0.0977} {"step": 48855, "loss": 0.918, "grad_norm": "5.262e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.354e-01", "anc_loss": "3.728e-01", "dlm_acc": "8.745e-01", "anc_acc": "8.574e-01", "epoch": 0.09771} {"step": 48860, "loss": 1.1525, "grad_norm": "2.524e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.046e+00", "anc_loss": "1.104e+00", "dlm_acc": "3.654e-01", "anc_acc": "3.490e-01", "epoch": 0.09772} {"step": 48865, "loss": 0.8935, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.807e-01", "anc_loss": "5.341e-01", "dlm_acc": "7.725e-01", "anc_acc": "7.577e-01", "epoch": 0.09773} {"step": 48870, "loss": 1.2434, "grad_norm": "2.745e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.341e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.260e-01", "anc_acc": "5.029e-01", "epoch": 0.09774} {"step": 48875, "loss": 0.7546, "grad_norm": "2.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.483e-01", "anc_loss": "6.168e-01", "dlm_acc": "7.547e-01", "anc_acc": "7.312e-01", "epoch": 0.09775} {"step": 48880, "loss": 0.8031, "grad_norm": "2.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.021e-01", "anc_loss": "5.656e-01", "dlm_acc": "6.879e-01", "anc_acc": "6.526e-01", "epoch": 0.09776} {"step": 48885, "loss": 1.0147, "grad_norm": "3.711e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.816e-01", "anc_loss": "5.414e-01", "dlm_acc": "6.428e-01", "anc_acc": "6.055e-01", "epoch": 0.09777} {"step": 48890, "loss": 1.0408, "grad_norm": "1.734e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.047e-01", "anc_loss": "4.648e-01", "dlm_acc": "6.853e-01", "anc_acc": "6.464e-01", "epoch": 0.09778} {"step": 48895, "loss": 0.9157, "grad_norm": "2.839e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.039e-01", "anc_loss": "7.656e-01", "dlm_acc": "6.706e-01", "anc_acc": "6.525e-01", "epoch": 0.09779} {"step": 48900, "loss": 0.9905, "grad_norm": "3.208e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.477e-01", "anc_loss": "3.684e-01", "dlm_acc": "7.736e-01", "anc_acc": "7.645e-01", "epoch": 0.0978} {"step": 48905, "loss": 1.027, "grad_norm": "2.181e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.690e-01", "anc_loss": "5.095e-01", "dlm_acc": "8.115e-01", "anc_acc": "7.973e-01", "epoch": 0.09781} {"step": 48910, "loss": 1.4957, "grad_norm": "7.177e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.606e-01", "anc_loss": "9.293e-01", "dlm_acc": "7.323e-01", "anc_acc": "7.081e-01", "epoch": 0.09782} {"step": 48915, "loss": 1.2095, "grad_norm": "6.559e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.634e-01", "anc_loss": "6.098e-01", "dlm_acc": "7.358e-01", "anc_acc": "7.225e-01", "epoch": 0.09783} {"step": 48920, "loss": 1.229, "grad_norm": "4.055e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.327e-01", "anc_loss": "3.773e-01", "dlm_acc": "8.556e-01", "anc_acc": "8.434e-01", "epoch": 0.09784} {"step": 48925, "loss": 1.5132, "grad_norm": "3.315e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.337e-01", "anc_loss": "5.899e-01", "dlm_acc": "7.745e-01", "anc_acc": "7.569e-01", "epoch": 0.09785} {"step": 48930, "loss": 1.0599, "grad_norm": "4.222e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.043e-01", "anc_loss": "4.396e-01", "dlm_acc": "7.837e-01", "anc_acc": "7.670e-01", "epoch": 0.09786} {"step": 48935, "loss": 1.1836, "grad_norm": "4.693e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.176e-01", "anc_loss": "1.031e+00", "dlm_acc": "6.716e-01", "anc_acc": "6.396e-01", "epoch": 0.09787} {"step": 48940, "loss": 2.0732, "grad_norm": "1.180e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.900e+00", "anc_loss": "2.014e+00", "dlm_acc": "3.441e-01", "anc_acc": "3.178e-01", "epoch": 0.09788} {"step": 48945, "loss": 1.0144, "grad_norm": "4.550e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.482e+00", "anc_loss": "1.578e+00", "dlm_acc": "3.990e-01", "anc_acc": "3.738e-01", "epoch": 0.09789} {"step": 48950, "loss": 0.9801, "grad_norm": "3.336e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.738e-01", "anc_loss": "7.563e-01", "dlm_acc": "7.635e-01", "anc_acc": "7.379e-01", "epoch": 0.0979} {"step": 48955, "loss": 1.0556, "grad_norm": "2.695e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.851e-01", "anc_loss": "8.553e-01", "dlm_acc": "6.999e-01", "anc_acc": "6.791e-01", "epoch": 0.09791} {"step": 48960, "loss": 0.8165, "grad_norm": "3.147e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.513e-01", "anc_loss": "4.933e-01", "dlm_acc": "7.522e-01", "anc_acc": "7.369e-01", "epoch": 0.09792} {"step": 48965, "loss": 1.0017, "grad_norm": "2.426e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.490e-01", "anc_loss": "7.514e-01", "dlm_acc": "7.713e-01", "anc_acc": "7.444e-01", "epoch": 0.09793} {"step": 48970, "loss": 1.066, "grad_norm": "3.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.510e-01", "anc_loss": "5.553e-01", "dlm_acc": "6.602e-01", "anc_acc": "6.533e-01", "epoch": 0.09794} {"step": 48975, "loss": 1.1513, "grad_norm": "3.346e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.125e-01", "anc_loss": "7.531e-01", "dlm_acc": "5.916e-01", "anc_acc": "5.760e-01", "epoch": 0.09795} {"step": 48980, "loss": 0.8461, "grad_norm": "2.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.031e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.127e-01", "anc_acc": "5.776e-01", "epoch": 0.09796} {"step": 48985, "loss": 1.0358, "grad_norm": "3.269e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.922e-01", "anc_loss": "7.941e-01", "dlm_acc": "7.148e-01", "anc_acc": "6.839e-01", "epoch": 0.09797} {"step": 48990, "loss": 0.8403, "grad_norm": "2.245e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.516e-01", "anc_loss": "1.063e+00", "dlm_acc": "6.315e-01", "anc_acc": "5.998e-01", "epoch": 0.09798} {"step": 48995, "loss": 0.8921, "grad_norm": "2.991e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.334e+00", "anc_loss": "1.471e+00", "dlm_acc": "5.494e-01", "anc_acc": "5.183e-01", "epoch": 0.09799} {"step": 49000, "loss": 1.2007, "grad_norm": "2.295e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.358e+00", "anc_loss": "1.495e+00", "dlm_acc": "5.701e-01", "anc_acc": "5.382e-01", "epoch": 0.098} {"step": 49005, "loss": 1.1716, "grad_norm": "3.603e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.289e+00", "anc_loss": "1.418e+00", "dlm_acc": "5.327e-01", "anc_acc": "5.023e-01", "epoch": 0.09801} {"step": 49010, "loss": 0.9119, "grad_norm": "2.451e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.189e+00", "anc_loss": "1.296e+00", "dlm_acc": "5.253e-01", "anc_acc": "4.988e-01", "epoch": 0.09802} {"step": 49015, "loss": 0.9932, "grad_norm": "5.414e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.311e+00", "anc_loss": "1.438e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.384e-01", "epoch": 0.09803} {"step": 49020, "loss": 1.0829, "grad_norm": "4.597e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.800e-01", "anc_loss": "1.111e+00", "dlm_acc": "6.550e-01", "anc_acc": "6.186e-01", "epoch": 0.09804} {"step": 49025, "loss": 1.1892, "grad_norm": "2.514e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.309e+00", "anc_loss": "1.490e+00", "dlm_acc": "6.038e-01", "anc_acc": "5.784e-01", "epoch": 0.09805} {"step": 49030, "loss": 1.0673, "grad_norm": "3.226e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.342e+00", "anc_loss": "1.470e+00", "dlm_acc": "5.485e-01", "anc_acc": "5.164e-01", "epoch": 0.09806} {"step": 49035, "loss": 0.8718, "grad_norm": "2.307e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.988e-01", "anc_loss": "8.582e-01", "dlm_acc": "5.516e-01", "anc_acc": "5.360e-01", "epoch": 0.09807} {"step": 49040, "loss": 1.1645, "grad_norm": "3.688e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.023e+00", "anc_loss": "1.106e+00", "dlm_acc": "5.237e-01", "anc_acc": "5.002e-01", "epoch": 0.09808} {"step": 49045, "loss": 1.0438, "grad_norm": "2.654e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.148e+00", "anc_loss": "1.187e+00", "dlm_acc": "3.743e-01", "anc_acc": "3.665e-01", "epoch": 0.09809} {"step": 49050, "loss": 1.0675, "grad_norm": "2.871e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.159e+00", "anc_loss": "1.277e+00", "dlm_acc": "5.913e-01", "anc_acc": "5.615e-01", "epoch": 0.0981} {"step": 49055, "loss": 1.1835, "grad_norm": "3.950e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.390e+00", "anc_loss": "1.516e+00", "dlm_acc": "5.418e-01", "anc_acc": "5.123e-01", "epoch": 0.09811} {"step": 49060, "loss": 1.0926, "grad_norm": "5.862e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.229e+00", "anc_loss": "1.350e+00", "dlm_acc": "5.791e-01", "anc_acc": "5.505e-01", "epoch": 0.09812} {"step": 49065, "loss": 0.8784, "grad_norm": "1.917e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.159e+00", "dlm_acc": "5.941e-01", "anc_acc": "5.627e-01", "epoch": 0.09813} {"step": 49070, "loss": 0.8958, "grad_norm": "2.594e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.161e+00", "anc_loss": "1.294e+00", "dlm_acc": "5.663e-01", "anc_acc": "5.332e-01", "epoch": 0.09814} {"step": 49075, "loss": 1.8244, "grad_norm": "2.234e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.417e+00", "anc_loss": "1.545e+00", "dlm_acc": "5.493e-01", "anc_acc": "5.218e-01", "epoch": 0.09815} {"step": 49080, "loss": 1.375, "grad_norm": "4.893e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.464e+00", "anc_loss": "1.600e+00", "dlm_acc": "5.468e-01", "anc_acc": "5.135e-01", "epoch": 0.09816} {"step": 49085, "loss": 1.1209, "grad_norm": "3.958e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.137e+00", "anc_loss": "1.275e+00", "dlm_acc": "5.806e-01", "anc_acc": "5.437e-01", "epoch": 0.09817} {"step": 49090, "loss": 1.2729, "grad_norm": "3.069e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.348e+00", "anc_loss": "1.503e+00", "dlm_acc": "5.658e-01", "anc_acc": "5.298e-01", "epoch": 0.09818} {"step": 49095, "loss": 1.3358, "grad_norm": "3.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.372e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.463e-01", "anc_acc": "5.104e-01", "epoch": 0.09819} {"step": 49100, "loss": 1.255, "grad_norm": "2.477e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.598e+00", "anc_loss": "1.739e+00", "dlm_acc": "5.093e-01", "anc_acc": "4.758e-01", "epoch": 0.0982} {"step": 49105, "loss": 1.319, "grad_norm": "9.860e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.690e+00", "anc_loss": "1.844e+00", "dlm_acc": "4.791e-01", "anc_acc": "4.325e-01", "epoch": 0.09821} {"step": 49110, "loss": 0.904, "grad_norm": "2.730e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.883e-01", "anc_loss": "9.984e-01", "dlm_acc": "6.630e-01", "anc_acc": "6.345e-01", "epoch": 0.09822} {"step": 49115, "loss": 1.3772, "grad_norm": "3.340e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.494e+00", "anc_loss": "1.608e+00", "dlm_acc": "4.799e-01", "anc_acc": "4.519e-01", "epoch": 0.09823} {"step": 49120, "loss": 1.4704, "grad_norm": "2.882e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.506e+00", "anc_loss": "1.656e+00", "dlm_acc": "5.400e-01", "anc_acc": "5.068e-01", "epoch": 0.09824} {"step": 49125, "loss": 1.1475, "grad_norm": "3.261e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.698e+00", "dlm_acc": "5.000e-01", "anc_acc": "4.730e-01", "epoch": 0.09825} {"step": 49130, "loss": 0.8906, "grad_norm": "2.777e-01", "learning_rate": "1.000e-04", "dlm_loss": "3.609e-01", "anc_loss": "3.961e-01", "dlm_acc": "8.083e-01", "anc_acc": "7.954e-01", "epoch": 0.09826} {"step": 49135, "loss": 0.9584, "grad_norm": "3.170e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.012e+00", "anc_loss": "1.126e+00", "dlm_acc": "6.380e-01", "anc_acc": "6.075e-01", "epoch": 0.09827} {"step": 49140, "loss": 1.1415, "grad_norm": "7.238e-01", "learning_rate": "1.000e-04", "dlm_loss": "4.443e-01", "anc_loss": "4.773e-01", "dlm_acc": "8.407e-01", "anc_acc": "8.367e-01", "epoch": 0.09828} {"step": 49145, "loss": 0.7693, "grad_norm": "9.065e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.994e-01", "anc_loss": "2.462e-01", "dlm_acc": "8.934e-01", "anc_acc": "8.789e-01", "epoch": 0.09829} {"step": 49150, "loss": 1.1883, "grad_norm": "4.007e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.207e-01", "anc_loss": "2.678e-01", "dlm_acc": "8.955e-01", "anc_acc": "8.795e-01", "epoch": 0.0983} {"step": 49155, "loss": 0.976, "grad_norm": "2.649e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.653e-01", "anc_loss": "2.138e-01", "dlm_acc": "9.104e-01", "anc_acc": "8.882e-01", "epoch": 0.09831} {"step": 49160, "loss": 1.3114, "grad_norm": "5.114e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.234e+00", "anc_loss": "1.369e+00", "dlm_acc": "5.830e-01", "anc_acc": "5.524e-01", "epoch": 0.09832} {"step": 49165, "loss": 1.0327, "grad_norm": "2.300e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.103e+00", "anc_loss": "1.236e+00", "dlm_acc": "5.780e-01", "anc_acc": "5.440e-01", "epoch": 0.09833} {"step": 49170, "loss": 1.2643, "grad_norm": "3.508e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.297e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.049e-01", "anc_acc": "4.708e-01", "epoch": 0.09834} {"step": 49175, "loss": 1.1757, "grad_norm": "2.592e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.788e-01", "anc_loss": "6.480e-01", "dlm_acc": "7.677e-01", "anc_acc": "7.489e-01", "epoch": 0.09835} {"step": 49180, "loss": 1.155, "grad_norm": "2.762e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.383e-01", "anc_loss": "9.094e-01", "dlm_acc": "5.438e-01", "anc_acc": "5.200e-01", "epoch": 0.09836} {"step": 49185, "loss": 1.0414, "grad_norm": "3.317e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.773e-01", "anc_loss": "7.094e-01", "dlm_acc": "4.662e-01", "anc_acc": "4.466e-01", "epoch": 0.09837} {"step": 49190, "loss": 1.3742, "grad_norm": "4.878e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.609e-01", "anc_loss": "6.867e-01", "dlm_acc": "4.733e-01", "anc_acc": "4.533e-01", "epoch": 0.09838} {"step": 49195, "loss": 1.2063, "grad_norm": "4.923e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.633e-01", "anc_loss": "6.930e-01", "dlm_acc": "4.610e-01", "anc_acc": "4.393e-01", "epoch": 0.09839} {"step": 49200, "loss": 0.9031, "grad_norm": "1.546e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.492e-01", "anc_loss": "9.211e-01", "dlm_acc": "5.210e-01", "anc_acc": "4.953e-01", "epoch": 0.0984} {"step": 49205, "loss": 1.3833, "grad_norm": "5.509e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.333e+00", "anc_loss": "1.470e+00", "dlm_acc": "5.845e-01", "anc_acc": "5.540e-01", "epoch": 0.09841} {"step": 49210, "loss": 0.9534, "grad_norm": "7.225e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.945e-01", "anc_loss": "1.009e+00", "dlm_acc": "6.323e-01", "anc_acc": "6.012e-01", "epoch": 0.09842} {"step": 49215, "loss": 0.8752, "grad_norm": "5.769e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.226e-01", "anc_loss": "1.808e-01", "dlm_acc": "9.173e-01", "anc_acc": "8.791e-01", "epoch": 0.09843} {"step": 49220, "loss": 1.1791, "grad_norm": "4.644e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.129e-01", "anc_loss": "1.012e+00", "dlm_acc": "6.992e-01", "anc_acc": "6.690e-01", "epoch": 0.09844} {"step": 49225, "loss": 0.9745, "grad_norm": "3.419e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.843e-01", "anc_loss": "8.753e-01", "dlm_acc": "7.173e-01", "anc_acc": "6.909e-01", "epoch": 0.09845} {"step": 49230, "loss": 1.1076, "grad_norm": "4.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.000e-01", "anc_loss": "8.137e-01", "dlm_acc": "7.222e-01", "anc_acc": "6.920e-01", "epoch": 0.09846} {"step": 49235, "loss": 1.5947, "grad_norm": "4.076e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.238e+00", "anc_loss": "1.380e+00", "dlm_acc": "5.795e-01", "anc_acc": "5.481e-01", "epoch": 0.09847} {"step": 49240, "loss": 1.2778, "grad_norm": "2.955e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.834e-01", "anc_loss": "8.941e-01", "dlm_acc": "7.164e-01", "anc_acc": "6.810e-01", "epoch": 0.09848} {"step": 49245, "loss": 1.7752, "grad_norm": "4.095e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.162e+00", "anc_loss": "1.287e+00", "dlm_acc": "6.372e-01", "anc_acc": "6.056e-01", "epoch": 0.09849} {"step": 49250, "loss": 1.5564, "grad_norm": "3.467e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.871e-01", "anc_loss": "1.092e+00", "dlm_acc": "6.292e-01", "anc_acc": "6.022e-01", "epoch": 0.0985} {"step": 49255, "loss": 1.3854, "grad_norm": "2.857e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.216e-01", "anc_loss": "1.031e+00", "dlm_acc": "7.063e-01", "anc_acc": "6.816e-01", "epoch": 0.09851} {"step": 49260, "loss": 1.4215, "grad_norm": "1.039e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.034e+00", "anc_loss": "1.176e+00", "dlm_acc": "6.286e-01", "anc_acc": "5.854e-01", "epoch": 0.09852} {"step": 49265, "loss": 1.3932, "grad_norm": "6.242e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.201e+00", "anc_loss": "1.330e+00", "dlm_acc": "5.527e-01", "anc_acc": "5.193e-01", "epoch": 0.09853} {"step": 49270, "loss": 1.0332, "grad_norm": "2.876e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.011e+00", "anc_loss": "1.103e+00", "dlm_acc": "5.953e-01", "anc_acc": "5.727e-01", "epoch": 0.09854} {"step": 49275, "loss": 0.7892, "grad_norm": "2.960e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.982e-01", "anc_loss": "6.750e-01", "dlm_acc": "6.991e-01", "anc_acc": "6.602e-01", "epoch": 0.09855} {"step": 49280, "loss": 0.879, "grad_norm": "7.635e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.426e-01", "anc_loss": "8.187e-01", "dlm_acc": "6.197e-01", "anc_acc": "5.979e-01", "epoch": 0.09856} {"step": 49285, "loss": 0.9215, "grad_norm": "3.903e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.766e-01", "anc_loss": "6.891e-01", "dlm_acc": "4.127e-01", "anc_acc": "4.060e-01", "epoch": 0.09857} {"step": 49290, "loss": 1.2698, "grad_norm": "3.712e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.227e-01", "anc_loss": "8.367e-01", "dlm_acc": "4.039e-01", "anc_acc": "3.962e-01", "epoch": 0.09858} {"step": 49295, "loss": 1.265, "grad_norm": "4.366e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.133e-01", "anc_loss": "8.281e-01", "dlm_acc": "4.098e-01", "anc_acc": "4.012e-01", "epoch": 0.09859} {"step": 49300, "loss": 1.1638, "grad_norm": "3.355e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.141e-01", "anc_loss": "8.281e-01", "dlm_acc": "3.990e-01", "anc_acc": "3.922e-01", "epoch": 0.0986} {"step": 49305, "loss": 0.8984, "grad_norm": "3.323e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.004e-01", "anc_loss": "8.949e-01", "dlm_acc": "6.771e-01", "anc_acc": "6.506e-01", "epoch": 0.09861} {"step": 49310, "loss": 0.9476, "grad_norm": "4.843e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.930e-01", "anc_loss": "9.781e-01", "dlm_acc": "6.527e-01", "anc_acc": "6.275e-01", "epoch": 0.09862} {"step": 49315, "loss": 1.2733, "grad_norm": "2.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.703e-01", "anc_loss": "9.602e-01", "dlm_acc": "6.075e-01", "anc_acc": "5.785e-01", "epoch": 0.09863} {"step": 49320, "loss": 1.3022, "grad_norm": "4.304e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.348e-01", "anc_loss": "9.532e-01", "dlm_acc": "7.111e-01", "anc_acc": "6.829e-01", "epoch": 0.09864} {"step": 49325, "loss": 1.1107, "grad_norm": "3.255e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.113e-01", "anc_loss": "5.500e-01", "dlm_acc": "6.257e-01", "anc_acc": "6.009e-01", "epoch": 0.09865} {"step": 49330, "loss": 1.4284, "grad_norm": "5.285e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.139e+00", "anc_loss": "1.218e+00", "dlm_acc": "5.435e-01", "anc_acc": "5.236e-01", "epoch": 0.09866} {"step": 49335, "loss": 1.3888, "grad_norm": "4.029e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.137e-01", "anc_loss": "1.038e+00", "dlm_acc": "6.708e-01", "anc_acc": "6.311e-01", "epoch": 0.09867} {"step": 49340, "loss": 1.3976, "grad_norm": "3.700e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.213e+00", "anc_loss": "1.325e+00", "dlm_acc": "5.349e-01", "anc_acc": "5.100e-01", "epoch": 0.09868} {"step": 49345, "loss": 0.9158, "grad_norm": "2.721e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.895e-01", "anc_loss": "7.371e-01", "dlm_acc": "6.410e-01", "anc_acc": "6.252e-01", "epoch": 0.09869} {"step": 49350, "loss": 1.4445, "grad_norm": "3.600e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.458e+00", "anc_loss": "1.587e+00", "dlm_acc": "5.525e-01", "anc_acc": "5.253e-01", "epoch": 0.0987} {"step": 49355, "loss": 1.4221, "grad_norm": "4.568e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.180e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.817e-01", "anc_acc": "5.513e-01", "epoch": 0.09871} {"step": 49360, "loss": 1.4161, "grad_norm": "3.900e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.520e-01", "anc_loss": "8.117e-01", "dlm_acc": "5.706e-01", "anc_acc": "5.454e-01", "epoch": 0.09872} {"step": 49365, "loss": 1.1888, "grad_norm": "3.111e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.680e-01", "anc_loss": "6.070e-01", "dlm_acc": "5.938e-01", "anc_acc": "5.685e-01", "epoch": 0.09873} {"step": 49370, "loss": 1.2098, "grad_norm": "3.607e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.157e+00", "anc_loss": "1.260e+00", "dlm_acc": "5.712e-01", "anc_acc": "5.411e-01", "epoch": 0.09874} {"step": 49375, "loss": 1.1937, "grad_norm": "3.034e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.448e+00", "dlm_acc": "5.580e-01", "anc_acc": "5.234e-01", "epoch": 0.09875} {"step": 49380, "loss": 1.3616, "grad_norm": "2.144e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.100e+00", "dlm_acc": "6.185e-01", "anc_acc": "5.902e-01", "epoch": 0.09876} {"step": 49385, "loss": 0.9618, "grad_norm": "1.412e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.805e-01", "anc_loss": "9.539e-01", "dlm_acc": "5.539e-01", "anc_acc": "5.289e-01", "epoch": 0.09877} {"step": 49390, "loss": 1.2965, "grad_norm": "4.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.379e-01", "anc_loss": "1.010e+00", "dlm_acc": "5.294e-01", "anc_acc": "5.073e-01", "epoch": 0.09878} {"step": 49395, "loss": 1.3769, "grad_norm": "4.889e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.152e+00", "anc_loss": "1.243e+00", "dlm_acc": "4.619e-01", "anc_acc": "4.376e-01", "epoch": 0.09879} {"step": 49400, "loss": 1.165, "grad_norm": "3.402e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.828e-01", "anc_loss": "1.096e+00", "dlm_acc": "6.695e-01", "anc_acc": "5.954e-01", "epoch": 0.0988} {"step": 49405, "loss": 1.2899, "grad_norm": "1.543e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.471e+00", "anc_loss": "1.607e+00", "dlm_acc": "5.288e-01", "anc_acc": "4.965e-01", "epoch": 0.09881} {"step": 49410, "loss": 1.3678, "grad_norm": "3.497e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.470e+00", "anc_loss": "1.598e+00", "dlm_acc": "4.490e-01", "anc_acc": "4.137e-01", "epoch": 0.09882} {"step": 49415, "loss": 1.1776, "grad_norm": "2.587e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.046e+00", "anc_loss": "1.189e+00", "dlm_acc": "5.671e-01", "anc_acc": "5.203e-01", "epoch": 0.09883} {"step": 49420, "loss": 1.4793, "grad_norm": "5.920e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.385e+00", "dlm_acc": "5.064e-01", "anc_acc": "5.047e-01", "epoch": 0.09884} {"step": 49425, "loss": 1.1739, "grad_norm": "4.502e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.257e-01", "anc_loss": "8.471e-01", "dlm_acc": "7.228e-01", "anc_acc": "6.838e-01", "epoch": 0.09885} {"step": 49430, "loss": 1.1314, "grad_norm": "2.743e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.113e+00", "anc_loss": "1.248e+00", "dlm_acc": "5.721e-01", "anc_acc": "5.325e-01", "epoch": 0.09886} {"step": 49435, "loss": 1.508, "grad_norm": "5.214e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.564e+00", "anc_loss": "1.743e+00", "dlm_acc": "5.296e-01", "anc_acc": "4.925e-01", "epoch": 0.09887} {"step": 49440, "loss": 1.1728, "grad_norm": "3.107e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.377e+00", "anc_loss": "1.519e+00", "dlm_acc": "5.394e-01", "anc_acc": "5.015e-01", "epoch": 0.09888} {"step": 49445, "loss": 0.9771, "grad_norm": "2.564e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.289e-01", "anc_loss": "1.027e+00", "dlm_acc": "6.300e-01", "anc_acc": "5.960e-01", "epoch": 0.09889} {"step": 49450, "loss": 1.215, "grad_norm": "7.708e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.352e+00", "dlm_acc": "5.316e-01", "anc_acc": "4.924e-01", "epoch": 0.0989} {"step": 49455, "loss": 1.0283, "grad_norm": "1.520e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.214e-01", "anc_loss": "9.170e-01", "dlm_acc": "6.555e-01", "anc_acc": "6.246e-01", "epoch": 0.09891} {"step": 49460, "loss": 0.8484, "grad_norm": "3.960e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.852e-01", "anc_loss": "1.112e+00", "dlm_acc": "6.638e-01", "anc_acc": "6.270e-01", "epoch": 0.09892} {"step": 49465, "loss": 0.9888, "grad_norm": "5.057e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.945e-01", "anc_loss": "9.750e-01", "dlm_acc": "5.957e-01", "anc_acc": "5.661e-01", "epoch": 0.09893} {"step": 49470, "loss": 0.7466, "grad_norm": "2.713e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.770e-01", "anc_loss": "8.777e-01", "dlm_acc": "6.507e-01", "anc_acc": "6.148e-01", "epoch": 0.09894} {"step": 49475, "loss": 0.6892, "grad_norm": "3.231e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.750e-01", "anc_loss": "6.832e-01", "dlm_acc": "7.720e-01", "anc_acc": "7.335e-01", "epoch": 0.09895} {"step": 49480, "loss": 1.0468, "grad_norm": "5.423e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.248e+00", "anc_loss": "1.399e+00", "dlm_acc": "5.676e-01", "anc_acc": "5.297e-01", "epoch": 0.09896} {"step": 49485, "loss": 0.937, "grad_norm": "3.763e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.156e+00", "anc_loss": "1.305e+00", "dlm_acc": "5.662e-01", "anc_acc": "5.226e-01", "epoch": 0.09897} {"step": 49490, "loss": 1.2757, "grad_norm": "5.684e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.073e+00", "anc_loss": "1.194e+00", "dlm_acc": "5.720e-01", "anc_acc": "5.392e-01", "epoch": 0.09898} {"step": 49495, "loss": 1.187, "grad_norm": "6.278e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.342e-01", "anc_loss": "9.402e-01", "dlm_acc": "6.535e-01", "anc_acc": "6.206e-01", "epoch": 0.09899} {"step": 49500, "loss": 1.1405, "grad_norm": "6.010e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.223e+00", "anc_loss": "1.370e+00", "dlm_acc": "5.616e-01", "anc_acc": "5.191e-01", "epoch": 0.099} {"step": 49505, "loss": 1.4764, "grad_norm": "7.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.522e+00", "anc_loss": "1.684e+00", "dlm_acc": "5.089e-01", "anc_acc": "4.701e-01", "epoch": 0.09901} {"step": 49510, "loss": 1.1914, "grad_norm": "2.614e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.573e+00", "anc_loss": "1.657e+00", "dlm_acc": "4.305e-01", "anc_acc": "4.088e-01", "epoch": 0.09902} {"step": 49515, "loss": 0.9272, "grad_norm": "4.000e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.734e-01", "anc_loss": "7.334e-01", "dlm_acc": "6.528e-01", "anc_acc": "6.295e-01", "epoch": 0.09903} {"step": 49520, "loss": 1.1945, "grad_norm": "5.384e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.141e-01", "anc_loss": "6.764e-01", "dlm_acc": "7.340e-01", "anc_acc": "7.102e-01", "epoch": 0.09904} {"step": 49525, "loss": 1.0778, "grad_norm": "4.571e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.379e-01", "anc_loss": "9.527e-01", "dlm_acc": "6.558e-01", "anc_acc": "6.163e-01", "epoch": 0.09905} {"step": 49530, "loss": 1.0242, "grad_norm": "2.284e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.922e-01", "anc_loss": "1.007e+00", "dlm_acc": "6.659e-01", "anc_acc": "6.314e-01", "epoch": 0.09906} {"step": 49535, "loss": 1.4732, "grad_norm": "2.100e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.688e+00", "anc_loss": "1.789e+00", "dlm_acc": "3.350e-01", "anc_acc": "3.107e-01", "epoch": 0.09907} {"step": 49540, "loss": 2.0249, "grad_norm": "1.069e+00", "learning_rate": "1.000e-04", "dlm_loss": "2.819e+00", "anc_loss": "2.831e+00", "dlm_acc": "2.416e-02", "anc_acc": "2.289e-02", "epoch": 0.09908} {"step": 49545, "loss": 1.326, "grad_norm": "4.519e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.513e+00", "anc_loss": "2.516e+00", "dlm_acc": "2.502e-02", "anc_acc": "2.498e-02", "epoch": 0.09909} {"step": 49550, "loss": 1.6575, "grad_norm": "3.301e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.991e+00", "anc_loss": "3.003e+00", "dlm_acc": "2.737e-02", "anc_acc": "2.633e-02", "epoch": 0.0991} {"step": 49555, "loss": 1.0425, "grad_norm": "2.879e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.233e+00", "anc_loss": "1.312e+00", "dlm_acc": "3.950e-01", "anc_acc": "3.507e-01", "epoch": 0.09911} {"step": 49560, "loss": 1.1373, "grad_norm": "3.258e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.415e+00", "anc_loss": "1.541e+00", "dlm_acc": "5.401e-01", "anc_acc": "5.101e-01", "epoch": 0.09912} {"step": 49565, "loss": 0.9515, "grad_norm": "2.342e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.027e+00", "anc_loss": "1.188e+00", "dlm_acc": "6.022e-01", "anc_acc": "5.498e-01", "epoch": 0.09913} {"step": 49570, "loss": 1.3412, "grad_norm": "5.948e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.466e+00", "anc_loss": "1.583e+00", "dlm_acc": "5.023e-01", "anc_acc": "4.713e-01", "epoch": 0.09914} {"step": 49575, "loss": 1.4669, "grad_norm": "9.043e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.453e+00", "anc_loss": "1.584e+00", "dlm_acc": "5.365e-01", "anc_acc": "5.043e-01", "epoch": 0.09915} {"step": 49580, "loss": 1.0416, "grad_norm": "5.954e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.231e+00", "anc_loss": "1.364e+00", "dlm_acc": "5.652e-01", "anc_acc": "5.329e-01", "epoch": 0.09916} {"step": 49585, "loss": 1.2999, "grad_norm": "7.300e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.257e+00", "anc_loss": "1.386e+00", "dlm_acc": "5.955e-01", "anc_acc": "5.662e-01", "epoch": 0.09917} {"step": 49590, "loss": 0.8302, "grad_norm": "3.009e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.000e-01", "anc_loss": "8.883e-01", "dlm_acc": "6.623e-01", "anc_acc": "6.399e-01", "epoch": 0.09918} {"step": 49595, "loss": 1.0887, "grad_norm": "1.093e+00", "learning_rate": "1.000e-04", "dlm_loss": "1.559e+00", "anc_loss": "1.689e+00", "dlm_acc": "5.450e-01", "anc_acc": "5.276e-01", "epoch": 0.09919} {"step": 49600, "loss": 1.2126, "grad_norm": "2.561e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.437e+00", "anc_loss": "1.548e+00", "dlm_acc": "5.493e-01", "anc_acc": "5.236e-01", "epoch": 0.0992} {"step": 49605, "loss": 1.3733, "grad_norm": "2.356e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.555e+00", "anc_loss": "1.700e+00", "dlm_acc": "5.325e-01", "anc_acc": "5.012e-01", "epoch": 0.09921} {"step": 49610, "loss": 1.2429, "grad_norm": "8.753e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.150e+00", "anc_loss": "1.242e+00", "dlm_acc": "6.271e-01", "anc_acc": "6.006e-01", "epoch": 0.09922} {"step": 49615, "loss": 1.248, "grad_norm": "2.586e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.372e+00", "anc_loss": "1.506e+00", "dlm_acc": "4.756e-01", "anc_acc": "4.469e-01", "epoch": 0.09923} {"step": 49620, "loss": 1.3812, "grad_norm": "3.599e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.046e+00", "anc_loss": "1.155e+00", "dlm_acc": "6.260e-01", "anc_acc": "6.000e-01", "epoch": 0.09924} {"step": 49625, "loss": 1.2271, "grad_norm": "2.097e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.138e+00", "anc_loss": "1.216e+00", "dlm_acc": "4.406e-01", "anc_acc": "4.252e-01", "epoch": 0.09925} {"step": 49630, "loss": 1.1676, "grad_norm": "1.505e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.045e+00", "anc_loss": "1.098e+00", "dlm_acc": "4.672e-01", "anc_acc": "4.502e-01", "epoch": 0.09926} {"step": 49635, "loss": 1.8842, "grad_norm": "3.466e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.481e+00", "anc_loss": "1.609e+00", "dlm_acc": "5.198e-01", "anc_acc": "4.937e-01", "epoch": 0.09927} {"step": 49640, "loss": 1.1423, "grad_norm": "2.072e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.940e-01", "anc_loss": "9.753e-01", "dlm_acc": "6.350e-01", "anc_acc": "6.095e-01", "epoch": 0.09928} {"step": 49645, "loss": 1.2268, "grad_norm": "2.807e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.261e+00", "anc_loss": "1.414e+00", "dlm_acc": "6.094e-01", "anc_acc": "5.748e-01", "epoch": 0.09929} {"step": 49650, "loss": 1.3726, "grad_norm": "2.582e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.406e+00", "anc_loss": "1.527e+00", "dlm_acc": "5.321e-01", "anc_acc": "5.034e-01", "epoch": 0.0993} {"step": 49655, "loss": 1.078, "grad_norm": "4.212e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.327e+00", "anc_loss": "1.434e+00", "dlm_acc": "5.095e-01", "anc_acc": "4.802e-01", "epoch": 0.09931} {"step": 49660, "loss": 1.2886, "grad_norm": "3.468e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.163e+00", "anc_loss": "1.322e+00", "dlm_acc": "6.032e-01", "anc_acc": "5.646e-01", "epoch": 0.09932} {"step": 49665, "loss": 1.2962, "grad_norm": "2.387e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.252e+00", "anc_loss": "1.391e+00", "dlm_acc": "5.890e-01", "anc_acc": "5.555e-01", "epoch": 0.09933} {"step": 49670, "loss": 1.1311, "grad_norm": "3.079e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.134e+00", "anc_loss": "1.275e+00", "dlm_acc": "6.044e-01", "anc_acc": "5.707e-01", "epoch": 0.09934} {"step": 49675, "loss": 1.1622, "grad_norm": "4.685e-01", "learning_rate": "1.000e-04", "dlm_loss": "6.605e-01", "anc_loss": "7.828e-01", "dlm_acc": "7.256e-01", "anc_acc": "6.892e-01", "epoch": 0.09935} {"step": 49680, "loss": 0.725, "grad_norm": "1.881e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.180e-01", "anc_loss": "8.203e-01", "dlm_acc": "6.989e-01", "anc_acc": "6.684e-01", "epoch": 0.09936} {"step": 49685, "loss": 0.9833, "grad_norm": "2.646e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.103e+00", "anc_loss": "1.224e+00", "dlm_acc": "5.997e-01", "anc_acc": "5.680e-01", "epoch": 0.09937} {"step": 49690, "loss": 0.9569, "grad_norm": "4.371e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.015e+00", "anc_loss": "1.130e+00", "dlm_acc": "6.370e-01", "anc_acc": "6.031e-01", "epoch": 0.09938} {"step": 49695, "loss": 1.0138, "grad_norm": "1.944e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.146e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.887e-01", "anc_acc": "5.525e-01", "epoch": 0.09939} {"step": 49700, "loss": 0.9208, "grad_norm": "3.359e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.314e+00", "anc_loss": "1.451e+00", "dlm_acc": "5.591e-01", "anc_acc": "5.278e-01", "epoch": 0.0994} {"step": 49705, "loss": 1.0287, "grad_norm": "3.572e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.564e+00", "anc_loss": "1.692e+00", "dlm_acc": "4.784e-01", "anc_acc": "4.484e-01", "epoch": 0.09941} {"step": 49710, "loss": 1.4437, "grad_norm": "4.618e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.855e+00", "anc_loss": "1.981e+00", "dlm_acc": "4.730e-01", "anc_acc": "4.447e-01", "epoch": 0.09942} {"step": 49715, "loss": 1.3925, "grad_norm": "2.789e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.320e+00", "anc_loss": "1.459e+00", "dlm_acc": "5.938e-01", "anc_acc": "5.629e-01", "epoch": 0.09943} {"step": 49720, "loss": 1.5528, "grad_norm": "3.795e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.423e+00", "anc_loss": "1.557e+00", "dlm_acc": "5.353e-01", "anc_acc": "5.046e-01", "epoch": 0.09944} {"step": 49725, "loss": 1.7981, "grad_norm": "4.448e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.692e+00", "dlm_acc": "4.857e-01", "anc_acc": "4.542e-01", "epoch": 0.09945} {"step": 49730, "loss": 1.0982, "grad_norm": "3.720e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.602e-01", "anc_loss": "1.073e+00", "dlm_acc": "6.132e-01", "anc_acc": "5.786e-01", "epoch": 0.09946} {"step": 49735, "loss": 1.2778, "grad_norm": "5.633e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.254e+00", "anc_loss": "1.384e+00", "dlm_acc": "5.533e-01", "anc_acc": "5.159e-01", "epoch": 0.09947} {"step": 49740, "loss": 1.2606, "grad_norm": "2.790e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.184e+00", "anc_loss": "1.370e+00", "dlm_acc": "6.118e-01", "anc_acc": "5.677e-01", "epoch": 0.09948} {"step": 49745, "loss": 0.9235, "grad_norm": "3.163e-01", "learning_rate": "1.000e-04", "dlm_loss": "5.961e-01", "anc_loss": "6.777e-01", "dlm_acc": "7.621e-01", "anc_acc": "7.452e-01", "epoch": 0.09949} {"step": 49750, "loss": 1.0532, "grad_norm": "6.155e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.773e-01", "anc_loss": "1.198e+00", "dlm_acc": "6.194e-01", "anc_acc": "5.441e-01", "epoch": 0.0995} {"step": 49755, "loss": 1.2853, "grad_norm": "6.297e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.127e+00", "anc_loss": "1.215e+00", "dlm_acc": "5.232e-01", "anc_acc": "5.001e-01", "epoch": 0.09951} {"step": 49760, "loss": 1.4966, "grad_norm": "4.250e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.166e+00", "anc_loss": "1.291e+00", "dlm_acc": "5.377e-01", "anc_acc": "5.074e-01", "epoch": 0.09952} {"step": 49765, "loss": 1.1642, "grad_norm": "3.112e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.106e-01", "anc_loss": "7.854e-01", "dlm_acc": "6.316e-01", "anc_acc": "6.088e-01", "epoch": 0.09953} {"step": 49770, "loss": 1.2061, "grad_norm": "3.383e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.112e+00", "anc_loss": "1.180e+00", "dlm_acc": "5.922e-01", "anc_acc": "5.739e-01", "epoch": 0.09954} {"step": 49775, "loss": 1.4332, "grad_norm": "3.659e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.280e+00", "anc_loss": "1.418e+00", "dlm_acc": "5.914e-01", "anc_acc": "5.555e-01", "epoch": 0.09955} {"step": 49780, "loss": 1.4869, "grad_norm": "2.798e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.427e+00", "anc_loss": "1.556e+00", "dlm_acc": "5.347e-01", "anc_acc": "5.047e-01", "epoch": 0.09956} {"step": 49785, "loss": 1.8422, "grad_norm": "2.261e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.530e+00", "anc_loss": "1.673e+00", "dlm_acc": "5.220e-01", "anc_acc": "4.883e-01", "epoch": 0.09957} {"step": 49790, "loss": 1.0319, "grad_norm": "7.015e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.477e-01", "anc_loss": "8.344e-01", "dlm_acc": "6.540e-01", "anc_acc": "6.319e-01", "epoch": 0.09958} {"step": 49795, "loss": 1.1778, "grad_norm": "2.940e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.039e+00", "anc_loss": "1.193e+00", "dlm_acc": "6.336e-01", "anc_acc": "5.941e-01", "epoch": 0.09959} {"step": 49800, "loss": 1.1973, "grad_norm": "2.642e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.758e-01", "anc_loss": "1.202e+00", "dlm_acc": "6.242e-01", "anc_acc": "5.598e-01", "epoch": 0.0996} {"step": 49805, "loss": 1.2535, "grad_norm": "2.833e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.750e-01", "anc_loss": "1.033e+00", "dlm_acc": "6.012e-01", "anc_acc": "5.522e-01", "epoch": 0.09961} {"step": 49810, "loss": 1.0144, "grad_norm": "2.310e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.000e-01", "anc_loss": "8.949e-01", "dlm_acc": "6.642e-01", "anc_acc": "6.376e-01", "epoch": 0.09962} {"step": 49815, "loss": 1.4597, "grad_norm": "3.747e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.246e+00", "anc_loss": "1.400e+00", "dlm_acc": "5.731e-01", "anc_acc": "5.366e-01", "epoch": 0.09963} {"step": 49820, "loss": 1.3477, "grad_norm": "1.683e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.117e+00", "anc_loss": "1.237e+00", "dlm_acc": "6.192e-01", "anc_acc": "5.901e-01", "epoch": 0.09964} {"step": 49825, "loss": 1.0158, "grad_norm": "4.101e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.961e-01", "anc_loss": "1.115e+00", "dlm_acc": "6.104e-01", "anc_acc": "5.803e-01", "epoch": 0.09965} {"step": 49830, "loss": 1.5554, "grad_norm": "3.185e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.550e+00", "anc_loss": "1.691e+00", "dlm_acc": "5.180e-01", "anc_acc": "4.877e-01", "epoch": 0.09966} {"step": 49835, "loss": 1.025, "grad_norm": "2.548e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.462e+00", "anc_loss": "1.599e+00", "dlm_acc": "4.406e-01", "anc_acc": "3.958e-01", "epoch": 0.09967} {"step": 49840, "loss": 1.0734, "grad_norm": "2.221e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.001e+00", "anc_loss": "1.143e+00", "dlm_acc": "6.382e-01", "anc_acc": "5.914e-01", "epoch": 0.09968} {"step": 49845, "loss": 1.21, "grad_norm": "2.205e-01", "learning_rate": "1.000e-04", "dlm_loss": "8.287e-01", "anc_loss": "9.756e-01", "dlm_acc": "6.856e-01", "anc_acc": "6.364e-01", "epoch": 0.09969} {"step": 49850, "loss": 1.7155, "grad_norm": "2.735e-01", "learning_rate": "1.000e-04", "dlm_loss": "2.169e+00", "anc_loss": "2.220e+00", "dlm_acc": "2.620e-01", "anc_acc": "2.514e-01", "epoch": 0.0997} {"step": 49855, "loss": 1.5487, "grad_norm": "3.551e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.215e+00", "anc_loss": "1.387e+00", "dlm_acc": "5.860e-01", "anc_acc": "5.410e-01", "epoch": 0.09971} {"step": 49860, "loss": 1.5144, "grad_norm": "4.314e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.200e+00", "anc_loss": "1.330e+00", "dlm_acc": "6.044e-01", "anc_acc": "5.731e-01", "epoch": 0.09972} {"step": 49865, "loss": 1.2456, "grad_norm": "5.454e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.050e+00", "anc_loss": "1.170e+00", "dlm_acc": "6.387e-01", "anc_acc": "6.052e-01", "epoch": 0.09973} {"step": 49870, "loss": 1.3851, "grad_norm": "1.961e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.037e+00", "anc_loss": "1.145e+00", "dlm_acc": "6.586e-01", "anc_acc": "6.314e-01", "epoch": 0.09974} {"step": 49875, "loss": 1.5473, "grad_norm": "4.259e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.287e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.659e-01", "anc_acc": "5.313e-01", "epoch": 0.09975} {"step": 49880, "loss": 1.6534, "grad_norm": "2.652e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.508e+00", "anc_loss": "1.637e+00", "dlm_acc": "5.463e-01", "anc_acc": "5.161e-01", "epoch": 0.09976} {"step": 49885, "loss": 1.4263, "grad_norm": "3.845e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.278e+00", "anc_loss": "1.420e+00", "dlm_acc": "5.740e-01", "anc_acc": "5.381e-01", "epoch": 0.09977} {"step": 49890, "loss": 1.3063, "grad_norm": "4.372e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.224e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.812e-01", "anc_acc": "5.510e-01", "epoch": 0.09978} {"step": 49895, "loss": 1.3908, "grad_norm": "2.120e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.368e+00", "anc_loss": "1.484e+00", "dlm_acc": "5.482e-01", "anc_acc": "5.169e-01", "epoch": 0.09979} {"step": 49900, "loss": 1.234, "grad_norm": "2.828e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.211e+00", "anc_loss": "1.342e+00", "dlm_acc": "5.814e-01", "anc_acc": "5.491e-01", "epoch": 0.0998} {"step": 49905, "loss": 1.6325, "grad_norm": "3.941e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.695e+00", "anc_loss": "1.811e+00", "dlm_acc": "4.924e-01", "anc_acc": "4.694e-01", "epoch": 0.09981} {"step": 49910, "loss": 1.1187, "grad_norm": "3.309e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.236e+00", "anc_loss": "1.349e+00", "dlm_acc": "5.798e-01", "anc_acc": "5.502e-01", "epoch": 0.09982} {"step": 49915, "loss": 1.3082, "grad_norm": "2.696e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.122e+00", "anc_loss": "1.255e+00", "dlm_acc": "6.164e-01", "anc_acc": "5.877e-01", "epoch": 0.09983} {"step": 49920, "loss": 1.3859, "grad_norm": "2.620e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.165e+00", "anc_loss": "1.298e+00", "dlm_acc": "6.102e-01", "anc_acc": "5.777e-01", "epoch": 0.09984} {"step": 49925, "loss": 1.3602, "grad_norm": "3.772e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.277e+00", "anc_loss": "1.408e+00", "dlm_acc": "5.790e-01", "anc_acc": "5.448e-01", "epoch": 0.09985} {"step": 49930, "loss": 1.0549, "grad_norm": "2.050e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.567e+00", "dlm_acc": "4.538e-01", "anc_acc": "4.250e-01", "epoch": 0.09986} {"step": 49935, "loss": 1.547, "grad_norm": "3.637e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.265e+00", "anc_loss": "1.397e+00", "dlm_acc": "5.418e-01", "anc_acc": "5.085e-01", "epoch": 0.09987} {"step": 49940, "loss": 1.7828, "grad_norm": "4.227e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.867e+00", "anc_loss": "2.156e+00", "dlm_acc": "4.211e-01", "anc_acc": "3.761e-01", "epoch": 0.09988} {"step": 49945, "loss": 1.2181, "grad_norm": "4.264e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.116e+00", "anc_loss": "1.275e+00", "dlm_acc": "5.894e-01", "anc_acc": "5.451e-01", "epoch": 0.09989} {"step": 49950, "loss": 1.17, "grad_norm": "4.374e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.240e+00", "anc_loss": "1.366e+00", "dlm_acc": "5.542e-01", "anc_acc": "5.241e-01", "epoch": 0.0999} {"step": 49955, "loss": 1.3911, "grad_norm": "2.589e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.558e+00", "anc_loss": "1.695e+00", "dlm_acc": "4.908e-01", "anc_acc": "4.611e-01", "epoch": 0.09991} {"step": 49960, "loss": 1.4895, "grad_norm": "6.922e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.461e+00", "anc_loss": "1.581e+00", "dlm_acc": "5.181e-01", "anc_acc": "4.898e-01", "epoch": 0.09992} {"step": 49965, "loss": 1.5962, "grad_norm": "4.319e-01", "learning_rate": "1.000e-04", "dlm_loss": "9.594e-01", "anc_loss": "1.103e+00", "dlm_acc": "6.290e-01", "anc_acc": "5.886e-01", "epoch": 0.09993} {"step": 49970, "loss": 1.1684, "grad_norm": "4.142e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.060e+00", "anc_loss": "1.194e+00", "dlm_acc": "6.167e-01", "anc_acc": "5.814e-01", "epoch": 0.09994} {"step": 49975, "loss": 1.1318, "grad_norm": "6.102e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.002e+00", "anc_loss": "1.134e+00", "dlm_acc": "6.003e-01", "anc_acc": "5.714e-01", "epoch": 0.09995} {"step": 49980, "loss": 0.8916, "grad_norm": "2.963e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.131e+00", "anc_loss": "1.251e+00", "dlm_acc": "5.704e-01", "anc_acc": "5.401e-01", "epoch": 0.09996} {"step": 49985, "loss": 1.1422, "grad_norm": "4.204e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.614e+00", "anc_loss": "1.773e+00", "dlm_acc": "4.813e-01", "anc_acc": "4.476e-01", "epoch": 0.09997} {"step": 49990, "loss": 1.4202, "grad_norm": "4.452e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.374e+00", "anc_loss": "1.501e+00", "dlm_acc": "5.577e-01", "anc_acc": "5.271e-01", "epoch": 0.09998} {"step": 49995, "loss": 1.1059, "grad_norm": "2.886e-01", "learning_rate": "1.000e-04", "dlm_loss": "7.211e-01", "anc_loss": "9.164e-01", "dlm_acc": "6.865e-01", "anc_acc": "6.213e-01", "epoch": 0.09999} {"step": 50000, "loss": 1.0114, "grad_norm": "2.247e-01", "learning_rate": "1.000e-04", "dlm_loss": "1.044e+00", "anc_loss": "1.205e+00", "dlm_acc": "5.680e-01", "anc_acc": "5.277e-01", "epoch": 0.1}