{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "eval_steps": 500, "global_step": 239, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0, "step": 0, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.05908203125 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3245849609375 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.07611083984375 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.86309814453125 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.24755859375 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8839111328125 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.0859375 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1669921875 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.007568359375 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.21875 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1884765625 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -1.165313720703125 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.10546875 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.76806640625 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.6173095703125 }, { "epoch": 0, "step": 0, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.754638671875 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.00726318359375 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.80224609375 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2449951171875 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.69384765625 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.32781982421875 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.48638916015625 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.029296875 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.3768157958984375 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6876220703125 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.37744140625 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.58349609375 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.22119140625 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.03934478759765625 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.760986328125 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.32470703125 }, { "epoch": 0.004197271773347324, "step": 1, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.247314453125 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.4515380859375 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.837158203125 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.197021484375 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.962890625 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.187255859375 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.0146484375 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.82177734375 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2718505859375 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.25567626953125 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.41534423828125 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.52783203125 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.7525634765625 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.34375 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.18310546875 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.4468994140625 }, { "epoch": 0.008394543546694649, "step": 2, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.120361328125 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.16357421875 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.329010009765625 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8553619384765625 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1259765625 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.15679931640625 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.3687744140625 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.66064453125 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.27899169921875 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.30523681640625 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.07925796508789062 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.39813232421875 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.11376953125 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.193115234375 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.4398193359375 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.265625 }, { "epoch": 0.012591815320041973, "step": 3, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.07781982421875 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.276611328125 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.7357177734375 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.10150146484375 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.64990234375 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.350341796875 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.088287353515625 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6162109375 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.330078125 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.630279541015625 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.89593505859375 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.520263671875 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.463623046875 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7823486328125 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.3922119140625 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.39794921875 }, { "epoch": 0.016789087093389297, "step": 4, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.470947265625 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.060302734375 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.69732666015625 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.753021240234375 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.125, "train/overall_margin_mean": -0.90643310546875 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.3133544921875 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.0147552490234375 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2781982421875 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.04174041748046875 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.49462890625 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.125, "train/overall_margin_mean": -0.41949462890625 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.34521484375 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.787078857421875 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.29638671875 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.66595458984375 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.61578369140625 }, { "epoch": 0.02098635886673662, "step": 5, "train/overall_accuracy": 0.125, "train/overall_margin_mean": -0.1878662109375 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.283203125 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.02410888671875 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.384521484375 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.742095947265625 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.184326171875 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.32672119140625 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.01318359375 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.35687255859375 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.0543212890625 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.497314453125 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3243408203125 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.205047607421875 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.886474609375 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.773193359375 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.693359375 }, { "epoch": 0.025183630640083946, "step": 6, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.470458984375 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.361572265625 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.2242431640625 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3304443359375 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.2408447265625 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.094635009765625 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.2103271484375 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.100341796875 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.61334228515625 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.1064453125 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.681396484375 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.2890625 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.1162109375 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.65606689453125 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9879150390625 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1734619140625 }, { "epoch": 0.02938090241343127, "step": 7, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.07033538818359375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.350311279296875 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.40130615234375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.189208984375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6374053955078125 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.2406005859375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.982391357421875 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0396728515625 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.097686767578125 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 0.60504150390625 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.39455413818359375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6917724609375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.063812255859375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.073974609375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.02490234375 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.07293701171875 }, { "epoch": 0.033578174186778595, "step": 8, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5244140625 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.0228271484375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2564697265625 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.632171630859375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.0224456787109375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.0, "train/overall_margin_mean": -1.0205078125 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.488525390625 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.458740234375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.41888427734375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.5462646484375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.125, "train/overall_margin_mean": -0.77679443359375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.29052734375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.061767578125 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.76654052734375 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.511962890625 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.3533935546875 }, { "epoch": 0.03777544596012592, "step": 9, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.3543701171875 }, { "epoch": 0.04197271773347324, "grad_norm": 21.625, "learning_rate": 1.8750000000000003e-06, "loss": 0.8354, "step": 10 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.0373687744140625 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3033905029296875 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0599212646484375 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.5986328125 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.03961181640625 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.38623046875 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.08251953125 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.1644287109375 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.165771484375 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.251708984375 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.41552734375 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.6373502016067505 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.33441162109375 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8915863037109375 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.213623046875 }, { "epoch": 0.04197271773347324, "step": 10, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.050048828125 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.2034912109375 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.121826171875 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.359130859375 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.009613037109375 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.19189453125 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.43408203125 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1329345703125 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.440673828125 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.41729736328125 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2056884765625 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.153076171875 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.406829833984375 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8515625 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5223617553710938 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.148193359375 }, { "epoch": 0.046169989506820566, "step": 11, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.302734375 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.3896484375 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.794921875 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.5789794921875 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.5811767578125 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0865478515625 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4654541015625 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0966796875 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.416259765625 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.1604461669921875 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4462890625 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.31884765625 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4297294616699219 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.654541015625 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.392578125 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.49078369140625 }, { "epoch": 0.05036726128016789, "step": 12, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.1919403076171875 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.151397705078125 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5863037109375 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3720970153808594 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1326904296875 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.310546875 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4886474609375 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.440185546875 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.63140869140625 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.61669921875 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.908935546875 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.541015625 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.04705810546875 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.419281005859375 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.41015625 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.294921875 }, { "epoch": 0.05456453305351522, "step": 13, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.572998046875 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.83447265625 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.1024169921875 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.64990234375 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.2482757568359375 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.27178955078125 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.206298828125 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.4486846923828125 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.2484130859375 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.24859619140625 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.1513671875 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.671875 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.00463104248046875 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.8055419921875 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.247833251953125 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.067626953125 }, { "epoch": 0.05876180482686254, "step": 14, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.41552734375 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6295166015625 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.14794921875 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.29901123046875 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.49853515625 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.08251953125 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.00414276123046875 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.799072265625 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.2392578125 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3655853271484375 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9129638671875 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.66748046875 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.659088134765625 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.506591796875 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.300048828125 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.0798187255859375 }, { "epoch": 0.06295907660020986, "step": 15, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.83258056640625 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.039642333984375 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6697998046875 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.12689208984375 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.6396484375 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.0, "train/overall_margin_mean": -1.1910362243652344 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.312255859375 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.6864013671875 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9127197265625 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.75, "train/overall_margin_mean": -0.0843505859375 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.25830078125 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.80615234375 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.5194091796875 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.26123046875 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.0, "train/overall_margin_mean": -0.8853759765625 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4079742431640625 }, { "epoch": 0.06715634837355719, "step": 16, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.40087890625 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.302734375 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.9114990234375 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4853515625 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.25, "train/overall_margin_mean": 0.1363525390625 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5009765625 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.72723388671875 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.08660888671875 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.24267578125 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.968994140625 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.32745361328125 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6825447082519531 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.3964996337890625 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.87939453125 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5500335693359375 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.68255615234375 }, { "epoch": 0.07135362014690451, "step": 17, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.071044921875 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.426513671875 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2291717529296875 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.3134765625 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2247314453125 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 0.620361328125 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8087158203125 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4302978515625 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.825927734375 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.666259765625 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4207763671875 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.318359375 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6558837890625 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.78271484375 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.92767333984375 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.747314453125 }, { "epoch": 0.07555089192025184, "step": 18, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1851806640625 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.369140625 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4431533813476562 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.28662109375 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.236968994140625 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8619384765625 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.323486328125 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0345382690429688 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.1416015625 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.1162109375 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.180267333984375 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.1392822265625 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.45941162109375 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.02922821044921875 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.12823486328125 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.25, "train/overall_margin_mean": 0.044921875 }, { "epoch": 0.07974816369359916, "step": 19, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.52178955078125 }, { "epoch": 0.08394543546694648, "grad_norm": 20.75, "learning_rate": 3.958333333333333e-06, "loss": 0.7707, "step": 20 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.0491943359375 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0882110595703125 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5673828125 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.475341796875 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0166015625 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1544189453125 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.453857421875 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.63214111328125 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.453125 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.3701171875 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.520660400390625 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.015380859375 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.7664794921875 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.553466796875 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2373046875 }, { "epoch": 0.08394543546694648, "step": 20, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.439697265625 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.31024932861328125 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.25055694580078125 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5157470703125 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7784423828125 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1937255859375 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.618896484375 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.195556640625 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4638671875 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.99041748046875 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.009033203125 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.300537109375 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6851806640625 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.7965545654296875 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8352718353271484 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.560546875 }, { "epoch": 0.08814270724029381, "step": 21, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.453857421875 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.952392578125 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.39349365234375 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.086181640625 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4462890625 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.57177734375 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.41015625 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2347412109375 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.202392578125 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.186279296875 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.4376220703125 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.71240234375 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5394287109375 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.21942138671875 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.32177734375 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.13454437255859375 }, { "epoch": 0.09233997901364113, "step": 22, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.048370361328125 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.548095703125 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.80938720703125 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5325927734375 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.614990234375 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.53118896484375 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.96044921875 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.27880859375 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.168701171875 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.093841552734375 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3590965270996094 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.67791748046875 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.3868408203125 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8203125 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.3924560546875 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4923095703125 }, { "epoch": 0.09653725078698845, "step": 23, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.006103515625 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.31744384765625 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.78143310546875 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3754997253417969 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8595428466796875 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.739990234375 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5823974609375 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.0847320556640625 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.50048828125 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2469482421875 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.88134765625 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.263427734375 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.146240234375 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.83892822265625 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.7548828125 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.167144775390625 }, { "epoch": 0.10073452256033578, "step": 24, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.59423828125 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2037353515625 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.08935546875 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0894927978515625 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3385009765625 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.68603515625 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.67919921875 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.4333152770996094 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.1797027587890625 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.74072265625 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4715576171875 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.01434326171875 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.97802734375 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.49658203125 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.34375 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.19078826904296875 }, { "epoch": 0.1049317943336831, "step": 25, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.869140625 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4609375 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7637939453125 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9422607421875 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.26123046875 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.67657470703125 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4173583984375 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3466796875 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4352923631668091 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.75, "train/overall_margin_mean": -0.3177490234375 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5205078125 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.223388671875 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.760498046875 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3411865234375 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.339996337890625 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.90594482421875 }, { "epoch": 0.10912906610703044, "step": 26, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.575592041015625 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1640625 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.1998291015625 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.00390625 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.76763916015625 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.852752685546875 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.451171875 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.13671875 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.040283203125 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.444091796875 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0238037109375 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.716217041015625 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.06427001953125 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1942138671875 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.786956787109375 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.26229000091552734 }, { "epoch": 0.11332633788037776, "step": 27, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.087188720703125 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.421875 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.544189453125 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.080078125 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4971923828125 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.243408203125 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3935546875 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.05517578125 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8912353515625 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.95770263671875 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.299560546875 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.340087890625 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.659027099609375 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.01495361328125 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.80963134765625 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.538330078125 }, { "epoch": 0.11752360965372508, "step": 28, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5626220703125 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.224365234375 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.653411865234375 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.44580078125 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.6717529296875 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5623092651367188 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.028522491455078 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.580078125 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.05340576171875 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.1925048828125 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.43377685546875 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4501190185546875 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.27587890625 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.75927734375 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0357666015625 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.017791748046875 }, { "epoch": 0.12172088142707241, "step": 29, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.407470703125 }, { "epoch": 0.1259181532004197, "grad_norm": 16.375, "learning_rate": 4.993330709158879e-06, "loss": 0.6719, "step": 30 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.69482421875 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2965087890625 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.10888671875 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0361328125 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.938720703125 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.969970703125 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.152099609375 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.02031707763671875 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.369140625 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.171630859375 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0059814453125 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.384521484375 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.328582763671875 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.68243408203125 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.78082275390625 }, { "epoch": 0.1259181532004197, "step": 30, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5095367431640625 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.02093505859375 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.001953125 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1318359375 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.031982421875 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.5445556640625 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6473388671875 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.966552734375 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.592529296875 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2626953125 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.990997314453125 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.094696044921875 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.218292236328125 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0263671875 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.424072265625 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.0595550537109375 }, { "epoch": 0.13011542497376705, "step": 31, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.726165771484375 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1358642578125 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0589599609375 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3511962890625 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.3779296875 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8310546875 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0238037109375 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8408203125 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.5230712890625 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.1444091796875 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.13189697265625 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1766357421875 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7088623046875 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3110923767089844 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5828857421875 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.048828125 }, { "epoch": 0.13431269674711438, "step": 32, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.138916015625 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0889892578125 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.0399169921875 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8121337890625 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.66265869140625 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.22998046875 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3125 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.72589111328125 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1651020050048828 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.09429931640625 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.327880859375 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.265869140625 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.82275390625 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.3026123046875 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.361328125 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.104461669921875 }, { "epoch": 0.1385099685204617, "step": 33, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8914794921875 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4417724609375 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.68731689453125 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.836669921875 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.146209716796875 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.0284423828125 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.47894287109375 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.544342041015625 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8504638671875 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.250152587890625 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.587890625 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.902587890625 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.76348876953125 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1728515625 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.159698486328125 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.51690673828125 }, { "epoch": 0.14270724029380902, "step": 34, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.45862579345703125 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9873046875 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.171295166015625 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5284423828125 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.318359375 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.781982421875 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0235595703125 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.6572265625 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8153076171875 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.9896240234375 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.027587890625 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.75518798828125 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.1845703125 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.22406005859375 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.85052490234375 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.84326171875 }, { "epoch": 0.14690451206715635, "step": 35, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3031005859375 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0772247314453125 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.18766021728515625 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.456298828125 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.69818115234375 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7670822143554688 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3161239624023438 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8016357421875 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.487274169921875 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.125, "train/overall_margin_mean": -0.5973405838012695 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1962890625 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2398223876953125 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8447265625 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.360107421875 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.3935546875 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.592529296875 }, { "epoch": 0.15110178384050368, "step": 36, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.22103118896484375 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.82470703125 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.77392578125 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.738037109375 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.74932861328125 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.488250732421875 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2769775390625 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.50140380859375 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2315101623535156 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5731201171875 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.12811279296875 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.63720703125 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.980712890625 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1796875 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4249267578125 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8603515625 }, { "epoch": 0.155299055613851, "step": 37, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.39544677734375 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.287841796875 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.52099609375 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.547119140625 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.62274169921875 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.669189453125 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.72845458984375 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9869384765625 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.11297607421875 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.2099609375 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6542205810546875 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8199462890625 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.419921875 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.677490234375 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.689208984375 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8173828125 }, { "epoch": 0.15949632738719832, "step": 38, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.17626953125 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.265380859375 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.4574127197265625 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.04083251953125 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.416473388671875 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.716064453125 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2066650390625 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.06787109375 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.838958740234375 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.222900390625 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.750732421875 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.34808349609375 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7176513671875 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.107208251953125 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.678466796875 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2259521484375 }, { "epoch": 0.16369359916054566, "step": 39, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.81072998046875 }, { "epoch": 0.16789087093389296, "grad_norm": 15.6875, "learning_rate": 4.940189693889819e-06, "loss": 0.5785, "step": 40 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3798828125 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1226806640625 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.57958984375 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.5312042236328125 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8193359375 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.115234375 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.17376708984375 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7486572265625 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.92138671875 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.6864013671875 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.79022216796875 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.334381103515625 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.653076171875 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.46484375 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2420654296875 }, { "epoch": 0.16789087093389296, "step": 40, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.572265625 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.04827880859375 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.56402587890625 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.46142578125 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.266357421875 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.58349609375 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.20648193359375 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.0625 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.5234832763671875 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4815216064453125 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.3245849609375 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.80419921875 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.578033447265625 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.826934814453125 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.747802734375 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.949951171875 }, { "epoch": 0.1720881427072403, "step": 41, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.3353271484375 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.934539794921875 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.2476806640625 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5494384765625 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.969970703125 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.2520751953125 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.79400634765625 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.901611328125 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.408599853515625 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7470703125 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.4466552734375 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.18487548828125 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8489913940429688 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.391233444213867 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.3240966796875 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0916213989257812 }, { "epoch": 0.17628541448058763, "step": 42, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8121337890625 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9408378601074219 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4529876708984375 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.16259765625 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1953125 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4781494140625 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7315673828125 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.832763671875 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.96875 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7396240234375 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.104736328125 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.120269775390625 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2603759765625 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.062177181243896484 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.26904296875 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3369140625 }, { "epoch": 0.18048268625393493, "step": 43, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.807861328125 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.92584228515625 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.233154296875 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.07391357421875 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5953369140625 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.84417724609375 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.539306640625 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.016845703125 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.91259765625 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.06536865234375 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.05560302734375 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.434814453125 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.046661376953125 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.0443115234375 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.2806396484375 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.614990234375 }, { "epoch": 0.18467995802728226, "step": 44, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.388427734375 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6402587890625 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.37359619140625 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.677490234375 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.728515625 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.948974609375 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.30224609375 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.11712646484375 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.94317626953125 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.60186767578125 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.43121337890625 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.762939453125 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.15985107421875 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4374752044677734 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6941680908203125 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4549560546875 }, { "epoch": 0.1888772298006296, "step": 45, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.51263427734375 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.298828125 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4282989501953125 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.89825439453125 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.59814453125 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.95733642578125 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7056884765625 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5234375 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.999267578125 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3165283203125 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.68841552734375 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7854194641113281 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.2264404296875 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6209716796875 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5081472396850586 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.384521484375 }, { "epoch": 0.1930745015739769, "step": 46, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.959716796875 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.09521484375 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.30755615234375 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9220657348632812 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.172515869140625 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9248123168945312 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.929443359375 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.0057373046875 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.64404296875 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.77325439453125 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.812744140625 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.90625 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.20159912109375 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.2327880859375 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0797271728515625 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.137451171875 }, { "epoch": 0.19727177334732424, "step": 47, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.77880859375 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.154052734375 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.4508438110351562 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3526611328125 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.66748046875 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.08807373046875 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.66162109375 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.80780029296875 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.471649169921875 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0272216796875 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.031005859375 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.92938232421875 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4091796875 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.100341796875 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4674072265625 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.51348876953125 }, { "epoch": 0.20146904512067157, "step": 48, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4952392578125 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.5064697265625 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.863525390625 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9024658203125 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.01318359375 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.841796875 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.28271484375 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.377147674560547 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.340972900390625 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3576679229736328 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.88134765625 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.18011474609375 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.96942138671875 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6397705078125 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.806640625 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.26434326171875 }, { "epoch": 0.20566631689401887, "step": 49, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.389404296875 }, { "epoch": 0.2098635886673662, "grad_norm": 15.9375, "learning_rate": 4.835040271831371e-06, "loss": 0.5588, "step": 50 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.60546875 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.958251953125 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.066650390625 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.2200927734375 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.70654296875 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.75701904296875 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.93798828125 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.39544677734375 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.914642333984375 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8143310546875 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.445556640625 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.65185546875 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.3013916015625 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.07421875 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.92578125 }, { "epoch": 0.2098635886673662, "step": 50, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.27490234375 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.678863525390625 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9149169921875 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.890380859375 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.184326171875 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3134765625 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8076171875 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5712890625 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4693059921264648 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.94085693359375 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.51025390625 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.860687255859375 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.645263671875 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1318359375 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5340576171875 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8046875 }, { "epoch": 0.21406086044071354, "step": 51, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0093994140625 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.75103759765625 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5591354370117188 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4150390625 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1881103515625 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.5634765625 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.594757080078125 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2733154296875 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8896484375 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.60089111328125 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.04541015625 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.2542724609375 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.97802734375 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.27081298828125 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.27679443359375 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2418212890625 }, { "epoch": 0.21825813221406087, "step": 52, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.128021240234375 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6759681701660156 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9512939453125 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9941635131835938 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.8994140625 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.062255859375 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.52685546875 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5743408203125 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6678466796875 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.67230224609375 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.545928955078125 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.63232421875 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8277587890625 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9842910766601562 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0042343139648438 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.630859375 }, { "epoch": 0.22245540398740818, "step": 53, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7940673828125 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.525390625 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.281005859375 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5235748291015625 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.00927734375 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4500732421875 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.498046875 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.38714599609375 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.8662109375 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0660858154296875 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.548828125 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.271728515625 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.964111328125 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.48291015625 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.73101806640625 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6363525390625 }, { "epoch": 0.2266526757607555, "step": 54, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4644775390625 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.501251220703125 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5723876953125 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.334228515625 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.142822265625 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.03571319580078125 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.75439453125 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.98687744140625 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.707763671875 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.991943359375 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.55078125 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.068603515625 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.961669921875 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.84454345703125 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.149658203125 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8663330078125 }, { "epoch": 0.23084994753410285, "step": 55, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6728515625 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.82659912109375 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.793701171875 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.603424072265625 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3275146484375 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.93402099609375 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.37994384765625 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8577880859375 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.91998291015625 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.81201171875 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.12158203125 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3427963256835938 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.50531005859375 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.90301513671875 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.07080078125 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.644775390625 }, { "epoch": 0.23504721930745015, "step": 56, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.457427978515625 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.33203125 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.507080078125 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7454833984375 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.097076416015625 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9342117309570312 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.51898193359375 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.215576171875 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.1436920166015625 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6201171875 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1236572265625 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.3123779296875 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.18548583984375 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.32867431640625 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.837158203125 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2528076171875 }, { "epoch": 0.23924449108079748, "step": 57, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.135986328125 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0900154113769531 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2591552734375 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.38232421875 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0234375 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0147705078125 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0787353515625 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.54736328125 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.150146484375 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.41552734375 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5267333984375 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 3.13507080078125 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.547607421875 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.267333984375 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.87628173828125 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.803466796875 }, { "epoch": 0.24344176285414482, "step": 58, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.302001953125 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.18505859375 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.916259765625 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7230224609375 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.4885406494140625 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.65887451171875 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.11865234375 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1534423828125 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.047821044921875 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.25732421875 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.50897216796875 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2738037109375 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.462646484375 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.60614013671875 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.58966064453125 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9674072265625 }, { "epoch": 0.24763903462749212, "step": 59, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -1.03680419921875 }, { "epoch": 0.2518363064008394, "grad_norm": 14.25, "learning_rate": 4.68012352035952e-06, "loss": 0.5174, "step": 60 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4566650390625 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.012176513671875 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.79345703125 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.1885986328125 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.65716552734375 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9442138671875 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.669189453125 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.18511962890625 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.903076171875 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.095703125 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.056671142578125 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.58880615234375 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.28167724609375 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.698974609375 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.06982421875 }, { "epoch": 0.2518363064008394, "step": 60, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.783935546875 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.52978515625 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.494598388671875 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8519287109375 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.962158203125 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8433837890625 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.46954345703125 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.01556396484375 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.61083984375 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.49755859375 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.850830078125 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7579345703125 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.292724609375 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.650146484375 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2579345703125 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6906890869140625 }, { "epoch": 0.25603357817418676, "step": 61, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7020263671875 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7503662109375 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.5491943359375 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6490478515625 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.75726318359375 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7369384765625 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 2.03564453125 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8973541259765625 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.46533203125 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8770751953125 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.341552734375 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4547195434570312 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.427734375 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.3944091796875 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.95068359375 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4384765625 }, { "epoch": 0.2602308499475341, "step": 62, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.23956298828125 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.799560546875 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.436431884765625 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.20556640625 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.94873046875 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.8221435546875 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.97235107421875 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0749473571777344 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.663330078125 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 2.1025390625 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1678466796875 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.64532470703125 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.554443359375 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.203125 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.81298828125 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.708251953125 }, { "epoch": 0.2644281217208814, "step": 63, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.56439208984375 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.50323486328125 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0576629638671875 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.210205078125 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.50067138671875 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.208984375 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.720458984375 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.84222412109375 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.213714599609375 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.568084716796875 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3011627197265625 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.378021240234375 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.302490234375 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.08544921875 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.78143310546875 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8175048828125 }, { "epoch": 0.26862539349422876, "step": 64, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.390625 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.80419921875 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.6397705078125 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.60107421875 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1185302734375 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.404052734375 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8795166015625 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.915283203125 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1187553405761719 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8059577941894531 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.841796875 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.82281494140625 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.6689453125 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.853271484375 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.241455078125 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2664642333984375 }, { "epoch": 0.2728226652675761, "step": 65, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.785888671875 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.40576171875 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8544921875 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5449981689453125 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.6689605712890625 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.3070068359375 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.015380859375 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.400390625 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.3677978515625 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8923234939575195 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.740478515625 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.162811279296875 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6998291015625 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8326416015625 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.84716796875 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.40380859375 }, { "epoch": 0.2770199370409234, "step": 66, "train/overall_accuracy": 0.25, "train/overall_margin_mean": 0.01318359375 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3043212890625 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.46630859375 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.407470703125 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8974609375 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8546142578125 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9010009765625 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6213150024414062 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.283203125 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.515869140625 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.076171875 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.6044921875 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.47314453125 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6002197265625 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.209197998046875 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.10064697265625 }, { "epoch": 0.2812172088142707, "step": 67, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.98406982421875 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.821044921875 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.62744140625 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4122314453125 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2509765625 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.4110107421875 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.2209930419921875 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.6776123046875 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.3563232421875 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.78759765625 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.567474365234375 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.519287109375 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7568359375 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4658203125 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1561279296875 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5966796875 }, { "epoch": 0.28541448058761804, "step": 68, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0887451171875 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4033203125 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.21697998046875 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3507080078125 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.30450439453125 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.918853759765625 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.8778076171875 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6026611328125 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4996337890625 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.28125 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.108856201171875 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.60577392578125 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.45489501953125 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5494384765625 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.752197265625 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.316650390625 }, { "epoch": 0.28961175236096537, "step": 69, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.68353271484375 }, { "epoch": 0.2938090241343127, "grad_norm": 10.875, "learning_rate": 4.478741221073136e-06, "loss": 0.5292, "step": 70 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.60565185546875 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.29498291015625 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8232421875 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.35382080078125 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.86785888671875 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.49072265625 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.154541015625 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.9732666015625 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8302001953125 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7840576171875 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7086334228515625 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.079833984375 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.30389404296875 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.506103515625 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3649368286132812 }, { "epoch": 0.2938090241343127, "step": 70, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.24365234375 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.84521484375 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.487640380859375 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3341217041015625 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.233642578125 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6177597045898438 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5704345703125 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3846435546875 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.19439697265625 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.40875244140625 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.086181640625 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.003662109375 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.493408203125 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.210693359375 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.198486328125 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3125 }, { "epoch": 0.29800629590766003, "step": 71, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.895263671875 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.845947265625 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.791259765625 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.2919921875 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.03173828125 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.479736328125 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2752685546875 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8956298828125 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.2459869384765625 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1259117126464844 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.93505859375 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8021240234375 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.38360595703125 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.05078125 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.917694091796875 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.272216796875 }, { "epoch": 0.30220356768100737, "step": 72, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.047119140625 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.16217041015625 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.071136474609375 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.044677734375 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.90087890625 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9490318298339844 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.036376953125 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3830642700195312 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.17236328125 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2349853515625 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.420166015625 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.52032470703125 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.228759765625 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6270751953125 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.07098388671875 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.38623046875 }, { "epoch": 0.30640083945435465, "step": 73, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5791015625 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9764404296875 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.149444580078125 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1790771484375 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5512590408325195 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.45703125 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.180267333984375 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.259674072265625 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.54229736328125 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.567138671875 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.80615234375 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.6756591796875 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.783660888671875 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.530219078063965 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.943359375 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.50262451171875 }, { "epoch": 0.310598111227702, "step": 74, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.55169677734375 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.623046875 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.366943359375 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.84527587890625 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.92431640625 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.781982421875 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.67724609375 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.0915374755859375 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8297119140625 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2999267578125 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.6429443359375 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.692626953125 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1732940673828125 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.942626953125 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.13897705078125 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9102935791015625 }, { "epoch": 0.3147953830010493, "step": 75, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.43051910400390625 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.774078369140625 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.71051025390625 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0325927734375 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.53192138671875 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.748626708984375 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.7273712158203125 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.82763671875 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2332763671875 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.269927978515625 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.571044921875 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.95367431640625 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9232177734375 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9202880859375 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.297607421875 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0894775390625 }, { "epoch": 0.31899265477439664, "step": 76, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.058349609375 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1951904296875 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.010986328125 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.142578125 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.02642822265625 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0196609497070312 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.61822509765625 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.07415771484375 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.70458984375 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8724212646484375 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0791015625 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.225372314453125 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.641704559326172 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.835113525390625 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.722412109375 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9454345703125 }, { "epoch": 0.323189926547744, "step": 77, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.414764404296875 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1142578125 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.91680908203125 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0490493774414062 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.321533203125 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.11651611328125 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6959915161132812 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.68670654296875 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5223388671875 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.60272216796875 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.05401611328125 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.70721435546875 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9356689453125 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.990234375 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2862548828125 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.78973388671875 }, { "epoch": 0.3273871983210913, "step": 78, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.81298828125 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.9130859375 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.77294921875 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.878662109375 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.6719970703125 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.46795654296875 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4326171875 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1658935546875 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.061767578125 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7734375 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.973724365234375 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.84429931640625 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2707595825195312 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.520843505859375 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.3201904296875 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.6083984375 }, { "epoch": 0.3315844700944386, "step": 79, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.779693603515625 }, { "epoch": 0.3357817418677859, "grad_norm": 13.0, "learning_rate": 4.2351854880515856e-06, "loss": 0.5227, "step": 80 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.294189453125 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.47564697265625 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.40019989013671875 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7183837890625 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.25, "train/overall_margin_mean": 0.04833984375 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6217041015625 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5140380859375 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7188720703125 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.552825927734375 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7008056640625 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.80419921875 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.013153076171875 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.494110107421875 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5467529296875 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.07720947265625 }, { "epoch": 0.3357817418677859, "step": 80, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.44403076171875 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.376708984375 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.67706298828125 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.269805908203125 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.34783935546875 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.523681640625 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.39272308349609375 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.92724609375 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1494140625 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.0687255859375 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.91943359375 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.0575332641601562 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.27685546875 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.470001220703125 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.8313980102539062 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.87518310546875 }, { "epoch": 0.33997901364113325, "step": 81, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.43438720703125 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.947998046875 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.02130126953125 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6689453125 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.12274169921875 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.402099609375 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.449737548828125 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.34033203125 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.303558349609375 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.320343017578125 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7032470703125 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.141357421875 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.61212158203125 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0006103515625 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7822723388671875 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.60791015625 }, { "epoch": 0.3441762854144806, "step": 82, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.600128173828125 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.5142822265625 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4527587890625 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.019287109375 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.891326904296875 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5970458984375 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.83544921875 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5137367248535156 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.475860595703125 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1517333984375 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.75390625 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.30059814453125 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.99609375 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8746590614318848 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4576416015625 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.015380859375 }, { "epoch": 0.3483735571878279, "step": 83, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.532958984375 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5184326171875 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.616668701171875 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.2613525390625 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.96630859375 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5302658081054688 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.19140625 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.1580810546875 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.78021240234375 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.423828125 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.118133544921875 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.915771484375 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.167037010192871 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4716796875 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6976318359375 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.82611083984375 }, { "epoch": 0.35257082896117525, "step": 84, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.36181640625 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.92120361328125 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.5792236328125 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.237060546875 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.881591796875 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.466796875 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.915771484375 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.637115478515625 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.106231689453125 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2398834228515625 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.449371337890625 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.86669921875 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.018007278442383 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1375904083251953 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.253448486328125 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.52978515625 }, { "epoch": 0.3567681007345226, "step": 85, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.21142578125 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.1004638671875 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4139404296875 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5744667053222656 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.2496337890625 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.549346923828125 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.96844482421875 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5262336730957031 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8505859375 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.352783203125 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5189895629882812 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.79638671875 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.600341796875 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.50421142578125 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.34259033203125 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.5701255798339844 }, { "epoch": 0.36096537250786986, "step": 86, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.47509765625 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.63177490234375 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.924560546875 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0794677734375 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.62786865234375 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.189697265625 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8314208984375 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.19915771484375 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.896209716796875 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9743499755859375 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5115966796875 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1526107788085938 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9055633544921875 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.06201171875 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.20947265625 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.811279296875 }, { "epoch": 0.3651626442812172, "step": 87, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0139613151550293 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.1123046875 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.92486572265625 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.86151123046875 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.36810302734375 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0848388671875 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6920166015625 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.062255859375 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.48663330078125 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.113525390625 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.421539306640625 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5704345703125 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5472186803817749 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7122802734375 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.193115234375 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.17431640625 }, { "epoch": 0.36935991605456453, "step": 88, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.579345703125 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7431640625 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4736328125 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8350830078125 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8316078186035156 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.700439453125 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.284912109375 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4202880859375 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7054443359375 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3462371826171875 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.3824462890625 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.34912109375 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.506178855895996 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.76806640625 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.1298828125 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.214111328125 }, { "epoch": 0.37355718782791186, "step": 89, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9451904296875 }, { "epoch": 0.3777544596012592, "grad_norm": 12.5625, "learning_rate": 3.9546472888948825e-06, "loss": 0.4972, "step": 90 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2385711669921875 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2294921875 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3151283264160156 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.63134765625 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.70361328125 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.24072265625 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.333984375 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7259063720703125 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.12353515625 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4836349487304688 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9197998046875 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9520263671875 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2645111083984375 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.05029296875 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.06689453125 }, { "epoch": 0.3777544596012592, "step": 90, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.9617919921875 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.56396484375 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2491455078125 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.383544921875 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.796630859375 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.853271484375 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8153076171875 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6904296875 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3257408142089844 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.116455078125 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2388763427734375 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.078857421875 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.3284912109375 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.291748046875 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8603515625 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.200927734375 }, { "epoch": 0.38195173137460653, "step": 91, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6109619140625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.74462890625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0523681640625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.3916015625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.94012451171875 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.50677490234375 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0604248046875 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5164794921875 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.7183837890625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.030853271484375 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0694580078125 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4088134765625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.445556640625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.939208984375 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.04541015625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1197509765625 }, { "epoch": 0.3861490031479538, "step": 92, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2303466796875 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.655029296875 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.22674560546875 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5963134765625 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.067352294921875 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.827392578125 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.35015869140625 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.54736328125 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0831298828125 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.59259033203125 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.47998046875 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8248138427734375 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0488853454589844 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.961181640625 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.109619140625 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9000244140625 }, { "epoch": 0.39034627492130114, "step": 93, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.93951416015625 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.238311767578125 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.62200927734375 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4921875 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.060546875 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.450439453125 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4839706420898438 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.470733642578125 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.59326171875 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4227294921875 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.593292236328125 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.608917236328125 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.09185791015625 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.531982421875 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.08123779296875 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0904541015625 }, { "epoch": 0.3945435466946485, "step": 94, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5281143188476562 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.830322265625 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.16357421875 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6029052734375 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.3887481689453125 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.062652587890625 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.528564453125 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.359375 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.00732421875 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.43408203125 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.535675048828125 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.146240234375 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3609619140625 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.546142578125 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.39453125 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1179351806640625 }, { "epoch": 0.3987408184679958, "step": 95, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.0550537109375 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5152587890625 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.85546875 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3501968383789062 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.9886202812194824 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.17626953125 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.10235595703125 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.51220703125 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.432464599609375 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7584228515625 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.357177734375 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.882965087890625 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.33548736572265625 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.68994140625 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.418212890625 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.43841552734375 }, { "epoch": 0.40293809024134314, "step": 96, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3092041015625 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.722900390625 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.23309326171875 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.962310791015625 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6137313842773438 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9114990234375 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.642333984375 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.0074462890625 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.732666015625 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.860107421875 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9495849609375 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.1279296875 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.608642578125 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.168701171875 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.81512451171875 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0396728515625 }, { "epoch": 0.40713536201469047, "step": 97, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.02392578125 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7840576171875 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.4305419921875 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.975372314453125 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.922607421875 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8596038818359375 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3885650634765625 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.346435546875 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.245849609375 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.13702392578125 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.7635498046875 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1124267578125 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.91943359375 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.151611328125 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.441162109375 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0054931640625 }, { "epoch": 0.41133263378803775, "step": 98, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.82763671875 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3568458557128906 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6971435546875 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.404876708984375 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.343017578125 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.08120346069335938 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.482914924621582 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.357177734375 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.057861328125 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.2587890625 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.260223388671875 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3492431640625 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.113525390625 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.721923828125 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.33551025390625 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.43701171875 }, { "epoch": 0.4155299055613851, "step": 99, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.47467041015625 }, { "epoch": 0.4197271773347324, "grad_norm": 12.3125, "learning_rate": 3.6431058082615966e-06, "loss": 0.518, "step": 100 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.41943359375 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.39154052734375 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.0277099609375 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7698898315429688 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.77703857421875 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.49951171875 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8087158203125 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.32958984375 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.61407470703125 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.206146240234375 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.238525390625 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.944580078125 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9219970703125 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.31915283203125 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.7134857177734375 }, { "epoch": 0.4197271773347324, "step": 100, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.672698974609375 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3004150390625 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2159423828125 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.81390380859375 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.0033416748046875 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.184661865234375 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.3714599609375 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6746826171875 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.65673828125 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.82794189453125 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.68701171875 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3633270263671875 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.85211181640625 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.456939697265625 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.227264404296875 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.322998046875 }, { "epoch": 0.42392444910807975, "step": 101, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.2512359619140625 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.619384765625 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.877197265625 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.630615234375 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.67388916015625 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.853515625 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.655029296875 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.539794921875 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5406494140625 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.63623046875 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.25244140625 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.491455078125 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.686767578125 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1861572265625 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.24591064453125 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.451171875 }, { "epoch": 0.4281217208814271, "step": 102, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.17340087890625 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.50634765625 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.1634521484375 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1507568359375 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.095458984375 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.085052490234375 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.083038330078125 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4647216796875 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.6165771484375 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.098388671875 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.7755126953125 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.800689697265625 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.70166015625 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.244384765625 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.912322998046875 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.947265625 }, { "epoch": 0.4323189926547744, "step": 103, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7967529296875 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.119842529296875 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9436492919921875 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.54937744140625 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.786834716796875 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.489654541015625 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5001220703125 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.580230712890625 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.459320068359375 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1298828125 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.031494140625 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.09765625 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.34576416015625 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9126434326171875 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.559783935546875 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.260009765625 }, { "epoch": 0.43651626442812175, "step": 104, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.8192138671875 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0719757080078125 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.544189453125 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3934326171875 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.6293988227844238 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1356201171875 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.326416015625 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9951171875 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3834228515625 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.45263671875 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.41175079345703125 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8712158203125 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.32989501953125 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.424072265625 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.245361328125 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.97564697265625 }, { "epoch": 0.440713536201469, "step": 105, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7989501953125 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.62353515625 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.09112548828125 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.02825927734375 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.845458984375 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.419921875 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.776123046875 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.165283203125 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3533706665039062 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.214141845703125 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0117645263671875 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.13671875 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.541259765625 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4764404296875 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.064117431640625 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.81024169921875 }, { "epoch": 0.44491080797481636, "step": 106, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3470458984375 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.2204437255859375 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.545166015625 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.051849365234375 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.92852783203125 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.898284912109375 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1328125 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.4296875 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2601318359375 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.652587890625 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.692626953125 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9769287109375 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.45623779296875 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.966796875 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.052001953125 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3583984375 }, { "epoch": 0.4491080797481637, "step": 107, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.110626220703125 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.22161865234375 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.823974609375 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.876953125 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2253856658935547 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.6251220703125 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.09521484375 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2679443359375 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.46875 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5433349609375 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.15044403076171875 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5689697265625 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7080078125 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3360595703125 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.255340576171875 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.766845703125 }, { "epoch": 0.453305351521511, "step": 108, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.909423828125 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.57427978515625 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0749053955078125 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.86505126953125 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.885498046875 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.8218994140625 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.385162353515625 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.365478515625 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.65728759765625 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.65386962890625 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.40716552734375 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.208251953125 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.46923828125 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1651611328125 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.21337890625 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5240478515625 }, { "epoch": 0.45750262329485836, "step": 109, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8441009521484375 }, { "epoch": 0.4616998950682057, "grad_norm": 12.5625, "learning_rate": 3.3072010119286156e-06, "loss": 0.5026, "step": 110 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.376739501953125 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9180908203125 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1920166015625 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.572998046875 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.454376220703125 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8505859375 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.21722412109375 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0258865356445312 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1507568359375 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.329833984375 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.233154296875 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.02630615234375 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6021957397460938 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.55517578125 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.125244140625 }, { "epoch": 0.4616998950682057, "step": 110, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.523193359375 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0640869140625 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3997650146484375 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.333770751953125 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.773681640625 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0811767578125 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.63043212890625 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.468597412109375 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4552001953125 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.28759765625 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.76708984375 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.5058670043945312 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.08416748046875 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9104537963867188 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.495147705078125 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3228759765625 }, { "epoch": 0.46589716684155297, "step": 111, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8404922485351562 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.60400390625 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.825927734375 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.189453125 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2186279296875 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5574951171875 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.26611328125 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.833740234375 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.2761459350585938 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.466796875 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.1070404052734375 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.976806640625 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.921417236328125 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.92816162109375 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9669189453125 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.359619140625 }, { "epoch": 0.4700944386149003, "step": 112, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.344146728515625 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.674072265625 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.42626953125 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.974609375 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.87457275390625 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.347900390625 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.345489501953125 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.553466796875 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.41302490234375 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 2.057373046875 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2431640625 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.024566650390625 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.216796875 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8526611328125 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.962890625 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.40753173828125 }, { "epoch": 0.47429171038824763, "step": 113, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.69189453125 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9365234375 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.169921875 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.787109375 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.21728515625 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.23663330078125 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.70843505859375 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.04736328125 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.10467529296875 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.07562255859375 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.32080078125 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.13330078125 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8748779296875 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.003662109375 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.81353759765625 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.46002197265625 }, { "epoch": 0.47848898216159497, "step": 114, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.447021484375 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.81689453125 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9241867065429688 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.2083740234375 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.16400146484375 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.837890625 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.33837890625 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.599029541015625 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.984130859375 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.4293975830078125 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8492431640625 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0665283203125 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.88897705078125 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.53076171875 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.55419921875 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0367431640625 }, { "epoch": 0.4826862539349423, "step": 115, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.490234375 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.35003662109375 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.500244140625 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.075714111328125 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.100830078125 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.55078125 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.73193359375 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.1142578125 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8392333984375 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7496337890625 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.5185546875 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.0325927734375 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6700439453125 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.783447265625 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7158203125 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.725830078125 }, { "epoch": 0.48688352570828963, "step": 116, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8331298828125 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.0958251953125 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.865234375 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7290115356445312 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7642822265625 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3641357421875 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7774658203125 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1046295166015625 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.171356201171875 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.1124267578125 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.6024169921875 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.5274658203125 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.29010009765625 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.235443115234375 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.16415786743164062 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.79681396484375 }, { "epoch": 0.4910807974816369, "step": 117, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.73193359375 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6422119140625 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.53350830078125 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.927734375 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.234832763671875 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6817626953125 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7900390625 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.602294921875 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.983978271484375 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3671875 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.291015625 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.035888671875 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.511260986328125 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9977548122406006 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5294189453125 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5305023193359375 }, { "epoch": 0.49527806925498424, "step": 118, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.235107421875 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.61602783203125 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.391357421875 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.002685546875 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2073822021484375 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.29058837890625 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.68450927734375 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.85546875 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2379150390625 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.26580810546875 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7532958984375 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.16064453125 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.123046875 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4456787109375 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.0625 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1566162109375 }, { "epoch": 0.4994753410283316, "step": 119, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.04254150390625 }, { "epoch": 0.5036726128016789, "grad_norm": 12.375, "learning_rate": 2.9540921274485913e-06, "loss": 0.5023, "step": 120 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.4501419067382812 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.29034423828125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9482421875 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.11767578125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5948486328125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5908203125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1993408203125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.266845703125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.7744140625 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.59423828125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.040283203125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.741668701171875 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9945068359375 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.308837890625 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.01220703125 }, { "epoch": 0.5036726128016789, "step": 120, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.76220703125 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.175048828125 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.60791015625 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.44775390625 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7462158203125 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.88677978515625 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6240234375 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.91204833984375 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.26611328125 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.55718994140625 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.726409912109375 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4093475341796875 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5041656494140625 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.33447265625 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.744659423828125 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.853607177734375 }, { "epoch": 0.5078698845750262, "step": 121, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.107177734375 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.6885986328125 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.033447265625 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3095703125 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.56591796875 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.22869873046875 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.447265625 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.186614990234375 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9246978759765625 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2275390625 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.114501953125 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.81591796875 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2945556640625 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.15869140625 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0205631256103516 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.251708984375 }, { "epoch": 0.5120671563483735, "step": 122, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.414581298828125 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4119873046875 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.166107177734375 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.767333984375 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.11224365234375 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.88818359375 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.452880859375 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.803924560546875 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0968151092529297 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6533203125 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8917770385742188 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.49664306640625 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8754119873046875 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.001953125 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.36602783203125 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.7117919921875 }, { "epoch": 0.5162644281217209, "step": 123, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.014261245727539 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.726318359375 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.5101318359375 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.347900390625 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 0.97265625 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7808837890625 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.24688720703125 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.964935302734375 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2470703125 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.1463623046875 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.8623046875 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8935546875 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6298828125 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.475341796875 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5213623046875 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7275390625 }, { "epoch": 0.5204616998950682, "step": 124, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.050994873046875 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4881591796875 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.07381439208984375 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.72760009765625 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.97412109375 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5859375 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3094940185546875 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.275726318359375 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.070068359375 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.49127197265625 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.16058349609375 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.279003143310547 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.370361328125 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9727783203125 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0830078125 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.169189453125 }, { "epoch": 0.5246589716684156, "step": 125, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.117431640625 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.506317138671875 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.68798828125 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9453125 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.287109375 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.340484619140625 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.114013671875 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7630615234375 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.828125 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.937469482421875 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.20208740234375 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3878173828125 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1014404296875 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.11233139038085938 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4976806640625 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.431640625 }, { "epoch": 0.5288562434417629, "step": 126, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.24462890625 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.75390625 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.62017822265625 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.693359375 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7449951171875 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.337890625 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.336669921875 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.730712890625 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.191741943359375 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.89678955078125 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5909500122070312 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.3583984375 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.383056640625 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2745361328125 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.999267578125 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.2381591796875 }, { "epoch": 0.5330535152151101, "step": 127, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2772216796875 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5087890625 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.322265625 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.50677490234375 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.1763916015625 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5462646484375 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.27294921875 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3004302978515625 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.083740234375 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6512451171875 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.44390869140625 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6890869140625 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.58837890625 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.4959716796875 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.9062538146972656 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.560943603515625 }, { "epoch": 0.5372507869884575, "step": 128, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.4763259887695312 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.137451171875 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.351318359375 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0763092041015625 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.23779296875 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4274444580078125 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.50628662109375 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.658935546875 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.737548828125 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4794921875 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.193359375 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.088623046875 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.764404296875 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2471923828125 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.717529296875 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7889404296875 }, { "epoch": 0.5414480587618048, "step": 129, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.67413330078125 }, { "epoch": 0.5456453305351522, "grad_norm": 13.0, "learning_rate": 2.591305057644148e-06, "loss": 0.4873, "step": 130 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7589111328125 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7041015625 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.751220703125 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.43939208984375 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.72802734375 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.97021484375 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.116363525390625 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.724761962890625 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.40966796875 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.299560546875 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.017578125 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.621337890625 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.142333984375 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.596923828125 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.07275390625 }, { "epoch": 0.5456453305351522, "step": 130, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0612716674804688 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6671142578125 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8782958984375 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.95068359375 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.679931640625 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7601585388183594 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1199951171875 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3232421875 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.790924072265625 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.86126708984375 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3511962890625 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3800048828125 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.55877685546875 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.81646728515625 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5653076171875 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.996826171875 }, { "epoch": 0.5498426023084995, "step": 131, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.023193359375 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3802490234375 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7548828125 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.1900634765625 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.84423828125 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1330642700195312 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.523193359375 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0053653717041015625 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7111740112304688 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.862060546875 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2899169921875 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.74609375 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.411865234375 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.23193359375 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.369873046875 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.14197540283203125 }, { "epoch": 0.5540398740818469, "step": 132, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8230743408203125 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.565673828125 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.61181640625 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.32080078125 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.62408447265625 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.796630859375 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2193603515625 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.91143798828125 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.199798583984375 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.095458984375 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.037353515625 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5482177734375 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2608795166015625 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.956298828125 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.096435546875 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.09619140625 }, { "epoch": 0.5582371458551941, "step": 133, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8341064453125 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.973876953125 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.810791015625 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.573638916015625 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.622802734375 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.705810546875 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.229644775390625 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.506591796875 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.52374267578125 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5333251953125 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.345703125 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.22515869140625 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9095001220703125 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.6751708984375 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7445068359375 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.7950439453125 }, { "epoch": 0.5624344176285414, "step": 134, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.704345703125 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.7216796875 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.4154052734375 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.578369140625 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4144287109375 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.855224609375 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.900634765625 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.5589599609375 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.3712329864501953 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.500091552734375 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.93359375 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3058624267578125 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.74462890625 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.31463623046875 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4212646484375 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.819305419921875 }, { "epoch": 0.5666316894018888, "step": 135, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6346282958984375 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.07763671875 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0249214172363281 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.611328125 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.13720703125 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4630126953125 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.554443359375 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.59405517578125 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9056396484375 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.41943359375 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.638916015625 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3157958984375 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.365234375 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.34716796875 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.68408203125 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1875 }, { "epoch": 0.5708289611752361, "step": 136, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.75048828125 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.083099365234375 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.837646484375 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.567626953125 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9371337890625 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.212890625 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.281982421875 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.36566162109375 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.524383544921875 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.13330078125 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6162872314453125 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.57171630859375 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.037109375 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.201751708984375 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7718505859375 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.31097412109375 }, { "epoch": 0.5750262329485835, "step": 137, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.439208984375 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.679931640625 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9609375 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8533935546875 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1475830078125 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.650390625 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.428680419921875 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.10888671875 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.213134765625 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4925537109375 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7006683349609375 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.5632362365722656 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3984375 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.6058349609375 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5277099609375 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5912399291992188 }, { "epoch": 0.5792235047219307, "step": 138, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.3330078125 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -1.0090866088867188 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.052734375 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.13037109375 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.98077392578125 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.804168701171875 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7030029296875 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2996826171875 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.44854736328125 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.993896484375 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.77264404296875 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.881103515625 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.7186279296875 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7628173828125 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8393096923828125 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.39410400390625 }, { "epoch": 0.583420776495278, "step": 139, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.67144775390625 }, { "epoch": 0.5876180482686254, "grad_norm": 13.0, "learning_rate": 2.2265719790553147e-06, "loss": 0.5034, "step": 140 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.970703125 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.31512451171875 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.4407958984375 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2020263671875 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8011322021484375 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.959564208984375 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0059814453125 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.05331230163574219 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.63671875 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.720458984375 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.046630859375 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.24053955078125 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.729736328125 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.91748046875 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6854248046875 }, { "epoch": 0.5876180482686254, "step": 140, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6442642211914062 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8963623046875 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.090576171875 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3359375 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4530029296875 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.021484375 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0384521484375 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.900146484375 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.2327880859375 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.41143798828125 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.194580078125 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.219970703125 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.85595703125 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.62744140625 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.144287109375 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.46826171875 }, { "epoch": 0.5918153200419727, "step": 141, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.894287109375 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5680923461914062 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.11444091796875 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.728515625 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.864501953125 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.58978271484375 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8250732421875 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5574951171875 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.52197265625 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3970947265625 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8643798828125 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.11181640625 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.05780029296875 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3558349609375 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.08966064453125 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7941360473632812 }, { "epoch": 0.5960125918153201, "step": 142, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.06005859375 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.39697265625 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.238037109375 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.710205078125 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.94677734375 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.58740234375 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.155517578125 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8521881103515625 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.0623779296875 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.40411376953125 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.7578582763671875 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.12890625 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.052734375 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.531005859375 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8724365234375 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.6466064453125 }, { "epoch": 0.6002098635886673, "step": 143, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 0.85919189453125 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1705322265625 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.64453125 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.298431396484375 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.53192138671875 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.013092041015625 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.473907470703125 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.181640625 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1514892578125 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.584228515625 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.009033203125 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.6832809448242188 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3756103515625 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.57958984375 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.1322174072265625 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.53802490234375 }, { "epoch": 0.6044071353620147, "step": 144, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.86865234375 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.027069091796875 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.91448974609375 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5946044921875 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.20257568359375 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.76953125 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.583831787109375 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.8232421875 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4019775390625 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.841796875 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.794189453125 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2646484375 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.45501708984375 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.23876953125 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.310150146484375 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4528045654296875 }, { "epoch": 0.608604407135362, "step": 145, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.590606689453125 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.197357177734375 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.271728515625 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.75921630859375 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.6556396484375 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9864501953125 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9111328125 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.39935302734375 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.980712890625 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.286376953125 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.30322265625 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.925872802734375 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2492828369140625 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5129165649414062 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.78057861328125 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.876953125 }, { "epoch": 0.6128016789087093, "step": 146, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.85546875 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.575439453125 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.844482421875 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.457275390625 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.3974609375 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.717041015625 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.197265625 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7109375 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9034271240234375 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.33319091796875 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5257568359375 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.12890625 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.506561279296875 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5841102600097656 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.116455078125 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.51025390625 }, { "epoch": 0.6169989506820567, "step": 147, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.11663818359375 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.418914794921875 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.612518310546875 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.64947509765625 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.5284423828125 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.83050537109375 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.619384765625 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.3519287109375 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6190185546875 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.75030517578125 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.28411865234375 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7344970703125 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.56842041015625 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.19293212890625 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.51171875 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3096923828125 }, { "epoch": 0.621196222455404, "step": 148, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.83795166015625 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.08758544921875 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.224609375 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.142578125 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.80126953125 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9803466796875 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.542724609375 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.268402099609375 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2904052734375 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.850830078125 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.94091796875 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.330322265625 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2227783203125 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.275634765625 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.424896240234375 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.001708984375 }, { "epoch": 0.6253934942287513, "step": 149, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4300537109375 }, { "epoch": 0.6295907660020986, "grad_norm": 13.3125, "learning_rate": 1.8676665440207982e-06, "loss": 0.4839, "step": 150 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6554336547851562 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.580322265625 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.83056640625 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0848388671875 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8448333740234375 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.8492431640625 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.47607421875 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.462890625 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5816650390625 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.3866119384765625 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.2202072143554688 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.460693359375 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.16845703125 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7269287109375 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5223388671875 }, { "epoch": 0.6295907660020986, "step": 150, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5972900390625 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.67041015625 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.12530517578125 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2806396484375 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3697509765625 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.78485107421875 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.64208984375 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.622314453125 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7040863037109375 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.52490234375 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.75653076171875 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.48809814453125 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.907989501953125 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.62371826171875 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9425048828125 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.335693359375 }, { "epoch": 0.633788037775446, "step": 151, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.034149169921875 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.881103515625 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.907958984375 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.8671722412109375 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5106201171875 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.1274261474609375 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.923095703125 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1702880859375 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.657470703125 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0841064453125 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4097900390625 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6901397705078125 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.3035888671875 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.872344970703125 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.177734375 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.48614501953125 }, { "epoch": 0.6379853095487933, "step": 152, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7102203369140625 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.25311279296875 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.67822265625 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9530029296875 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.00750732421875 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.265625 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.35009765625 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.63916015625 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.94866943359375 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.435791015625 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.432220458984375 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.84002685546875 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.366455078125 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2296142578125 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.265625 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.857421875 }, { "epoch": 0.6421825813221406, "step": 153, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.061279296875 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.90673828125 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0240478515625 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.736328125 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.53729248046875 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.1705322265625 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.649169921875 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9876708984375 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.80364990234375 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5350341796875 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.61083984375 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.115966796875 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.321044921875 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.765045166015625 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5786209106445312 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.44818115234375 }, { "epoch": 0.646379853095488, "step": 154, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.279052734375 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.805419921875 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.334716796875 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.67724609375 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5769500732421875 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.319732666015625 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.013427734375 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.30450439453125 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8045654296875 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.33544921875 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.5837554931640625 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9566650390625 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9081840515136719 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.69293212890625 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.45758056640625 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0653076171875 }, { "epoch": 0.6505771248688352, "step": 155, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.312896728515625 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.6142578125 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.00537109375 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.07904052734375 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.14141845703125 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.354339599609375 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.731292724609375 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.028564453125 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.134613037109375 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6321868896484375 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.471435546875 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.56988525390625 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.17626953125 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2554931640625 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.01165771484375 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4450531005859375 }, { "epoch": 0.6547743966421826, "step": 156, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.147369384765625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1297607421875 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1373291015625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.05694580078125 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7822265625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9207763671875 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.810211181640625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.61822509765625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.01763916015625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.99072265625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.953765869140625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.98291015625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.05621337890625 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.664276123046875 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.677001953125 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.439453125 }, { "epoch": 0.6589716684155299, "step": 157, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.115966796875 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.267578125 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.2299346923828125 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7635498046875 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.91015625 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.269500732421875 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.668701171875 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7438201904296875 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.3597412109375 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.96435546875 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.06781005859375 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9002838134765625 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.38763427734375 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5277099609375 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0512237548828125 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7786865234375 }, { "epoch": 0.6631689401888772, "step": 158, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7818222045898438 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.7876358032226562 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.7208251953125 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.1839599609375 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.03564453125 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.708984375 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.508544921875 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4678955078125 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9662895202636719 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.38299560546875 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.209716796875 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.003173828125 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.9139404296875 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.37994384765625 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.455352783203125 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1467132568359375 }, { "epoch": 0.6673662119622246, "step": 159, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.984130859375 }, { "epoch": 0.6715634837355718, "grad_norm": 12.625, "learning_rate": 1.5222381987746104e-06, "loss": 0.5002, "step": 160 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.58953857421875 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.4229736328125 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5703125 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0009765625 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.298583984375 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.028717041015625 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1689453125 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.845947265625 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.51861572265625 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3978271484375 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.98577880859375 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.940185546875 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.673431396484375 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.668853759765625 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.883544921875 }, { "epoch": 0.6715634837355718, "step": 160, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.82421875 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.799560546875 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2708740234375 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1820068359375 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.419677734375 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1600341796875 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.795166015625 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.658935546875 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.875732421875 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.434478759765625 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.213714599609375 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.50201416015625 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.055572509765625 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.090087890625 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.113616943359375 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4004478454589844 }, { "epoch": 0.6757607555089192, "step": 161, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0934123992919922 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.076416015625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.074462890625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1890869140625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.70703125 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.59619140625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.697265625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.96929931640625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.4758148193359375 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.348876953125 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.427978515625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.157928466796875 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4254150390625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3519477844238281 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.786376953125 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2982330322265625 }, { "epoch": 0.6799580272822665, "step": 162, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4381103515625 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.915802001953125 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.012847900390625 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6317138671875 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.159210205078125 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1960601806640625 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3226776123046875 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.696197509765625 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.467529296875 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.15631103515625 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.98150634765625 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.526397705078125 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.40185546875 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.432373046875 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.900146484375 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.195068359375 }, { "epoch": 0.6841552990556139, "step": 163, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5654296875 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.23626708984375 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.0859375 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.44329833984375 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4722900390625 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 2.0831298828125 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.2437286376953125 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.850341796875 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6304931640625 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.49853515625 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.262451171875 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7401809692382812 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.732666015625 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.22998046875 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.66217041015625 }, { "epoch": 0.6883525708289612, "step": 164, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.297607421875 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.825439453125 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.74896240234375 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.10455322265625 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.12652587890625 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.966552734375 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7874755859375 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5108108520507812 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.722503662109375 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4554443359375 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.69976806640625 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.98541259765625 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.16949462890625 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.51373291015625 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 3.00970458984375 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.91448974609375 }, { "epoch": 0.6925498426023085, "step": 165, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.808349609375 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8360595703125 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.000244140625 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.880615234375 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.64788818359375 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.52734375 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.0338134765625 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.65045166015625 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5837860107421875 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.356689453125 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4265480041503906 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4959354400634766 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5576171875 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.88555908203125 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8050537109375 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.134521484375 }, { "epoch": 0.6967471143756558, "step": 166, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.11083984375 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.073974609375 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.27227783203125 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.376953125 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.854095458984375 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.69091796875 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.05029296875 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8056640625 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7188720703125 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.910400390625 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0516357421875 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5684051513671875 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.26025390625 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.47747802734375 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.89013671875 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.199462890625 }, { "epoch": 0.7009443861490031, "step": 167, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4825439453125 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.853607177734375 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.88409423828125 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.774627685546875 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.27130126953125 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6845703125 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5780029296875 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0503082275390625 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.89208984375 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.094970703125 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.22503662109375 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6796875 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.702301025390625 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4832763671875 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9159393310546875 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.83984375 }, { "epoch": 0.7051416579223505, "step": 168, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.97686767578125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.366455078125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.331298828125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5688610076904297 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.34423828125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.7302703857421875 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8181915283203125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.173583984375 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.727783203125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.607574462890625 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4227294921875 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.148712158203125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.101104736328125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8562240600585938 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.07342529296875 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.163330078125 }, { "epoch": 0.7093389296956978, "step": 169, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4449462890625 }, { "epoch": 0.7135362014690452, "grad_norm": 11.5, "learning_rate": 1.1976491487801747e-06, "loss": 0.4743, "step": 170 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0390167236328125 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1529541015625 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.20355224609375 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.98193359375 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.955810546875 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.892333984375 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3896484375 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.734222412109375 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.02642822265625 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.66943359375 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.17974853515625 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4102783203125 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.97015380859375 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5009841918945312 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4970703125 }, { "epoch": 0.7135362014690452, "step": 170, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3836669921875 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.021240234375 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 2.3452682495117188 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2881317138671875 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.94793701171875 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.322265625 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.240234375 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3087158203125 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8992919921875 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.139404296875 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.25732421875 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.9892578125 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.11962890625 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4835205078125 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7025146484375 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8668212890625 }, { "epoch": 0.7177334732423925, "step": 171, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.72418212890625 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.664794921875 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.022216796875 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.783935546875 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3961181640625 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4017333984375 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.25299072265625 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.940704345703125 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5756988525390625 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.776336669921875 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.9447021484375 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5616884231567383 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.12890625 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.627197265625 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4591064453125 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.5479316711425781 }, { "epoch": 0.7219307450157397, "step": 172, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.639892578125 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.14862060546875 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8353271484375 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.7633056640625 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.82733154296875 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.42840576171875 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.756103515625 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.800445556640625 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.31103515625 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.68914794921875 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.44464111328125 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.0406494140625 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.822265625 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.223663330078125 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9892578125 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.49072265625 }, { "epoch": 0.7261280167890871, "step": 173, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5987548828125 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.10430908203125 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.54119873046875 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2471923828125 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.131103515625 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.53326416015625 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1949462890625 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.89007568359375 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7342529296875 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.8012237548828125 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5650634765625 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8541259765625 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.884765625 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.13336181640625 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8221817016601562 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.009246826171875 }, { "epoch": 0.7303252885624344, "step": 174, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.987060546875 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.62060546875 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9874267578125 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.791595458984375 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.14892578125 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.035400390625 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.21697998046875 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8618392944335938 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.948974609375 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.659423828125 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.9493408203125 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.51513671875 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.75927734375 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.606201171875 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.92376708984375 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.658203125 }, { "epoch": 0.7345225603357818, "step": 175, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8838348388671875 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.184814453125 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1177978515625 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9656982421875 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.03460693359375 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.16607666015625 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5699462890625 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.461416244506836 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.662933349609375 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.270416259765625 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2015380859375 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.97900390625 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.90338134765625 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6240234375 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4307861328125 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.20849609375 }, { "epoch": 0.7387198321091291, "step": 176, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2390220165252686 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.1446533203125 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8096389770507812 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.7211761474609375 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5076904296875 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.772216796875 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.9560546875 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.0679931640625 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.27349853515625 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.45794677734375 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9714508056640625 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8041610717773438 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.5212173461914062 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.704742431640625 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.25408935546875 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.423095703125 }, { "epoch": 0.7429171038824763, "step": 177, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.40386962890625 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.643798828125 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0931396484375 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.08349609375 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.291015625 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0703125 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.2958984375 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8037109375 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0321044921875 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.8586654663085938 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5269775390625 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.06976318359375 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.36865234375 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.370941162109375 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.215850830078125 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.602935791015625 }, { "epoch": 0.7471143756558237, "step": 178, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.737548828125 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.335540771484375 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8853759765625 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.548553466796875 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.318359375 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.90850830078125 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.17138671875 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0859375 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.47540283203125 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.23309326171875 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9625244140625 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.240020751953125 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.10516357421875 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7367782592773438 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.6640625 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.10052490234375 }, { "epoch": 0.751311647429171, "step": 179, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.31707763671875 }, { "epoch": 0.7555089192025184, "grad_norm": 12.625, "learning_rate": 9.008174461027724e-07, "loss": 0.504, "step": 180 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.419677734375 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8283119201660156 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.472015380859375 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.2421875 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6640625 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.87451171875 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.186187744140625 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2733612060546875 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.357666015625 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.496337890625 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.644195556640625 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.080169677734375 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.4861907958984375 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8858642578125 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.612548828125 }, { "epoch": 0.7555089192025184, "step": 180, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.76318359375 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.233154296875 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.636932373046875 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.079833984375 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.3507080078125 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.292724609375 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.83319091796875 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2742919921875 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.34539794921875 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.68896484375 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.799072265625 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6784210205078125 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.39324951171875 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.932373046875 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.406494140625 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.933349609375 }, { "epoch": 0.7597061909758657, "step": 181, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8859939575195312 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7221832275390625 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.75750732421875 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.0411376953125 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4249267578125 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.350830078125 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2840347290039062 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.17279052734375 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.69677734375 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.631103515625 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.82177734375 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.199462890625 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.86175537109375 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6134033203125 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.146148681640625 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9313201904296875 }, { "epoch": 0.7639034627492131, "step": 182, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.1356201171875 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.2513427734375 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.0750732421875 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6596240997314453 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.76611328125 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.100341796875 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.19873046875 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.67138671875 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.65386962890625 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.90234375 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.59619140625 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3458251953125 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.996307373046875 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1970672607421875 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.39666748046875 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5625686645507812 }, { "epoch": 0.7681007345225603, "step": 183, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9752197265625 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.1545562744140625 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.0413818359375 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9093017578125 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.5682373046875 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.050750732421875 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.341796875 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.40673828125 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.17535400390625 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.426025390625 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6416015625 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.861572265625 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.529510498046875 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.018310546875 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.02197265625 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7301025390625 }, { "epoch": 0.7722980062959076, "step": 184, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4168701171875 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5701904296875 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.00048828125 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.97607421875 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9771270751953125 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.326171875 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.41571044921875 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.908477783203125 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8853759765625 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.587890625 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2109375 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4744873046875 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6306304931640625 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5981674194335938 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8297119140625 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.6973876953125 }, { "epoch": 0.776495278069255, "step": 185, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.488525390625 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.071044921875 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.14501953125 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.55755615234375 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.488555908203125 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.537353515625 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.95196533203125 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9840087890625 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.008880615234375 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2069091796875 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.855712890625 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.119873046875 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2169189453125 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4244384765625 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.536376953125 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.776123046875 }, { "epoch": 0.7806925498426023, "step": 186, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.25634765625 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5335693359375 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1290283203125 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 2.1207275390625 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.39288330078125 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.5108642578125 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.579833984375 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.88946533203125 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.368988037109375 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.611083984375 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.298095703125 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8092041015625 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5213775634765625 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.195404052734375 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.22454833984375 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.31536865234375 }, { "epoch": 0.7848898216159497, "step": 187, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6766357421875 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5794677734375 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6556196212768555 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.409423828125 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.68896484375 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.52532958984375 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.80718994140625 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.189208984375 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3443603515625 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.040557861328125 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.60345458984375 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1407470703125 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.9629745483398438 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.4180908203125 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1702880859375 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.6551513671875 }, { "epoch": 0.789087093389297, "step": 188, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.32275390625 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5703125 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5964279174804688 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.657958984375 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.76617431640625 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5623779296875 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.49169921875 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9209442138671875 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.877197265625 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.59912109375 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.277587890625 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.57720947265625 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.15966796875 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.35357666015625 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5756378173828125 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.37933349609375 }, { "epoch": 0.7932843651626443, "step": 189, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.23876953125 }, { "epoch": 0.7974816369359916, "grad_norm": 11.75, "learning_rate": 6.380695431405453e-07, "loss": 0.4662, "step": 190 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5836181640625 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.26409912109375 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.1000518798828125 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.939208984375 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4776153564453125 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.28173828125 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.076171875 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2265625 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.1881103515625 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.52294921875 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6309814453125 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6357421875 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5245361328125 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.499053955078125 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2858657836914062 }, { "epoch": 0.7974816369359916, "step": 190, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.1302490234375 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1812667846679688 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.6917724609375 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.741943359375 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.851806640625 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9015350341796875 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4869384765625 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7729415893554688 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7607421875 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.64276123046875 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.249755859375 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.144561767578125 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.48089599609375 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.25933837890625 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.520263671875 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1702880859375 }, { "epoch": 0.8016789087093389, "step": 191, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5078125 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.77362060546875 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.77569580078125 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4283447265625 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.498779296875 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6474609375 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1773681640625 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.606231689453125 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.82470703125 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.77496337890625 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.212554931640625 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.639068603515625 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.1787109375 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0103759765625 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.620452880859375 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.39208984375 }, { "epoch": 0.8058761804826863, "step": 192, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.60260009765625 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2066650390625 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.70556640625 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.489471435546875 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.40966796875 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9708251953125 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.96240234375 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.046142578125 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7122802734375 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5068359375 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9122314453125 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7960205078125 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.44537353515625 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6715087890625 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.7806186676025391 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.43414306640625 }, { "epoch": 0.8100734522560336, "step": 193, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.792724609375 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.4770660400390625 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2440185546875 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8427734375 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6719970703125 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0388031005859375 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.795745849609375 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8641357421875 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4832763671875 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.259521484375 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.37432861328125 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5372314453125 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.0580902099609375 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.42822265625 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.07550048828125 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.3922119140625 }, { "epoch": 0.8142707240293809, "step": 194, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0228271484375 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6746826171875 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8566131591796875 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.145263671875 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.959228515625 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.383056640625 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.390380859375 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.111480712890625 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.11083984375 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.52215576171875 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.76617431640625 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0723876953125 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2691650390625 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8765869140625 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.22088623046875 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.21356201171875 }, { "epoch": 0.8184679958027282, "step": 195, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.46728515625 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.6436767578125 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.88885498046875 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3673095703125 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3209991455078125 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.109832763671875 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2353515625 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.70892333984375 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.73828125 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3021240234375 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.979248046875 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.420318603515625 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8037109375 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0849609375 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.61822509765625 }, { "epoch": 0.8226652675760755, "step": 196, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.921783447265625 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0616874694824219 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.00152587890625 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2528533935546875 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.04095458984375 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.433868408203125 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.992095947265625 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.454345703125 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2259902954101562 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8018798828125 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3944091796875 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.573486328125 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 1.060546875 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.11334228515625 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.011138916015625 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.39031982421875 }, { "epoch": 0.8268625393494229, "step": 197, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3021240234375 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.734771728515625 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.3194580078125 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6546630859375 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.326416015625 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9921646118164062 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.1219482421875 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.5934066772460938 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.499755859375 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.776611328125 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7491912841796875 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.462799072265625 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.629638671875 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.29168701171875 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.784912109375 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.36083984375 }, { "epoch": 0.8310598111227702, "step": 198, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.60406494140625 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8389892578125 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.12255859375 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.581207275390625 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5736083984375 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6728477478027344 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6729736328125 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0810489654541016 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.34332275390625 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2890625 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.935302734375 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.77813720703125 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5036077499389648 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.721405029296875 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.09173583984375 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.281280517578125 }, { "epoch": 0.8352570828961176, "step": 199, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8037109375 }, { "epoch": 0.8394543546694648, "grad_norm": 11.9375, "learning_rate": 4.150054552753055e-07, "loss": 0.5039, "step": 200 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2457275390625 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.93170166015625 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9368896484375 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.595703125 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.0439376831054688 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.88427734375 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6666259765625 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.34814453125 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.51171875 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.97796630859375 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.12615966796875 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.073974609375 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.4368896484375 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8491287231445312 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.99566650390625 }, { "epoch": 0.8394543546694648, "step": 200, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2486572265625 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5243186950683594 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2388916015625 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -1.000732421875 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4242630004882812 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5157470703125 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.033203125 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8619232177734375 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1104736328125 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.180023193359375 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.50341796875 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.08056640625 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6640625 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6659088134765625 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.48834228515625 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.656494140625 }, { "epoch": 0.8436516264428122, "step": 201, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9857177734375 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5045928955078125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3516845703125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.55517578125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.81494140625 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.12322998046875 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.78790283203125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.979736328125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.046875 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0806884765625 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.02099609375 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1007080078125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.8355712890625 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.828125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2869415283203125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.565673828125 }, { "epoch": 0.8478488982161595, "step": 202, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.836181640625 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.84765625 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.400390625 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.04296875 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.513427734375 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.094482421875 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1230316162109375 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.860443115234375 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.031982421875 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.6866455078125 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.42059326171875 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.7073974609375 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.813720703125 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4990386962890625 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.5955810546875 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.32769775390625 }, { "epoch": 0.8520461699895068, "step": 203, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8720855712890625 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.826904296875 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.25244140625 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.90228271484375 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.44976806640625 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.06219482421875 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.0921783447265625 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.560546875 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.980010986328125 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.593475341796875 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.734588623046875 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.4290771484375 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0303535461425781 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.8699951171875 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.379150390625 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7034912109375 }, { "epoch": 0.8562434417628542, "step": 204, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.232696533203125 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.73095703125 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1898193359375 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6934814453125 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.84539794921875 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.251708984375 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.27886962890625 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.079833984375 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.400634765625 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.9638671875 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6705322265625 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.781564712524414 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8389892578125 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.792572021484375 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.283447265625 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.54931640625 }, { "epoch": 0.8604407135362014, "step": 205, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4348793029785156 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.389007568359375 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.3881187438964844 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.3056640625 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.3111572265625 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3397216796875 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.36669921875 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.26263427734375 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.488525390625 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.80010986328125 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5296630859375 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.61865234375 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.395782470703125 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0205078125 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.47914695739746094 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.6141891479492188 }, { "epoch": 0.8646379853095488, "step": 206, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3070220947265625 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.8992919921875 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9189453125 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.35443115234375 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.990966796875 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9317626953125 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.871826171875 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6041259765625 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.277099609375 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0467529296875 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.38427734375 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.726806640625 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8536224365234375 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.84722900390625 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2356414794921875 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1507568359375 }, { "epoch": 0.8688352570828961, "step": 207, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.877685546875 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.705474853515625 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7536773681640625 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.126220703125 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.70989990234375 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2689361572265625 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.208251953125 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.6325836181640625 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9132080078125 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6116790771484375 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.94598388671875 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.37054443359375 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8710908889770508 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.678253173828125 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.224853515625 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3812255859375 }, { "epoch": 0.8730325288562435, "step": 208, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.720947265625 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.2581787109375 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.70074462890625 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.506103515625 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 2.06494140625 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.47564697265625 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.71160888671875 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.853515625 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.061279296875 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9366455078125 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.73590087890625 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2579345703125 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.313720703125 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.99127197265625 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.827423095703125 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.167083740234375 }, { "epoch": 0.8772298006295908, "step": 209, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.262451171875 }, { "epoch": 0.881427072402938, "grad_norm": 15.4375, "learning_rate": 2.3637940626713346e-07, "loss": 0.5089, "step": 210 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.93975830078125 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.9302978515625 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.851654052734375 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.10546875 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7628173828125 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4920654296875 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.307373046875 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0302734375 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.672271728515625 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.034088134765625 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.612060546875 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.378814697265625 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.408966064453125 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2511138916015625 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.83160400390625 }, { "epoch": 0.881427072402938, "step": 210, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.65655517578125 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7753448486328125 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9171142578125 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.977783203125 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.056884765625 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8681640625 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.279052734375 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.08892822265625 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4649429321289062 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7741851806640625 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5516357421875 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.614501953125 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.94305419921875 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9520721435546875 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.15545654296875 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0379638671875 }, { "epoch": 0.8856243441762854, "step": 211, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.65533447265625 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4761962890625 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.42474365234375 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.31817626953125 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6412353515625 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.080322265625 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5447998046875 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.84521484375 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7618408203125 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.04736328125 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.228038787841797 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.484375 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.474395751953125 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7843017578125 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5560302734375 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8195638656616211 }, { "epoch": 0.8898216159496327, "step": 212, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.4326171875 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6817817687988281 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.989013671875 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8570556640625 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.2672119140625 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.15570068359375 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.15966796875 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.61572265625 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.419921875 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7256622314453125 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9476051330566406 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.248291015625 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.8958740234375 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3729248046875 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.133056640625 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.64739990234375 }, { "epoch": 0.8940188877229801, "step": 213, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.76171875 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.528411865234375 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.550506591796875 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.85394287109375 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2723846435546875 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.4527587890625 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.511505126953125 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.34765625 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0927734375 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.8487548828125 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.182342529296875 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.91259765625 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.830810546875 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.1705322265625 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6539459228515625 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1009521484375 }, { "epoch": 0.8982161594963274, "step": 214, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.65777587890625 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9175662994384766 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.479248046875 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.377685546875 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.602783203125 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8299560546875 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.48876953125 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.8896484375 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.284423828125 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.994384765625 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.67584228515625 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.064300537109375 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.521575927734375 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.077880859375 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4348325729370117 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.825408935546875 }, { "epoch": 0.9024134312696747, "step": 215, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.916229248046875 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.681884765625 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.21240234375 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.50830078125 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.83538818359375 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.3554229736328125 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.39544677734375 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.811279296875 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0244140625 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.81982421875 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.06439208984375 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.57763671875 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5281982421875 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.773712158203125 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.631103515625 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.27685546875 }, { "epoch": 0.906610703043022, "step": 216, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.66973876953125 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.135955810546875 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.82421875 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.271484375 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.4332275390625 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.03302001953125 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2310791015625 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.255126953125 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2882080078125 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.89794921875 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9288330078125 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.24462890625 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.45068359375 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.98297119140625 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.788330078125 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.723968505859375 }, { "epoch": 0.9108079748163693, "step": 217, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.638946533203125 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.6985244750976562 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.002197265625 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.94390869140625 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.65301513671875 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7978515625 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5550537109375 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.64508056640625 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.1905517578125 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.862060546875 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.694580078125 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.810791015625 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7159423828125 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.74285888671875 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.827880859375 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.49896240234375 }, { "epoch": 0.9150052465897167, "step": 218, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.21435546875 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7580718994140625 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.891357421875 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.14599609375 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.455078125 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.19677734375 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.47808837890625 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.493408203125 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9110870361328125 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.053955078125 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.301513671875 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.810455322265625 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.76611328125 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.49267578125 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2421875 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6484375 }, { "epoch": 0.919202518363064, "step": 219, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.898162841796875 }, { "epoch": 0.9233997901364114, "grad_norm": 11.375, "learning_rate": 1.0599850022898539e-07, "loss": 0.4991, "step": 220 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.490478515625 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.26947021484375 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.84716796875 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0165023803710938 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.99627685546875 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.73095703125 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8878173828125 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.45361328125 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1163177490234375 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0771484375 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.5280914306640625 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4041748046875 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.38751220703125 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.4415283203125 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0428314208984375 }, { "epoch": 0.9233997901364114, "step": 220, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7213134765625 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.958740234375 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.794677734375 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9814453125 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.91131591796875 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.4583740234375 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3017578125 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.163576126098633 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.223876953125 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.28753662109375 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.981201171875 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.01409912109375 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.48388671875 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.847259521484375 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1812744140625 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.42822265625 }, { "epoch": 0.9275970619097587, "step": 221, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.81903076171875 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.9635009765625 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9402389526367188 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.310546875 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.52294921875 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9439697265625 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.3616943359375 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.3951416015625 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5912628173828125 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.937744140625 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.00616455078125 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7162322998046875 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.447265625 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.4288330078125 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.81494140625 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.94580078125 }, { "epoch": 0.9317943336831059, "step": 222, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.935302734375 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6300048828125 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9296875 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.03662109375 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1894989013671875 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9964599609375 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.35693359375 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.41082763671875 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.4969482421875 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.619537353515625 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2291259765625 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.3427734375 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2078857421875 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6248321533203125 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.654632568359375 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1044921875 }, { "epoch": 0.9359916054564533, "step": 223, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.12677001953125 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.010009765625 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.037933349609375 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.464599609375 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.514404296875 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.2083740234375 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.831787109375 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.647705078125 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.1915283203125 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.2034912109375 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.12158203125 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.131103515625 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.578857421875 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.2708740234375 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.59130859375 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.789639949798584 }, { "epoch": 0.9401888772298006, "step": 224, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.83489990234375 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.965576171875 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7514572143554688 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.047149658203125 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6573486328125 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2132568359375 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.02874755859375 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.03472900390625 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9833984375 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.006103515625 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.601806640625 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.29150390625 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.0841064453125 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5257568359375 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.151123046875 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.263702392578125 }, { "epoch": 0.944386149003148, "step": 225, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.216552734375 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.320343017578125 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5742988586425781 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1796875 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.28009033203125 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.72503662109375 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.7003173828125 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.6341552734375 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.99365234375 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7545166015625 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1494140625 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.04931640625 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.444610595703125 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.714599609375 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.007080078125 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1029052734375 }, { "epoch": 0.9485834207764953, "step": 226, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.794952392578125 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.08056640625 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.82928466796875 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.318939208984375 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.936767578125 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.574951171875 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.593505859375 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.90618896484375 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.67510986328125 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.93560791015625 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.780670166015625 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5731201171875 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.399658203125 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.56390380859375 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0815906524658203 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.765411376953125 }, { "epoch": 0.9527806925498427, "step": 227, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.938232421875 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.841705322265625 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.11474609375 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.863189697265625 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.193603515625 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.19158935546875 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.078125 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.995086669921875 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4984130859375 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.03466796875 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0428466796875 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.8478240966796875 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.200439453125 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9227333068847656 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.783935546875 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0948486328125 }, { "epoch": 0.9569779643231899, "step": 228, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4791259765625 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.8279876708984375 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.88916015625 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.013671875 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.96630859375 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5390625 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.4991455078125 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5576171875 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.550872802734375 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.2388687133789062 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.659423828125 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.930419921875 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.298095703125 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.683929443359375 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.5736083984375 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.246063232421875 }, { "epoch": 0.9611752360965372, "step": 229, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.41552734375 }, { "epoch": 0.9653725078698846, "grad_norm": 9.8125, "learning_rate": 2.6641579812224373e-08, "loss": 0.4969, "step": 230 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.80224609375 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.63983154296875 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6217041015625 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 2.026611328125 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.88482666015625 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6334228515625 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.3328170776367188 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.480224609375 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.92578125 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.5927734375 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.6005859375 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.92559814453125 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.81207275390625 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.36865234375 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 3.0950927734375 }, { "epoch": 0.9653725078698846, "step": 230, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3714599609375 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.000732421875 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.635009765625 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.67822265625 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.5623779296875 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.2744140625 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.652587890625 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.6705322265625 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.552978515625 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.848388671875 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.5340576171875 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.8544921875 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.5378799438476562 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.32574462890625 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.0665283203125 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.1351318359375 }, { "epoch": 0.9695697796432319, "step": 231, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5513992309570312 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6120834350585938 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.167236328125 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.859619140625 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.993093490600586 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.759002685546875 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7560577392578125 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.814697265625 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.0987625122070312 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1201171875 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5908203125 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7598876953125 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 0.9091033935546875 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.137451171875 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4124755859375 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.7468833923339844 }, { "epoch": 0.9737670514165793, "step": 232, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5199317932128906 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.34942626953125 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.67144775390625 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.2156982421875 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4484405517578125 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3375244140625 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.729736328125 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.501953125 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.8819580078125 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.9447021484375 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.31884765625 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.86529541015625 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.6669921875 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.161041259765625 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.850830078125 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.997467041015625 }, { "epoch": 0.9779643231899265, "step": 233, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.6947021484375 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5234375 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.425537109375 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.5966796875 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.620361328125 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.441650390625 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.5, "train/overall_margin_mean": -0.5759735107421875 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.829345703125 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.806884765625 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.462646484375 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.58172607421875 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.763671875 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.980224609375 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1465225219726562 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.24072265625 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.81402587890625 }, { "epoch": 0.9821615949632738, "step": 234, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.357748031616211 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.9765625 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.4627685546875 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.9541015625 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.761474609375 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.618988037109375 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.52740478515625 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5029296875 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7666015625 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.043670654296875 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.82421875 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.3917617797851562 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.375, "train/overall_margin_mean": 0.4208984375 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.1458091735839844 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.7676849365234375 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.4630661010742188 }, { "epoch": 0.9863588667366212, "step": 235, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.9644775390625 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.25, "train/overall_margin_mean": -0.1749267578125 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.097900390625 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.2152099609375 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.27734375 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.99676513671875 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.375, "train/overall_margin_mean": -0.16888427734375 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.66162109375 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 1.1611328125 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.85675048828125 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.24859619140625 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.921539306640625 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.346405029296875 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.4061279296875 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.8597412109375 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.59588623046875 }, { "epoch": 0.9905561385099685, "step": 236, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.7470703125 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.2991943359375 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 1.3822021484375 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 2.0517578125 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.5504150390625 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.7998046875 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.543975830078125 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 2.1201324462890625 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 0.6055908203125 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.50885009765625 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.7017974853515625 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.75, "train/overall_margin_mean": 1.02960205078125 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 1.8994064331054688 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.893310546875 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.625, "train/overall_margin_mean": -0.0279541015625 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.6639404296875 }, { "epoch": 0.9947534102833159, "step": 237, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.9693603515625 }, { "epoch": 0.9989506820566632, "step": 238, "train/overall_accuracy": 0.5, "train/overall_margin_mean": 0.3382568359375 }, { "epoch": 0.9989506820566632, "step": 238, "train/overall_accuracy": 0.875, "train/overall_margin_mean": 1.7119140625 }, { "epoch": 0.9989506820566632, "step": 238, "train/overall_accuracy": 0.625, "train/overall_margin_mean": 0.92999267578125 }, { "epoch": 0.9989506820566632, "step": 238, "train/overall_accuracy": 1.0, "train/overall_margin_mean": 0.5966796875 } ], "logging_steps": 10, "max_steps": 239, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }