| objective,best,learning_rate,num_train_epochs,per_device_train_batch_size,warmup_steps,weight_decay,time_this_iter_s | |
| 0.5645421568643824,False,4.331856267483512e-05,1,8,0,0.07944089967936842,1018.9533109664917 | |
| 0.5308836004396339,False,3.9182510615044115e-05,1,16,1000,0.09845902649689675,944.7089395523071 | |
| 0.5480539392697081,False,1.7214822813591524e-05,2,8,250,0.144094925415577,1020.5628039836884 | |
| 0.5370892084279055,False,2.704648069279383e-05,5,16,500,0.027141889289293984,944.7776620388031 | |
| 0.5327635637405213,False,4.459899753015981e-05,5,16,1000,0.0852580117524583,944.7867786884308 | |
| 0.5190322695049081,False,1.2410705452298064e-05,5,16,0,0.08116122124035066,945.0260012149811 | |
| 0.5456873822288595,False,2.7418797048606627e-05,1,8,250,0.16915150577354252,1020.3443148136139 | |
| 0.5913354902422772,False,3.674371381938092e-05,2,16,500,0.026674369325998804,942.4582366943359 | |
| 0.6079231608164175,True,1.4176978406088547e-05,4,8,500,0.06913192321078417,1018.4374647140503 | |
| 0.5444957110604092,False,3.0290147327397735e-05,3,16,500,0.12361945588474021,943.6727764606476 | |