diff --git "a/log/debug_0.log" "b/log/debug_0.log" --- "a/log/debug_0.log" +++ "b/log/debug_0.log" @@ -38530,3 +38530,1009 @@ Use FP16 precision: False 02/26/2022 02:45:39 - INFO - codeparrot_training - Step 37998: {'lr': 7.324644623311046e-05, 'samples': 19455488, 'steps': 37998, 'loss/train': 0.07264846563339233} 02/26/2022 02:45:45 - INFO - codeparrot_training - Step 37999: {'lr': 7.323487508963392e-05, 'samples': 19456000, 'steps': 37999, 'loss/train': 1.960349678993225} 02/26/2022 02:45:45 - INFO - codeparrot_training - Evaluating and saving model checkpoint +02/26/2022 02:46:03 - WARNING - huggingface_hub.repository - Several commits (38) will be pushed upstream. +02/26/2022 02:46:03 - WARNING - huggingface_hub.repository - The progress bars may be unreliable. +02/26/2022 02:46:37 - WARNING - huggingface_hub.repository - To https://huggingface.co/ncoop57/multi-code-clippy + 333cdce..e53c3e1 floral-grass-11 -> floral-grass-11 + +02/26/2022 02:46:42 - INFO - codeparrot_training - Step 38000: {'lr': 7.322330470336314e-05, 'samples': 19456512, 'steps': 38000, 'loss/train': 1.6377456188201904} +02/26/2022 02:46:48 - INFO - codeparrot_training - Step 38001: {'lr': 7.321173507434758e-05, 'samples': 19457024, 'steps': 38001, 'loss/train': 0.6367076635360718} +02/26/2022 02:46:51 - INFO - codeparrot_training - Step 38002: {'lr': 7.320016620263673e-05, 'samples': 19457536, 'steps': 38002, 'loss/train': 2.099254608154297} +02/26/2022 02:46:57 - INFO - codeparrot_training - Step 38003: {'lr': 7.318859808828032e-05, 'samples': 19458048, 'steps': 38003, 'loss/train': 1.628173589706421} +02/26/2022 02:47:00 - INFO - codeparrot_training - Step 38004: {'lr': 7.317703073132778e-05, 'samples': 19458560, 'steps': 38004, 'loss/train': 2.3905887603759766} +02/26/2022 02:47:06 - INFO - codeparrot_training - Step 38005: {'lr': 7.316546413182874e-05, 'samples': 19459072, 'steps': 38005, 'loss/train': 0.27225345373153687} +02/26/2022 02:47:09 - INFO - codeparrot_training - Step 38006: {'lr': 7.315389828983257e-05, 'samples': 19459584, 'steps': 38006, 'loss/train': 0.3845939636230469} +02/26/2022 02:47:15 - INFO - codeparrot_training - Step 38007: {'lr': 7.314233320538907e-05, 'samples': 19460096, 'steps': 38007, 'loss/train': 0.7665659785270691} +02/26/2022 02:47:19 - INFO - codeparrot_training - Step 38008: {'lr': 7.313076887854764e-05, 'samples': 19460608, 'steps': 38008, 'loss/train': 1.9438731670379639} +02/26/2022 02:47:24 - INFO - codeparrot_training - Step 38009: {'lr': 7.311920530935781e-05, 'samples': 19461120, 'steps': 38009, 'loss/train': 1.8758307695388794} +02/26/2022 02:47:28 - INFO - codeparrot_training - Step 38010: {'lr': 7.310764249786908e-05, 'samples': 19461632, 'steps': 38010, 'loss/train': 1.646323561668396} +02/26/2022 02:47:33 - INFO - codeparrot_training - Step 38011: {'lr': 7.309608044413121e-05, 'samples': 19462144, 'steps': 38011, 'loss/train': 2.3616750240325928} +02/26/2022 02:47:37 - INFO - codeparrot_training - Step 38012: {'lr': 7.30845191481934e-05, 'samples': 19462656, 'steps': 38012, 'loss/train': 1.0274697542190552} +02/26/2022 02:47:43 - INFO - codeparrot_training - Step 38013: {'lr': 7.307295861010538e-05, 'samples': 19463168, 'steps': 38013, 'loss/train': 0.612236738204956} +02/26/2022 02:47:46 - INFO - codeparrot_training - Step 38014: {'lr': 7.306139882991656e-05, 'samples': 19463680, 'steps': 38014, 'loss/train': 0.9534772038459778} +02/26/2022 02:47:52 - INFO - codeparrot_training - Step 38015: {'lr': 7.30498398076766e-05, 'samples': 19464192, 'steps': 38015, 'loss/train': 1.9720512628555298} +02/26/2022 02:47:55 - INFO - codeparrot_training - Step 38016: {'lr': 7.303828154343494e-05, 'samples': 19464704, 'steps': 38016, 'loss/train': 0.32893434166908264} +02/26/2022 02:48:01 - INFO - codeparrot_training - Step 38017: {'lr': 7.302672403724112e-05, 'samples': 19465216, 'steps': 38017, 'loss/train': 1.5718871355056763} +02/26/2022 02:48:04 - INFO - codeparrot_training - Step 38018: {'lr': 7.301516728914451e-05, 'samples': 19465728, 'steps': 38018, 'loss/train': 2.3168623447418213} +02/26/2022 02:48:10 - INFO - codeparrot_training - Step 38019: {'lr': 7.300361129919481e-05, 'samples': 19466240, 'steps': 38019, 'loss/train': 1.5415875911712646} +02/26/2022 02:48:13 - INFO - codeparrot_training - Step 38020: {'lr': 7.299205606744142e-05, 'samples': 19466752, 'steps': 38020, 'loss/train': 1.5314196348190308} +02/26/2022 02:48:19 - INFO - codeparrot_training - Step 38021: {'lr': 7.298050159393388e-05, 'samples': 19467264, 'steps': 38021, 'loss/train': 1.9744246006011963} +02/26/2022 02:48:22 - INFO - codeparrot_training - Step 38022: {'lr': 7.296894787872158e-05, 'samples': 19467776, 'steps': 38022, 'loss/train': 1.652613639831543} +02/26/2022 02:48:28 - INFO - codeparrot_training - Step 38023: {'lr': 7.295739492185416e-05, 'samples': 19468288, 'steps': 38023, 'loss/train': 2.4441065788269043} +02/26/2022 02:48:32 - INFO - codeparrot_training - Step 38024: {'lr': 7.294584272338103e-05, 'samples': 19468800, 'steps': 38024, 'loss/train': 1.5685055255889893} +02/26/2022 02:48:37 - INFO - codeparrot_training - Step 38025: {'lr': 7.293429128335172e-05, 'samples': 19469312, 'steps': 38025, 'loss/train': 2.0573067665100098} +02/26/2022 02:48:41 - INFO - codeparrot_training - Step 38026: {'lr': 7.292274060181558e-05, 'samples': 19469824, 'steps': 38026, 'loss/train': 2.105271339416504} +02/26/2022 02:48:46 - INFO - codeparrot_training - Step 38027: {'lr': 7.29111906788223e-05, 'samples': 19470336, 'steps': 38027, 'loss/train': 1.6482328176498413} +02/26/2022 02:48:50 - INFO - codeparrot_training - Step 38028: {'lr': 7.289964151442113e-05, 'samples': 19470848, 'steps': 38028, 'loss/train': 0.9010985493659973} +02/26/2022 02:48:55 - INFO - codeparrot_training - Step 38029: {'lr': 7.288809310866182e-05, 'samples': 19471360, 'steps': 38029, 'loss/train': 2.1914548873901367} +02/26/2022 02:48:59 - INFO - codeparrot_training - Step 38030: {'lr': 7.287654546159356e-05, 'samples': 19471872, 'steps': 38030, 'loss/train': 1.8573434352874756} +02/26/2022 02:49:04 - INFO - codeparrot_training - Step 38031: {'lr': 7.286499857326597e-05, 'samples': 19472384, 'steps': 38031, 'loss/train': 1.8783557415008545} +02/26/2022 02:49:08 - INFO - codeparrot_training - Step 38032: {'lr': 7.285345244372843e-05, 'samples': 19472896, 'steps': 38032, 'loss/train': 2.015120029449463} +02/26/2022 02:49:13 - INFO - codeparrot_training - Step 38033: {'lr': 7.28419070730306e-05, 'samples': 19473408, 'steps': 38033, 'loss/train': 2.113590955734253} +02/26/2022 02:49:16 - INFO - codeparrot_training - Step 38034: {'lr': 7.283036246122163e-05, 'samples': 19473920, 'steps': 38034, 'loss/train': 2.720353364944458} +02/26/2022 02:49:22 - INFO - codeparrot_training - Step 38035: {'lr': 7.281881860835121e-05, 'samples': 19474432, 'steps': 38035, 'loss/train': 1.833739995956421} +02/26/2022 02:49:26 - INFO - codeparrot_training - Step 38036: {'lr': 7.280727551446862e-05, 'samples': 19474944, 'steps': 38036, 'loss/train': 1.8961317539215088} +02/26/2022 02:49:32 - INFO - codeparrot_training - Step 38037: {'lr': 7.279573317962348e-05, 'samples': 19475456, 'steps': 38037, 'loss/train': 1.1372878551483154} +02/26/2022 02:49:35 - INFO - codeparrot_training - Step 38038: {'lr': 7.278419160386515e-05, 'samples': 19475968, 'steps': 38038, 'loss/train': 1.3634076118469238} +02/26/2022 02:49:41 - INFO - codeparrot_training - Step 38039: {'lr': 7.277265078724308e-05, 'samples': 19476480, 'steps': 38039, 'loss/train': 0.1734483689069748} +02/26/2022 02:49:45 - INFO - codeparrot_training - Step 38040: {'lr': 7.276111072980662e-05, 'samples': 19476992, 'steps': 38040, 'loss/train': 0.5034950971603394} +02/26/2022 02:49:50 - INFO - codeparrot_training - Step 38041: {'lr': 7.274957143160535e-05, 'samples': 19477504, 'steps': 38041, 'loss/train': 1.6803172826766968} +02/26/2022 02:49:54 - INFO - codeparrot_training - Step 38042: {'lr': 7.273803289268862e-05, 'samples': 19478016, 'steps': 38042, 'loss/train': 1.9188061952590942} +02/26/2022 02:49:59 - INFO - codeparrot_training - Step 38043: {'lr': 7.272649511310589e-05, 'samples': 19478528, 'steps': 38043, 'loss/train': 1.6629756689071655} +02/26/2022 02:50:03 - INFO - codeparrot_training - Step 38044: {'lr': 7.271495809290657e-05, 'samples': 19479040, 'steps': 38044, 'loss/train': 1.9798567295074463} +02/26/2022 02:50:08 - INFO - codeparrot_training - Step 38045: {'lr': 7.270342183213999e-05, 'samples': 19479552, 'steps': 38045, 'loss/train': 0.5005486011505127} +02/26/2022 02:50:12 - INFO - codeparrot_training - Step 38046: {'lr': 7.269188633085571e-05, 'samples': 19480064, 'steps': 38046, 'loss/train': 1.2825769186019897} +02/26/2022 02:50:18 - INFO - codeparrot_training - Step 38047: {'lr': 7.26803515891031e-05, 'samples': 19480576, 'steps': 38047, 'loss/train': 1.5931419134140015} +02/26/2022 02:50:21 - INFO - codeparrot_training - Step 38048: {'lr': 7.266881760693158e-05, 'samples': 19481088, 'steps': 38048, 'loss/train': 0.5860764980316162} +02/26/2022 02:50:27 - INFO - codeparrot_training - Step 38049: {'lr': 7.265728438439046e-05, 'samples': 19481600, 'steps': 38049, 'loss/train': 2.6361136436462402} +02/26/2022 02:50:31 - INFO - codeparrot_training - Step 38050: {'lr': 7.264575192152925e-05, 'samples': 19482112, 'steps': 38050, 'loss/train': 2.3184337615966797} +02/26/2022 02:50:36 - INFO - codeparrot_training - Step 38051: {'lr': 7.263422021839736e-05, 'samples': 19482624, 'steps': 38051, 'loss/train': 1.7024630308151245} +02/26/2022 02:50:40 - INFO - codeparrot_training - Step 38052: {'lr': 7.262268927504414e-05, 'samples': 19483136, 'steps': 38052, 'loss/train': 1.4867494106292725} +02/26/2022 02:50:45 - INFO - codeparrot_training - Step 38053: {'lr': 7.261115909151894e-05, 'samples': 19483648, 'steps': 38053, 'loss/train': 0.991300106048584} +02/26/2022 02:50:49 - INFO - codeparrot_training - Step 38054: {'lr': 7.259962966787126e-05, 'samples': 19484160, 'steps': 38054, 'loss/train': 1.9065449237823486} +02/26/2022 02:50:55 - INFO - codeparrot_training - Step 38055: {'lr': 7.258810100415044e-05, 'samples': 19484672, 'steps': 38055, 'loss/train': 1.3514381647109985} +02/26/2022 02:50:58 - INFO - codeparrot_training - Step 38056: {'lr': 7.257657310040585e-05, 'samples': 19485184, 'steps': 38056, 'loss/train': 0.7219937443733215} +02/26/2022 02:51:04 - INFO - codeparrot_training - Step 38057: {'lr': 7.256504595668684e-05, 'samples': 19485696, 'steps': 38057, 'loss/train': 1.651576042175293} +02/26/2022 02:51:07 - INFO - codeparrot_training - Step 38058: {'lr': 7.255351957304287e-05, 'samples': 19486208, 'steps': 38058, 'loss/train': 2.153428554534912} +02/26/2022 02:51:13 - INFO - codeparrot_training - Step 38059: {'lr': 7.25419939495233e-05, 'samples': 19486720, 'steps': 38059, 'loss/train': 2.180460214614868} +02/26/2022 02:51:17 - INFO - codeparrot_training - Step 38060: {'lr': 7.253046908617747e-05, 'samples': 19487232, 'steps': 38060, 'loss/train': 1.2783384323120117} +02/26/2022 02:51:22 - INFO - codeparrot_training - Step 38061: {'lr': 7.25189449830547e-05, 'samples': 19487744, 'steps': 38061, 'loss/train': 1.4480818510055542} +02/26/2022 02:51:26 - INFO - codeparrot_training - Step 38062: {'lr': 7.250742164020446e-05, 'samples': 19488256, 'steps': 38062, 'loss/train': 1.1692036390304565} +02/26/2022 02:51:31 - INFO - codeparrot_training - Step 38063: {'lr': 7.249589905767601e-05, 'samples': 19488768, 'steps': 38063, 'loss/train': 1.20078706741333} +02/26/2022 02:51:35 - INFO - codeparrot_training - Step 38064: {'lr': 7.24843772355189e-05, 'samples': 19489280, 'steps': 38064, 'loss/train': 1.283164143562317} +02/26/2022 02:51:40 - INFO - codeparrot_training - Step 38065: {'lr': 7.247285617378221e-05, 'samples': 19489792, 'steps': 38065, 'loss/train': 1.3847582340240479} +02/26/2022 02:51:44 - INFO - codeparrot_training - Step 38066: {'lr': 7.246133587251549e-05, 'samples': 19490304, 'steps': 38066, 'loss/train': 1.312401533126831} +02/26/2022 02:51:49 - INFO - codeparrot_training - Step 38067: {'lr': 7.244981633176798e-05, 'samples': 19490816, 'steps': 38067, 'loss/train': 1.566505789756775} +02/26/2022 02:51:53 - INFO - codeparrot_training - Step 38068: {'lr': 7.243829755158923e-05, 'samples': 19491328, 'steps': 38068, 'loss/train': 1.360145092010498} +02/26/2022 02:51:58 - INFO - codeparrot_training - Step 38069: {'lr': 7.242677953202828e-05, 'samples': 19491840, 'steps': 38069, 'loss/train': 0.4492625892162323} +02/26/2022 02:52:02 - INFO - codeparrot_training - Step 38070: {'lr': 7.241526227313469e-05, 'samples': 19492352, 'steps': 38070, 'loss/train': 1.487532377243042} +02/26/2022 02:52:08 - INFO - codeparrot_training - Step 38071: {'lr': 7.240374577495765e-05, 'samples': 19492864, 'steps': 38071, 'loss/train': 1.5095921754837036} +02/26/2022 02:52:12 - INFO - codeparrot_training - Step 38072: {'lr': 7.239223003754672e-05, 'samples': 19493376, 'steps': 38072, 'loss/train': 1.449380874633789} +02/26/2022 02:52:17 - INFO - codeparrot_training - Step 38073: {'lr': 7.238071506095093e-05, 'samples': 19493888, 'steps': 38073, 'loss/train': 1.179553747177124} +02/26/2022 02:52:21 - INFO - codeparrot_training - Step 38074: {'lr': 7.236920084521981e-05, 'samples': 19494400, 'steps': 38074, 'loss/train': 2.299309015274048} +02/26/2022 02:52:26 - INFO - codeparrot_training - Step 38075: {'lr': 7.235768739040257e-05, 'samples': 19494912, 'steps': 38075, 'loss/train': 1.764549732208252} +02/26/2022 02:52:30 - INFO - codeparrot_training - Step 38076: {'lr': 7.234617469654866e-05, 'samples': 19495424, 'steps': 38076, 'loss/train': 1.7865841388702393} +02/26/2022 02:52:35 - INFO - codeparrot_training - Step 38077: {'lr': 7.233466276370735e-05, 'samples': 19495936, 'steps': 38077, 'loss/train': 1.5146217346191406} +02/26/2022 02:52:38 - INFO - codeparrot_training - Step 38078: {'lr': 7.232315159192793e-05, 'samples': 19496448, 'steps': 38078, 'loss/train': 2.66728138923645} +02/26/2022 02:52:44 - INFO - codeparrot_training - Step 38079: {'lr': 7.23116411812596e-05, 'samples': 19496960, 'steps': 38079, 'loss/train': 0.6679148077964783} +02/26/2022 02:52:48 - INFO - codeparrot_training - Step 38080: {'lr': 7.230013153175189e-05, 'samples': 19497472, 'steps': 38080, 'loss/train': 2.0153379440307617} +02/26/2022 02:52:53 - INFO - codeparrot_training - Step 38081: {'lr': 7.228862264345395e-05, 'samples': 19497984, 'steps': 38081, 'loss/train': 0.03077789396047592} +02/26/2022 02:52:57 - INFO - codeparrot_training - Step 38082: {'lr': 7.227711451641516e-05, 'samples': 19498496, 'steps': 38082, 'loss/train': 1.6509605646133423} +02/26/2022 02:53:02 - INFO - codeparrot_training - Step 38083: {'lr': 7.226560715068467e-05, 'samples': 19499008, 'steps': 38083, 'loss/train': 2.0321590900421143} +02/26/2022 02:53:06 - INFO - codeparrot_training - Step 38084: {'lr': 7.225410054631199e-05, 'samples': 19499520, 'steps': 38084, 'loss/train': 2.4848997592926025} +02/26/2022 02:53:12 - INFO - codeparrot_training - Step 38085: {'lr': 7.224259470334629e-05, 'samples': 19500032, 'steps': 38085, 'loss/train': 1.8340669870376587} +02/26/2022 02:53:16 - INFO - codeparrot_training - Step 38086: {'lr': 7.223108962183685e-05, 'samples': 19500544, 'steps': 38086, 'loss/train': 2.246068239212036} +02/26/2022 02:53:21 - INFO - codeparrot_training - Step 38087: {'lr': 7.221958530183293e-05, 'samples': 19501056, 'steps': 38087, 'loss/train': 0.7005888223648071} +02/26/2022 02:53:25 - INFO - codeparrot_training - Step 38088: {'lr': 7.22080817433839e-05, 'samples': 19501568, 'steps': 38088, 'loss/train': 0.1733948439359665} +02/26/2022 02:53:30 - INFO - codeparrot_training - Step 38089: {'lr': 7.2196578946539e-05, 'samples': 19502080, 'steps': 38089, 'loss/train': 2.106456756591797} +02/26/2022 02:53:34 - INFO - codeparrot_training - Step 38090: {'lr': 7.218507691134752e-05, 'samples': 19502592, 'steps': 38090, 'loss/train': 2.003767728805542} +02/26/2022 02:53:39 - INFO - codeparrot_training - Step 38091: {'lr': 7.21735756378587e-05, 'samples': 19503104, 'steps': 38091, 'loss/train': 1.810054063796997} +02/26/2022 02:53:43 - INFO - codeparrot_training - Step 38092: {'lr': 7.216207512612172e-05, 'samples': 19503616, 'steps': 38092, 'loss/train': 1.4031343460083008} +02/26/2022 02:53:48 - INFO - codeparrot_training - Step 38093: {'lr': 7.215057537618602e-05, 'samples': 19504128, 'steps': 38093, 'loss/train': 1.9758297204971313} +02/26/2022 02:53:52 - INFO - codeparrot_training - Step 38094: {'lr': 7.21390763881008e-05, 'samples': 19504640, 'steps': 38094, 'loss/train': 1.3060182332992554} +02/26/2022 02:53:57 - INFO - codeparrot_training - Step 38095: {'lr': 7.212757816191528e-05, 'samples': 19505152, 'steps': 38095, 'loss/train': 1.9382715225219727} +02/26/2022 02:54:01 - INFO - codeparrot_training - Step 38096: {'lr': 7.211608069767867e-05, 'samples': 19505664, 'steps': 38096, 'loss/train': 2.108659505844116} +02/26/2022 02:54:07 - INFO - codeparrot_training - Step 38097: {'lr': 7.210458399544037e-05, 'samples': 19506176, 'steps': 38097, 'loss/train': 2.769747257232666} +02/26/2022 02:54:11 - INFO - codeparrot_training - Step 38098: {'lr': 7.209308805524944e-05, 'samples': 19506688, 'steps': 38098, 'loss/train': 0.6523610353469849} +02/26/2022 02:54:16 - INFO - codeparrot_training - Step 38099: {'lr': 7.20815928771554e-05, 'samples': 19507200, 'steps': 38099, 'loss/train': 1.8880488872528076} +02/26/2022 02:54:20 - INFO - codeparrot_training - Step 38100: {'lr': 7.207009846120718e-05, 'samples': 19507712, 'steps': 38100, 'loss/train': 0.9422760009765625} +02/26/2022 02:54:25 - INFO - codeparrot_training - Step 38101: {'lr': 7.205860480745422e-05, 'samples': 19508224, 'steps': 38101, 'loss/train': 2.408179759979248} +02/26/2022 02:54:29 - INFO - codeparrot_training - Step 38102: {'lr': 7.204711191594562e-05, 'samples': 19508736, 'steps': 38102, 'loss/train': 2.15340518951416} +02/26/2022 02:54:34 - INFO - codeparrot_training - Step 38103: {'lr': 7.203561978673085e-05, 'samples': 19509248, 'steps': 38103, 'loss/train': 1.6576495170593262} +02/26/2022 02:54:38 - INFO - codeparrot_training - Step 38104: {'lr': 7.202412841985879e-05, 'samples': 19509760, 'steps': 38104, 'loss/train': 2.358712673187256} +02/26/2022 02:54:43 - INFO - codeparrot_training - Step 38105: {'lr': 7.201263781537895e-05, 'samples': 19510272, 'steps': 38105, 'loss/train': 1.4066082239151} +02/26/2022 02:54:47 - INFO - codeparrot_training - Step 38106: {'lr': 7.200114797334037e-05, 'samples': 19510784, 'steps': 38106, 'loss/train': 1.8579227924346924} +02/26/2022 02:54:53 - INFO - codeparrot_training - Step 38107: {'lr': 7.198965889379253e-05, 'samples': 19511296, 'steps': 38107, 'loss/train': 1.561664342880249} +02/26/2022 02:54:57 - INFO - codeparrot_training - Step 38108: {'lr': 7.197817057678427e-05, 'samples': 19511808, 'steps': 38108, 'loss/train': 1.1147043704986572} +02/26/2022 02:55:02 - INFO - codeparrot_training - Step 38109: {'lr': 7.196668302236509e-05, 'samples': 19512320, 'steps': 38109, 'loss/train': 2.020216941833496} +02/26/2022 02:55:06 - INFO - codeparrot_training - Step 38110: {'lr': 7.195519623058405e-05, 'samples': 19512832, 'steps': 38110, 'loss/train': 2.7649996280670166} +02/26/2022 02:55:11 - INFO - codeparrot_training - Step 38111: {'lr': 7.194371020149048e-05, 'samples': 19513344, 'steps': 38111, 'loss/train': 1.8314980268478394} +02/26/2022 02:55:15 - INFO - codeparrot_training - Step 38112: {'lr': 7.193222493513352e-05, 'samples': 19513856, 'steps': 38112, 'loss/train': 2.3585622310638428} +02/26/2022 02:55:20 - INFO - codeparrot_training - Step 38113: {'lr': 7.192074043156235e-05, 'samples': 19514368, 'steps': 38113, 'loss/train': 1.9599764347076416} +02/26/2022 02:55:24 - INFO - codeparrot_training - Step 38114: {'lr': 7.190925669082613e-05, 'samples': 19514880, 'steps': 38114, 'loss/train': 1.68540358543396} +02/26/2022 02:55:29 - INFO - codeparrot_training - Step 38115: {'lr': 7.189777371297415e-05, 'samples': 19515392, 'steps': 38115, 'loss/train': 1.7949540615081787} +02/26/2022 02:55:35 - INFO - codeparrot_training - Step 38116: {'lr': 7.188629149805556e-05, 'samples': 19515904, 'steps': 38116, 'loss/train': 1.2822867631912231} +02/26/2022 02:55:38 - INFO - codeparrot_training - Step 38117: {'lr': 7.187481004611956e-05, 'samples': 19516416, 'steps': 38117, 'loss/train': 0.1690545529127121} +02/26/2022 02:55:44 - INFO - codeparrot_training - Step 38118: {'lr': 7.18633293572152e-05, 'samples': 19516928, 'steps': 38118, 'loss/train': 1.5017328262329102} +02/26/2022 02:55:47 - INFO - codeparrot_training - Step 38119: {'lr': 7.18518494313919e-05, 'samples': 19517440, 'steps': 38119, 'loss/train': 1.8454328775405884} +02/26/2022 02:55:54 - INFO - codeparrot_training - Step 38120: {'lr': 7.184037026869867e-05, 'samples': 19517952, 'steps': 38120, 'loss/train': 1.5571293830871582} +02/26/2022 02:55:57 - INFO - codeparrot_training - Step 38121: {'lr': 7.182889186918474e-05, 'samples': 19518464, 'steps': 38121, 'loss/train': 2.341313600540161} +02/26/2022 02:56:01 - INFO - codeparrot_training - Step 38122: {'lr': 7.181741423289917e-05, 'samples': 19518976, 'steps': 38122, 'loss/train': 2.2340619564056396} +02/26/2022 02:56:06 - INFO - codeparrot_training - Step 38123: {'lr': 7.180593735989129e-05, 'samples': 19519488, 'steps': 38123, 'loss/train': 1.768855333328247} +02/26/2022 02:56:10 - INFO - codeparrot_training - Step 38124: {'lr': 7.179446125021022e-05, 'samples': 19520000, 'steps': 38124, 'loss/train': 2.415536880493164} +02/26/2022 02:56:15 - INFO - codeparrot_training - Step 38125: {'lr': 7.178298590390509e-05, 'samples': 19520512, 'steps': 38125, 'loss/train': 2.193103075027466} +02/26/2022 02:56:19 - INFO - codeparrot_training - Step 38126: {'lr': 7.177151132102496e-05, 'samples': 19521024, 'steps': 38126, 'loss/train': 1.5276339054107666} +02/26/2022 02:56:25 - INFO - codeparrot_training - Step 38127: {'lr': 7.176003750161916e-05, 'samples': 19521536, 'steps': 38127, 'loss/train': 1.4621673822402954} +02/26/2022 02:56:28 - INFO - codeparrot_training - Step 38128: {'lr': 7.174856444573676e-05, 'samples': 19522048, 'steps': 38128, 'loss/train': 1.3434168100357056} +02/26/2022 02:56:32 - INFO - codeparrot_training - Step 38129: {'lr': 7.173709215342695e-05, 'samples': 19522560, 'steps': 38129, 'loss/train': 0.39635080099105835} +02/26/2022 02:56:37 - INFO - codeparrot_training - Step 38130: {'lr': 7.17256206247387e-05, 'samples': 19523072, 'steps': 38130, 'loss/train': 2.165515899658203} +02/26/2022 02:56:41 - INFO - codeparrot_training - Step 38131: {'lr': 7.171414985972138e-05, 'samples': 19523584, 'steps': 38131, 'loss/train': 1.5523850917816162} +02/26/2022 02:56:48 - INFO - codeparrot_training - Step 38132: {'lr': 7.170267985842405e-05, 'samples': 19524096, 'steps': 38132, 'loss/train': 1.6655939817428589} +02/26/2022 02:56:52 - INFO - codeparrot_training - Step 38133: {'lr': 7.169121062089578e-05, 'samples': 19524608, 'steps': 38133, 'loss/train': 1.7885385751724243} +02/26/2022 02:56:57 - INFO - codeparrot_training - Step 38134: {'lr': 7.16797421471857e-05, 'samples': 19525120, 'steps': 38134, 'loss/train': 1.0705183744430542} +02/26/2022 02:57:03 - INFO - codeparrot_training - Step 38135: {'lr': 7.166827443734306e-05, 'samples': 19525632, 'steps': 38135, 'loss/train': 1.5479942560195923} +02/26/2022 02:57:06 - INFO - codeparrot_training - Step 38136: {'lr': 7.165680749141689e-05, 'samples': 19526144, 'steps': 38136, 'loss/train': 2.13727068901062} +02/26/2022 02:57:12 - INFO - codeparrot_training - Step 38137: {'lr': 7.164534130945624e-05, 'samples': 19526656, 'steps': 38137, 'loss/train': 0.5930886268615723} +02/26/2022 02:57:15 - INFO - codeparrot_training - Step 38138: {'lr': 7.16338758915105e-05, 'samples': 19527168, 'steps': 38138, 'loss/train': 0.3744605779647827} +02/26/2022 02:57:21 - INFO - codeparrot_training - Step 38139: {'lr': 7.162241123762841e-05, 'samples': 19527680, 'steps': 38139, 'loss/train': 0.6163443326950073} +02/26/2022 02:57:24 - INFO - codeparrot_training - Step 38140: {'lr': 7.16109473478594e-05, 'samples': 19528192, 'steps': 38140, 'loss/train': 2.636695384979248} +02/26/2022 02:57:32 - INFO - codeparrot_training - Step 38141: {'lr': 7.159948422225232e-05, 'samples': 19528704, 'steps': 38141, 'loss/train': 2.381225109100342} +02/26/2022 02:57:35 - INFO - codeparrot_training - Step 38142: {'lr': 7.158802186085656e-05, 'samples': 19529216, 'steps': 38142, 'loss/train': 1.7457891702651978} +02/26/2022 02:57:41 - INFO - codeparrot_training - Step 38143: {'lr': 7.157656026372092e-05, 'samples': 19529728, 'steps': 38143, 'loss/train': 1.2105522155761719} +02/26/2022 02:57:44 - INFO - codeparrot_training - Step 38144: {'lr': 7.156509943089471e-05, 'samples': 19530240, 'steps': 38144, 'loss/train': 1.0127432346343994} +02/26/2022 02:57:50 - INFO - codeparrot_training - Step 38145: {'lr': 7.155363936242686e-05, 'samples': 19530752, 'steps': 38145, 'loss/train': 1.8298380374908447} +02/26/2022 02:57:53 - INFO - codeparrot_training - Step 38146: {'lr': 7.154218005836668e-05, 'samples': 19531264, 'steps': 38146, 'loss/train': 1.9088324308395386} +02/26/2022 02:57:59 - INFO - codeparrot_training - Step 38147: {'lr': 7.153072151876311e-05, 'samples': 19531776, 'steps': 38147, 'loss/train': 0.6606325507164001} +02/26/2022 02:58:02 - INFO - codeparrot_training - Step 38148: {'lr': 7.151926374366524e-05, 'samples': 19532288, 'steps': 38148, 'loss/train': 1.7188962697982788} +02/26/2022 02:58:08 - INFO - codeparrot_training - Step 38149: {'lr': 7.150780673312212e-05, 'samples': 19532800, 'steps': 38149, 'loss/train': 2.3273098468780518} +02/26/2022 02:58:11 - INFO - codeparrot_training - Step 38150: {'lr': 7.149635048718294e-05, 'samples': 19533312, 'steps': 38150, 'loss/train': 2.488645315170288} +02/26/2022 02:58:17 - INFO - codeparrot_training - Step 38151: {'lr': 7.148489500589673e-05, 'samples': 19533824, 'steps': 38151, 'loss/train': 3.1085617542266846} +02/26/2022 02:58:20 - INFO - codeparrot_training - Step 38152: {'lr': 7.147344028931252e-05, 'samples': 19534336, 'steps': 38152, 'loss/train': 2.4928834438323975} +02/26/2022 02:58:24 - INFO - codeparrot_training - Step 38153: {'lr': 7.146198633747936e-05, 'samples': 19534848, 'steps': 38153, 'loss/train': 1.8379136323928833} +02/26/2022 02:58:31 - INFO - codeparrot_training - Step 38154: {'lr': 7.145053315044639e-05, 'samples': 19535360, 'steps': 38154, 'loss/train': 1.7272346019744873} +02/26/2022 02:58:34 - INFO - codeparrot_training - Step 38155: {'lr': 7.143908072826269e-05, 'samples': 19535872, 'steps': 38155, 'loss/train': 0.97761070728302} +02/26/2022 02:58:40 - INFO - codeparrot_training - Step 38156: {'lr': 7.142762907097721e-05, 'samples': 19536384, 'steps': 38156, 'loss/train': 1.1927820444107056} +02/26/2022 02:58:46 - INFO - codeparrot_training - Step 38157: {'lr': 7.141617817863905e-05, 'samples': 19536896, 'steps': 38157, 'loss/train': 1.2962172031402588} +02/26/2022 02:58:49 - INFO - codeparrot_training - Step 38158: {'lr': 7.14047280512973e-05, 'samples': 19537408, 'steps': 38158, 'loss/train': 1.986090898513794} +02/26/2022 02:58:53 - INFO - codeparrot_training - Step 38159: {'lr': 7.139327868900094e-05, 'samples': 19537920, 'steps': 38159, 'loss/train': 1.7715954780578613} +02/26/2022 02:58:58 - INFO - codeparrot_training - Step 38160: {'lr': 7.138183009179921e-05, 'samples': 19538432, 'steps': 38160, 'loss/train': 0.8882639408111572} +02/26/2022 02:59:04 - INFO - codeparrot_training - Step 38161: {'lr': 7.137038225974085e-05, 'samples': 19538944, 'steps': 38161, 'loss/train': 1.5299500226974487} +02/26/2022 02:59:07 - INFO - codeparrot_training - Step 38162: {'lr': 7.135893519287512e-05, 'samples': 19539456, 'steps': 38162, 'loss/train': 0.7520651817321777} +02/26/2022 02:59:15 - INFO - codeparrot_training - Step 38163: {'lr': 7.13474888912509e-05, 'samples': 19539968, 'steps': 38163, 'loss/train': 1.6187598705291748} +02/26/2022 02:59:18 - INFO - codeparrot_training - Step 38164: {'lr': 7.133604335491747e-05, 'samples': 19540480, 'steps': 38164, 'loss/train': 0.7635990381240845} +02/26/2022 02:59:24 - INFO - codeparrot_training - Step 38165: {'lr': 7.132459858392357e-05, 'samples': 19540992, 'steps': 38165, 'loss/train': 1.7196338176727295} +02/26/2022 02:59:27 - INFO - codeparrot_training - Step 38166: {'lr': 7.131315457831841e-05, 'samples': 19541504, 'steps': 38166, 'loss/train': 2.479658365249634} +02/26/2022 02:59:33 - INFO - codeparrot_training - Step 38167: {'lr': 7.130171133815086e-05, 'samples': 19542016, 'steps': 38167, 'loss/train': 1.700913667678833} +02/26/2022 02:59:36 - INFO - codeparrot_training - Step 38168: {'lr': 7.12902688634702e-05, 'samples': 19542528, 'steps': 38168, 'loss/train': 3.29341721534729} +02/26/2022 02:59:42 - INFO - codeparrot_training - Step 38169: {'lr': 7.127882715432515e-05, 'samples': 19543040, 'steps': 38169, 'loss/train': 1.369329571723938} +02/26/2022 02:59:45 - INFO - codeparrot_training - Step 38170: {'lr': 7.126738621076493e-05, 'samples': 19543552, 'steps': 38170, 'loss/train': 0.4311719834804535} +02/26/2022 02:59:51 - INFO - codeparrot_training - Step 38171: {'lr': 7.125594603283845e-05, 'samples': 19544064, 'steps': 38171, 'loss/train': 1.105877161026001} +02/26/2022 02:59:54 - INFO - codeparrot_training - Step 38172: {'lr': 7.124450662059468e-05, 'samples': 19544576, 'steps': 38172, 'loss/train': 1.7536799907684326} +02/26/2022 03:00:00 - INFO - codeparrot_training - Step 38173: {'lr': 7.123306797408274e-05, 'samples': 19545088, 'steps': 38173, 'loss/train': 1.8302478790283203} +02/26/2022 03:00:03 - INFO - codeparrot_training - Step 38174: {'lr': 7.122163009335159e-05, 'samples': 19545600, 'steps': 38174, 'loss/train': 0.6642072796821594} +02/26/2022 03:00:09 - INFO - codeparrot_training - Step 38175: {'lr': 7.121019297845019e-05, 'samples': 19546112, 'steps': 38175, 'loss/train': 1.7727161645889282} +02/26/2022 03:00:12 - INFO - codeparrot_training - Step 38176: {'lr': 7.119875662942748e-05, 'samples': 19546624, 'steps': 38176, 'loss/train': 1.3386083841323853} +02/26/2022 03:00:20 - INFO - codeparrot_training - Step 38177: {'lr': 7.11873210463326e-05, 'samples': 19547136, 'steps': 38177, 'loss/train': 1.9967362880706787} +02/26/2022 03:00:23 - INFO - codeparrot_training - Step 38178: {'lr': 7.117588622921448e-05, 'samples': 19547648, 'steps': 38178, 'loss/train': 1.3029136657714844} +02/26/2022 03:00:27 - INFO - codeparrot_training - Step 38179: {'lr': 7.116445217812207e-05, 'samples': 19548160, 'steps': 38179, 'loss/train': 1.8939669132232666} +02/26/2022 03:00:32 - INFO - codeparrot_training - Step 38180: {'lr': 7.115301889310427e-05, 'samples': 19548672, 'steps': 38180, 'loss/train': 1.8544868230819702} +02/26/2022 03:00:36 - INFO - codeparrot_training - Step 38181: {'lr': 7.114158637421023e-05, 'samples': 19549184, 'steps': 38181, 'loss/train': 1.6866735219955444} +02/26/2022 03:00:41 - INFO - codeparrot_training - Step 38182: {'lr': 7.113015462148884e-05, 'samples': 19549696, 'steps': 38182, 'loss/train': 1.9695546627044678} +02/26/2022 03:00:45 - INFO - codeparrot_training - Step 38183: {'lr': 7.111872363498905e-05, 'samples': 19550208, 'steps': 38183, 'loss/train': 3.7168359756469727} +02/26/2022 03:00:50 - INFO - codeparrot_training - Step 38184: {'lr': 7.11072934147598e-05, 'samples': 19550720, 'steps': 38184, 'loss/train': 1.8615844249725342} +02/26/2022 03:00:54 - INFO - codeparrot_training - Step 38185: {'lr': 7.109586396085016e-05, 'samples': 19551232, 'steps': 38185, 'loss/train': 2.2218596935272217} +02/26/2022 03:00:59 - INFO - codeparrot_training - Step 38186: {'lr': 7.108443527330904e-05, 'samples': 19551744, 'steps': 38186, 'loss/train': 1.7533131837844849} +02/26/2022 03:01:03 - INFO - codeparrot_training - Step 38187: {'lr': 7.107300735218539e-05, 'samples': 19552256, 'steps': 38187, 'loss/train': 1.4288514852523804} +02/26/2022 03:01:08 - INFO - codeparrot_training - Step 38188: {'lr': 7.106158019752806e-05, 'samples': 19552768, 'steps': 38188, 'loss/train': 1.6369614601135254} +02/26/2022 03:01:12 - INFO - codeparrot_training - Step 38189: {'lr': 7.10501538093862e-05, 'samples': 19553280, 'steps': 38189, 'loss/train': 1.2787474393844604} +02/26/2022 03:01:19 - INFO - codeparrot_training - Step 38190: {'lr': 7.103872818780866e-05, 'samples': 19553792, 'steps': 38190, 'loss/train': 1.8749148845672607} +02/26/2022 03:01:22 - INFO - codeparrot_training - Step 38191: {'lr': 7.102730333284438e-05, 'samples': 19554304, 'steps': 38191, 'loss/train': 2.030489444732666} +02/26/2022 03:01:28 - INFO - codeparrot_training - Step 38192: {'lr': 7.10158792445422e-05, 'samples': 19554816, 'steps': 38192, 'loss/train': 1.023307204246521} +02/26/2022 03:01:34 - INFO - codeparrot_training - Step 38193: {'lr': 7.100445592295126e-05, 'samples': 19555328, 'steps': 38193, 'loss/train': 1.9115947484970093} +02/26/2022 03:01:37 - INFO - codeparrot_training - Step 38194: {'lr': 7.099303336812032e-05, 'samples': 19555840, 'steps': 38194, 'loss/train': 1.884045124053955} +02/26/2022 03:01:43 - INFO - codeparrot_training - Step 38195: {'lr': 7.098161158009853e-05, 'samples': 19556352, 'steps': 38195, 'loss/train': 1.5298393964767456} +02/26/2022 03:01:46 - INFO - codeparrot_training - Step 38196: {'lr': 7.097019055893452e-05, 'samples': 19556864, 'steps': 38196, 'loss/train': 1.0842851400375366} +02/26/2022 03:01:52 - INFO - codeparrot_training - Step 38197: {'lr': 7.095877030467743e-05, 'samples': 19557376, 'steps': 38197, 'loss/train': 0.9352651238441467} +02/26/2022 03:01:55 - INFO - codeparrot_training - Step 38198: {'lr': 7.094735081737605e-05, 'samples': 19557888, 'steps': 38198, 'loss/train': 1.6735531091690063} +02/26/2022 03:02:02 - INFO - codeparrot_training - Step 38199: {'lr': 7.093593209707952e-05, 'samples': 19558400, 'steps': 38199, 'loss/train': 0.9866325259208679} +02/26/2022 03:02:06 - INFO - codeparrot_training - Step 38200: {'lr': 7.092451414383643e-05, 'samples': 19558912, 'steps': 38200, 'loss/train': 0.46933799982070923} +02/26/2022 03:02:12 - INFO - codeparrot_training - Step 38201: {'lr': 7.091309695769596e-05, 'samples': 19559424, 'steps': 38201, 'loss/train': 2.1038448810577393} +02/26/2022 03:02:15 - INFO - codeparrot_training - Step 38202: {'lr': 7.090168053870683e-05, 'samples': 19559936, 'steps': 38202, 'loss/train': 2.31260085105896} +02/26/2022 03:02:19 - INFO - codeparrot_training - Step 38203: {'lr': 7.089026488691817e-05, 'samples': 19560448, 'steps': 38203, 'loss/train': 2.04152250289917} +02/26/2022 03:02:24 - INFO - codeparrot_training - Step 38204: {'lr': 7.087885000237859e-05, 'samples': 19560960, 'steps': 38204, 'loss/train': 1.5692404508590698} +02/26/2022 03:02:28 - INFO - codeparrot_training - Step 38205: {'lr': 7.086743588513723e-05, 'samples': 19561472, 'steps': 38205, 'loss/train': 1.3013707399368286} +02/26/2022 03:02:33 - INFO - codeparrot_training - Step 38206: {'lr': 7.085602253524281e-05, 'samples': 19561984, 'steps': 38206, 'loss/train': 1.498496174812317} +02/26/2022 03:02:37 - INFO - codeparrot_training - Step 38207: {'lr': 7.084460995274439e-05, 'samples': 19562496, 'steps': 38207, 'loss/train': 1.7957921028137207} +02/26/2022 03:02:42 - INFO - codeparrot_training - Step 38208: {'lr': 7.083319813769076e-05, 'samples': 19563008, 'steps': 38208, 'loss/train': 0.141988143324852} +02/26/2022 03:02:46 - INFO - codeparrot_training - Step 38209: {'lr': 7.082178709013082e-05, 'samples': 19563520, 'steps': 38209, 'loss/train': 1.4009586572647095} +02/26/2022 03:02:53 - INFO - codeparrot_training - Step 38210: {'lr': 7.081037681011338e-05, 'samples': 19564032, 'steps': 38210, 'loss/train': 2.7622272968292236} +02/26/2022 03:02:56 - INFO - codeparrot_training - Step 38211: {'lr': 7.079896729768745e-05, 'samples': 19564544, 'steps': 38211, 'loss/train': 1.6070525646209717} +02/26/2022 03:03:02 - INFO - codeparrot_training - Step 38212: {'lr': 7.078755855290183e-05, 'samples': 19565056, 'steps': 38212, 'loss/train': 1.5549302101135254} +02/26/2022 03:03:05 - INFO - codeparrot_training - Step 38213: {'lr': 7.077615057580545e-05, 'samples': 19565568, 'steps': 38213, 'loss/train': 0.098085917532444} +02/26/2022 03:03:11 - INFO - codeparrot_training - Step 38214: {'lr': 7.0764743366447e-05, 'samples': 19566080, 'steps': 38214, 'loss/train': 2.2977380752563477} +02/26/2022 03:03:14 - INFO - codeparrot_training - Step 38215: {'lr': 7.075333692487559e-05, 'samples': 19566592, 'steps': 38215, 'loss/train': 1.908610463142395} +02/26/2022 03:03:20 - INFO - codeparrot_training - Step 38216: {'lr': 7.074193125113996e-05, 'samples': 19567104, 'steps': 38216, 'loss/train': 1.382575273513794} +02/26/2022 03:03:23 - INFO - codeparrot_training - Step 38217: {'lr': 7.073052634528898e-05, 'samples': 19567616, 'steps': 38217, 'loss/train': 2.211209774017334} +02/26/2022 03:03:29 - INFO - codeparrot_training - Step 38218: {'lr': 7.071912220737147e-05, 'samples': 19568128, 'steps': 38218, 'loss/train': 1.5111160278320312} +02/26/2022 03:03:32 - INFO - codeparrot_training - Step 38219: {'lr': 7.070771883743626e-05, 'samples': 19568640, 'steps': 38219, 'loss/train': 2.004314422607422} +02/26/2022 03:03:40 - INFO - codeparrot_training - Step 38220: {'lr': 7.069631623553232e-05, 'samples': 19569152, 'steps': 38220, 'loss/train': 0.437398761510849} +02/26/2022 03:03:43 - INFO - codeparrot_training - Step 38221: {'lr': 7.068491440170843e-05, 'samples': 19569664, 'steps': 38221, 'loss/train': 1.8562313318252563} +02/26/2022 03:03:49 - INFO - codeparrot_training - Step 38222: {'lr': 7.067351333601343e-05, 'samples': 19570176, 'steps': 38222, 'loss/train': 1.1736711263656616} +02/26/2022 03:03:52 - INFO - codeparrot_training - Step 38223: {'lr': 7.06621130384961e-05, 'samples': 19570688, 'steps': 38223, 'loss/train': 1.7102985382080078} +02/26/2022 03:03:58 - INFO - codeparrot_training - Step 38224: {'lr': 7.065071350920538e-05, 'samples': 19571200, 'steps': 38224, 'loss/train': 0.5994188785552979} +02/26/2022 03:04:01 - INFO - codeparrot_training - Step 38225: {'lr': 7.063931474819005e-05, 'samples': 19571712, 'steps': 38225, 'loss/train': 2.1661248207092285} +02/26/2022 03:04:07 - INFO - codeparrot_training - Step 38226: {'lr': 7.062791675549896e-05, 'samples': 19572224, 'steps': 38226, 'loss/train': 2.3120572566986084} +02/26/2022 03:04:10 - INFO - codeparrot_training - Step 38227: {'lr': 7.061651953118084e-05, 'samples': 19572736, 'steps': 38227, 'loss/train': 2.0443308353424072} +02/26/2022 03:04:16 - INFO - codeparrot_training - Step 38228: {'lr': 7.060512307528466e-05, 'samples': 19573248, 'steps': 38228, 'loss/train': 1.6328598260879517} +02/26/2022 03:04:19 - INFO - codeparrot_training - Step 38229: {'lr': 7.059372738785915e-05, 'samples': 19573760, 'steps': 38229, 'loss/train': 3.0696194171905518} +02/26/2022 03:04:25 - INFO - codeparrot_training - Step 38230: {'lr': 7.058233246895315e-05, 'samples': 19574272, 'steps': 38230, 'loss/train': 1.9886451959609985} +02/26/2022 03:04:28 - INFO - codeparrot_training - Step 38231: {'lr': 7.057093831861542e-05, 'samples': 19574784, 'steps': 38231, 'loss/train': 0.9862726926803589} +02/26/2022 03:04:34 - INFO - codeparrot_training - Step 38232: {'lr': 7.055954493689487e-05, 'samples': 19575296, 'steps': 38232, 'loss/train': 2.040212392807007} +02/26/2022 03:04:37 - INFO - codeparrot_training - Step 38233: {'lr': 7.054815232384018e-05, 'samples': 19575808, 'steps': 38233, 'loss/train': 1.2924765348434448} +02/26/2022 03:04:43 - INFO - codeparrot_training - Step 38234: {'lr': 7.053676047950037e-05, 'samples': 19576320, 'steps': 38234, 'loss/train': 2.6697871685028076} +02/26/2022 03:04:46 - INFO - codeparrot_training - Step 38235: {'lr': 7.052536940392393e-05, 'samples': 19576832, 'steps': 38235, 'loss/train': 1.3289813995361328} +02/26/2022 03:04:54 - INFO - codeparrot_training - Step 38236: {'lr': 7.051397909715992e-05, 'samples': 19577344, 'steps': 38236, 'loss/train': 1.9227101802825928} +02/26/2022 03:04:57 - INFO - codeparrot_training - Step 38237: {'lr': 7.050258955925692e-05, 'samples': 19577856, 'steps': 38237, 'loss/train': 1.0109972953796387} +02/26/2022 03:05:02 - INFO - codeparrot_training - Step 38238: {'lr': 7.049120079026403e-05, 'samples': 19578368, 'steps': 38238, 'loss/train': 0.5722323656082153} +02/26/2022 03:05:06 - INFO - codeparrot_training - Step 38239: {'lr': 7.047981279022964e-05, 'samples': 19578880, 'steps': 38239, 'loss/train': 2.2172272205352783} +02/26/2022 03:05:11 - INFO - codeparrot_training - Step 38240: {'lr': 7.046842555920283e-05, 'samples': 19579392, 'steps': 38240, 'loss/train': 2.937234878540039} +02/26/2022 03:05:15 - INFO - codeparrot_training - Step 38241: {'lr': 7.04570390972322e-05, 'samples': 19579904, 'steps': 38241, 'loss/train': 0.5131740570068359} +02/26/2022 03:05:20 - INFO - codeparrot_training - Step 38242: {'lr': 7.044565340436664e-05, 'samples': 19580416, 'steps': 38242, 'loss/train': 1.65739107131958} +02/26/2022 03:05:24 - INFO - codeparrot_training - Step 38243: {'lr': 7.043426848065493e-05, 'samples': 19580928, 'steps': 38243, 'loss/train': 1.4585521221160889} +02/26/2022 03:05:29 - INFO - codeparrot_training - Step 38244: {'lr': 7.042288432614577e-05, 'samples': 19581440, 'steps': 38244, 'loss/train': 1.4854989051818848} +02/26/2022 03:05:33 - INFO - codeparrot_training - Step 38245: {'lr': 7.041150094088788e-05, 'samples': 19581952, 'steps': 38245, 'loss/train': 1.4963589906692505} +02/26/2022 03:05:40 - INFO - codeparrot_training - Step 38246: {'lr': 7.040011832493021e-05, 'samples': 19582464, 'steps': 38246, 'loss/train': 1.304911494255066} +02/26/2022 03:05:43 - INFO - codeparrot_training - Step 38247: {'lr': 7.038873647832137e-05, 'samples': 19582976, 'steps': 38247, 'loss/train': 0.5257362723350525} +02/26/2022 03:05:49 - INFO - codeparrot_training - Step 38248: {'lr': 7.037735540111015e-05, 'samples': 19583488, 'steps': 38248, 'loss/train': 2.09340763092041} +02/26/2022 03:05:52 - INFO - codeparrot_training - Step 38249: {'lr': 7.036597509334521e-05, 'samples': 19584000, 'steps': 38249, 'loss/train': 1.0398221015930176} +02/26/2022 03:05:58 - INFO - codeparrot_training - Step 38250: {'lr': 7.035459555507548e-05, 'samples': 19584512, 'steps': 38250, 'loss/train': 0.8158255219459534} +02/26/2022 03:06:01 - INFO - codeparrot_training - Step 38251: {'lr': 7.034321678634964e-05, 'samples': 19585024, 'steps': 38251, 'loss/train': 0.887293815612793} +02/26/2022 03:06:07 - INFO - codeparrot_training - Step 38252: {'lr': 7.033183878721639e-05, 'samples': 19585536, 'steps': 38252, 'loss/train': 1.9078387022018433} +02/26/2022 03:06:12 - INFO - codeparrot_training - Step 38253: {'lr': 7.032046155772442e-05, 'samples': 19586048, 'steps': 38253, 'loss/train': 2.415226697921753} +02/26/2022 03:06:16 - INFO - codeparrot_training - Step 38254: {'lr': 7.030908509792261e-05, 'samples': 19586560, 'steps': 38254, 'loss/train': 0.4588976204395294} +02/26/2022 03:06:23 - INFO - codeparrot_training - Step 38255: {'lr': 7.029770940785963e-05, 'samples': 19587072, 'steps': 38255, 'loss/train': 2.852640151977539} +02/26/2022 03:06:26 - INFO - codeparrot_training - Step 38256: {'lr': 7.028633448758421e-05, 'samples': 19587584, 'steps': 38256, 'loss/train': 1.6801319122314453} +02/26/2022 03:06:32 - INFO - codeparrot_training - Step 38257: {'lr': 7.027496033714498e-05, 'samples': 19588096, 'steps': 38257, 'loss/train': 1.0426446199417114} +02/26/2022 03:06:35 - INFO - codeparrot_training - Step 38258: {'lr': 7.026358695659082e-05, 'samples': 19588608, 'steps': 38258, 'loss/train': 2.1895763874053955} +02/26/2022 03:06:41 - INFO - codeparrot_training - Step 38259: {'lr': 7.025221434597037e-05, 'samples': 19589120, 'steps': 38259, 'loss/train': 1.5701831579208374} +02/26/2022 03:06:45 - INFO - codeparrot_training - Step 38260: {'lr': 7.024084250533239e-05, 'samples': 19589632, 'steps': 38260, 'loss/train': 0.7637211084365845} +02/26/2022 03:06:50 - INFO - codeparrot_training - Step 38261: {'lr': 7.022947143472547e-05, 'samples': 19590144, 'steps': 38261, 'loss/train': 1.3565819263458252} +02/26/2022 03:06:54 - INFO - codeparrot_training - Step 38262: {'lr': 7.02181011341985e-05, 'samples': 19590656, 'steps': 38262, 'loss/train': 2.545463800430298} +02/26/2022 03:06:59 - INFO - codeparrot_training - Step 38263: {'lr': 7.020673160380006e-05, 'samples': 19591168, 'steps': 38263, 'loss/train': 2.026808500289917} +02/26/2022 03:07:03 - INFO - codeparrot_training - Step 38264: {'lr': 7.019536284357891e-05, 'samples': 19591680, 'steps': 38264, 'loss/train': 1.3249893188476562} +02/26/2022 03:07:10 - INFO - codeparrot_training - Step 38265: {'lr': 7.018399485358367e-05, 'samples': 19592192, 'steps': 38265, 'loss/train': 1.671152114868164} +02/26/2022 03:07:13 - INFO - codeparrot_training - Step 38266: {'lr': 7.017262763386317e-05, 'samples': 19592704, 'steps': 38266, 'loss/train': 2.67478084564209} +02/26/2022 03:07:19 - INFO - codeparrot_training - Step 38267: {'lr': 7.016126118446603e-05, 'samples': 19593216, 'steps': 38267, 'loss/train': 1.779833197593689} +02/26/2022 03:07:22 - INFO - codeparrot_training - Step 38268: {'lr': 7.014989550544085e-05, 'samples': 19593728, 'steps': 38268, 'loss/train': 1.939889669418335} +02/26/2022 03:07:28 - INFO - codeparrot_training - Step 38269: {'lr': 7.013853059683655e-05, 'samples': 19594240, 'steps': 38269, 'loss/train': 2.837552785873413} +02/26/2022 03:07:32 - INFO - codeparrot_training - Step 38270: {'lr': 7.012716645870157e-05, 'samples': 19594752, 'steps': 38270, 'loss/train': 1.5576125383377075} +02/26/2022 03:07:37 - INFO - codeparrot_training - Step 38271: {'lr': 7.011580309108472e-05, 'samples': 19595264, 'steps': 38271, 'loss/train': 1.4813158512115479} +02/26/2022 03:07:41 - INFO - codeparrot_training - Step 38272: {'lr': 7.01044404940346e-05, 'samples': 19595776, 'steps': 38272, 'loss/train': 2.7505342960357666} +02/26/2022 03:07:46 - INFO - codeparrot_training - Step 38273: {'lr': 7.009307866760008e-05, 'samples': 19596288, 'steps': 38273, 'loss/train': 1.6960562467575073} +02/26/2022 03:07:50 - INFO - codeparrot_training - Step 38274: {'lr': 7.008171761182955e-05, 'samples': 19596800, 'steps': 38274, 'loss/train': 2.1555190086364746} +02/26/2022 03:07:55 - INFO - codeparrot_training - Step 38275: {'lr': 7.007035732677186e-05, 'samples': 19597312, 'steps': 38275, 'loss/train': 2.4800174236297607} +02/26/2022 03:07:59 - INFO - codeparrot_training - Step 38276: {'lr': 7.005899781247557e-05, 'samples': 19597824, 'steps': 38276, 'loss/train': 2.0562477111816406} +02/26/2022 03:08:04 - INFO - codeparrot_training - Step 38277: {'lr': 7.004763906898953e-05, 'samples': 19598336, 'steps': 38277, 'loss/train': 1.5696412324905396} +02/26/2022 03:08:08 - INFO - codeparrot_training - Step 38278: {'lr': 7.003628109636212e-05, 'samples': 19598848, 'steps': 38278, 'loss/train': 1.393474817276001} +02/26/2022 03:08:13 - INFO - codeparrot_training - Step 38279: {'lr': 7.00249238946422e-05, 'samples': 19599360, 'steps': 38279, 'loss/train': 1.925711989402771} +02/26/2022 03:08:17 - INFO - codeparrot_training - Step 38280: {'lr': 7.001356746387829e-05, 'samples': 19599872, 'steps': 38280, 'loss/train': 1.9334263801574707} +02/26/2022 03:08:22 - INFO - codeparrot_training - Step 38281: {'lr': 7.00022118041192e-05, 'samples': 19600384, 'steps': 38281, 'loss/train': 1.6700961589813232} +02/26/2022 03:08:26 - INFO - codeparrot_training - Step 38282: {'lr': 6.999085691541346e-05, 'samples': 19600896, 'steps': 38282, 'loss/train': 1.2895236015319824} +02/26/2022 03:08:33 - INFO - codeparrot_training - Step 38283: {'lr': 6.997950279780974e-05, 'samples': 19601408, 'steps': 38283, 'loss/train': 1.5613279342651367} +02/26/2022 03:08:36 - INFO - codeparrot_training - Step 38284: {'lr': 6.996814945135657e-05, 'samples': 19601920, 'steps': 38284, 'loss/train': 2.217952251434326} +02/26/2022 03:08:42 - INFO - codeparrot_training - Step 38285: {'lr': 6.995679687610276e-05, 'samples': 19602432, 'steps': 38285, 'loss/train': 2.027120351791382} +02/26/2022 03:08:45 - INFO - codeparrot_training - Step 38286: {'lr': 6.994544507209688e-05, 'samples': 19602944, 'steps': 38286, 'loss/train': 1.4986342191696167} +02/26/2022 03:08:51 - INFO - codeparrot_training - Step 38287: {'lr': 6.993409403938752e-05, 'samples': 19603456, 'steps': 38287, 'loss/train': 1.6712936162948608} +02/26/2022 03:08:54 - INFO - codeparrot_training - Step 38288: {'lr': 6.992274377802327e-05, 'samples': 19603968, 'steps': 38288, 'loss/train': 3.0750985145568848} +02/26/2022 03:09:00 - INFO - codeparrot_training - Step 38289: {'lr': 6.991139428805288e-05, 'samples': 19604480, 'steps': 38289, 'loss/train': 1.3052424192428589} +02/26/2022 03:09:03 - INFO - codeparrot_training - Step 38290: {'lr': 6.990004556952487e-05, 'samples': 19604992, 'steps': 38290, 'loss/train': 1.5871858596801758} +02/26/2022 03:09:09 - INFO - codeparrot_training - Step 38291: {'lr': 6.98886976224879e-05, 'samples': 19605504, 'steps': 38291, 'loss/train': 1.7583281993865967} +02/26/2022 03:09:12 - INFO - codeparrot_training - Step 38292: {'lr': 6.987735044699045e-05, 'samples': 19606016, 'steps': 38292, 'loss/train': 2.274233102798462} +02/26/2022 03:09:20 - INFO - codeparrot_training - Step 38293: {'lr': 6.986600404308132e-05, 'samples': 19606528, 'steps': 38293, 'loss/train': 2.299293041229248} +02/26/2022 03:09:23 - INFO - codeparrot_training - Step 38294: {'lr': 6.985465841080899e-05, 'samples': 19607040, 'steps': 38294, 'loss/train': 1.7122441530227661} +02/26/2022 03:09:29 - INFO - codeparrot_training - Step 38295: {'lr': 6.984331355022222e-05, 'samples': 19607552, 'steps': 38295, 'loss/train': 1.8874236345291138} +02/26/2022 03:09:32 - INFO - codeparrot_training - Step 38296: {'lr': 6.983196946136935e-05, 'samples': 19608064, 'steps': 38296, 'loss/train': 1.9548982381820679} +02/26/2022 03:09:38 - INFO - codeparrot_training - Step 38297: {'lr': 6.982062614429918e-05, 'samples': 19608576, 'steps': 38297, 'loss/train': 3.8726401329040527} +02/26/2022 03:09:41 - INFO - codeparrot_training - Step 38298: {'lr': 6.980928359906025e-05, 'samples': 19609088, 'steps': 38298, 'loss/train': 0.9677563905715942} +02/26/2022 03:09:47 - INFO - codeparrot_training - Step 38299: {'lr': 6.979794182570112e-05, 'samples': 19609600, 'steps': 38299, 'loss/train': 1.4185266494750977} +02/26/2022 03:09:50 - INFO - codeparrot_training - Step 38300: {'lr': 6.97866008242703e-05, 'samples': 19610112, 'steps': 38300, 'loss/train': 1.8968249559402466} +02/26/2022 03:09:56 - INFO - codeparrot_training - Step 38301: {'lr': 6.977526059481653e-05, 'samples': 19610624, 'steps': 38301, 'loss/train': 7.962368488311768} +02/26/2022 03:10:00 - INFO - codeparrot_training - Step 38302: {'lr': 6.976392113738833e-05, 'samples': 19611136, 'steps': 38302, 'loss/train': 2.0363941192626953} +02/26/2022 03:10:05 - INFO - codeparrot_training - Step 38303: {'lr': 6.97525824520342e-05, 'samples': 19611648, 'steps': 38303, 'loss/train': 1.7641922235488892} +02/26/2022 03:10:09 - INFO - codeparrot_training - Step 38304: {'lr': 6.974124453880282e-05, 'samples': 19612160, 'steps': 38304, 'loss/train': 1.8338292837142944} +02/26/2022 03:10:14 - INFO - codeparrot_training - Step 38305: {'lr': 6.972990739774274e-05, 'samples': 19612672, 'steps': 38305, 'loss/train': 1.7249993085861206} +02/26/2022 03:10:18 - INFO - codeparrot_training - Step 38306: {'lr': 6.971857102890247e-05, 'samples': 19613184, 'steps': 38306, 'loss/train': 1.5775387287139893} +02/26/2022 03:10:23 - INFO - codeparrot_training - Step 38307: {'lr': 6.97072354323305e-05, 'samples': 19613696, 'steps': 38307, 'loss/train': 1.1379903554916382} +02/26/2022 03:10:27 - INFO - codeparrot_training - Step 38308: {'lr': 6.969590060807563e-05, 'samples': 19614208, 'steps': 38308, 'loss/train': 1.80392324924469} +02/26/2022 03:10:32 - INFO - codeparrot_training - Step 38309: {'lr': 6.968456655618621e-05, 'samples': 19614720, 'steps': 38309, 'loss/train': 1.4866101741790771} +02/26/2022 03:10:36 - INFO - codeparrot_training - Step 38310: {'lr': 6.967323327671085e-05, 'samples': 19615232, 'steps': 38310, 'loss/train': 0.8231110572814941} +02/26/2022 03:10:41 - INFO - codeparrot_training - Step 38311: {'lr': 6.966190076969806e-05, 'samples': 19615744, 'steps': 38311, 'loss/train': 1.5180293321609497} +02/26/2022 03:10:45 - INFO - codeparrot_training - Step 38312: {'lr': 6.965056903519648e-05, 'samples': 19616256, 'steps': 38312, 'loss/train': 1.631626844406128} +02/26/2022 03:10:51 - INFO - codeparrot_training - Step 38313: {'lr': 6.96392380732546e-05, 'samples': 19616768, 'steps': 38313, 'loss/train': 1.9530813694000244} +02/26/2022 03:10:56 - INFO - codeparrot_training - Step 38314: {'lr': 6.962790788392093e-05, 'samples': 19617280, 'steps': 38314, 'loss/train': 1.4769620895385742} +02/26/2022 03:11:00 - INFO - codeparrot_training - Step 38315: {'lr': 6.961657846724395e-05, 'samples': 19617792, 'steps': 38315, 'loss/train': 2.2006146907806396} +02/26/2022 03:11:05 - INFO - codeparrot_training - Step 38316: {'lr': 6.960524982327238e-05, 'samples': 19618304, 'steps': 38316, 'loss/train': 1.8449044227600098} +02/26/2022 03:11:09 - INFO - codeparrot_training - Step 38317: {'lr': 6.959392195205461e-05, 'samples': 19618816, 'steps': 38317, 'loss/train': 1.8796827793121338} +02/26/2022 03:11:12 - INFO - codeparrot_training - Step 38318: {'lr': 6.958259485363922e-05, 'samples': 19619328, 'steps': 38318, 'loss/train': 0.7383489608764648} +02/26/2022 03:11:18 - INFO - codeparrot_training - Step 38319: {'lr': 6.95712685280746e-05, 'samples': 19619840, 'steps': 38319, 'loss/train': 1.6463539600372314} +02/26/2022 03:11:21 - INFO - codeparrot_training - Step 38320: {'lr': 6.955994297540946e-05, 'samples': 19620352, 'steps': 38320, 'loss/train': 2.559006690979004} +02/26/2022 03:11:27 - INFO - codeparrot_training - Step 38321: {'lr': 6.954861819569225e-05, 'samples': 19620864, 'steps': 38321, 'loss/train': 1.0560564994812012} +02/26/2022 03:11:30 - INFO - codeparrot_training - Step 38322: {'lr': 6.953729418897142e-05, 'samples': 19621376, 'steps': 38322, 'loss/train': 1.7350120544433594} +02/26/2022 03:11:36 - INFO - codeparrot_training - Step 38323: {'lr': 6.952597095529548e-05, 'samples': 19621888, 'steps': 38323, 'loss/train': 0.9742646217346191} +02/26/2022 03:11:42 - INFO - codeparrot_training - Step 38324: {'lr': 6.9514648494713e-05, 'samples': 19622400, 'steps': 38324, 'loss/train': 2.3117151260375977} +02/26/2022 03:11:45 - INFO - codeparrot_training - Step 38325: {'lr': 6.95033268072725e-05, 'samples': 19622912, 'steps': 38325, 'loss/train': 1.4532585144042969} +02/26/2022 03:11:51 - INFO - codeparrot_training - Step 38326: {'lr': 6.949200589302243e-05, 'samples': 19623424, 'steps': 38326, 'loss/train': 1.5678054094314575} +02/26/2022 03:11:54 - INFO - codeparrot_training - Step 38327: {'lr': 6.948068575201118e-05, 'samples': 19623936, 'steps': 38327, 'loss/train': 0.8305355906486511} +02/26/2022 03:12:01 - INFO - codeparrot_training - Step 38328: {'lr': 6.946936638428747e-05, 'samples': 19624448, 'steps': 38328, 'loss/train': 1.9675689935684204} +02/26/2022 03:12:04 - INFO - codeparrot_training - Step 38329: {'lr': 6.945804778989959e-05, 'samples': 19624960, 'steps': 38329, 'loss/train': 1.5720771551132202} +02/26/2022 03:12:08 - INFO - codeparrot_training - Step 38330: {'lr': 6.944672996889623e-05, 'samples': 19625472, 'steps': 38330, 'loss/train': 2.2868762016296387} +02/26/2022 03:12:13 - INFO - codeparrot_training - Step 38331: {'lr': 6.94354129213256e-05, 'samples': 19625984, 'steps': 38331, 'loss/train': 1.3972021341323853} +02/26/2022 03:12:17 - INFO - codeparrot_training - Step 38332: {'lr': 6.94240966472364e-05, 'samples': 19626496, 'steps': 38332, 'loss/train': 1.7493994235992432} +02/26/2022 03:12:22 - INFO - codeparrot_training - Step 38333: {'lr': 6.941278114667696e-05, 'samples': 19627008, 'steps': 38333, 'loss/train': 1.1633567810058594} +02/26/2022 03:12:26 - INFO - codeparrot_training - Step 38334: {'lr': 6.940146641969599e-05, 'samples': 19627520, 'steps': 38334, 'loss/train': 0.05693844333291054} +02/26/2022 03:12:31 - INFO - codeparrot_training - Step 38335: {'lr': 6.939015246634162e-05, 'samples': 19628032, 'steps': 38335, 'loss/train': 1.7946480512619019} +02/26/2022 03:12:35 - INFO - codeparrot_training - Step 38336: {'lr': 6.937883928666256e-05, 'samples': 19628544, 'steps': 38336, 'loss/train': 2.596149444580078} +02/26/2022 03:12:40 - INFO - codeparrot_training - Step 38337: {'lr': 6.936752688070713e-05, 'samples': 19629056, 'steps': 38337, 'loss/train': 1.6972674131393433} +02/26/2022 03:12:44 - INFO - codeparrot_training - Step 38338: {'lr': 6.9356215248524e-05, 'samples': 19629568, 'steps': 38338, 'loss/train': 2.2823193073272705} +02/26/2022 03:12:51 - INFO - codeparrot_training - Step 38339: {'lr': 6.934490439016136e-05, 'samples': 19630080, 'steps': 38339, 'loss/train': 1.9745047092437744} +02/26/2022 03:12:54 - INFO - codeparrot_training - Step 38340: {'lr': 6.933359430566785e-05, 'samples': 19630592, 'steps': 38340, 'loss/train': 2.5512940883636475} +02/26/2022 03:13:00 - INFO - codeparrot_training - Step 38341: {'lr': 6.932228499509177e-05, 'samples': 19631104, 'steps': 38341, 'loss/train': 1.4923121929168701} +02/26/2022 03:13:03 - INFO - codeparrot_training - Step 38342: {'lr': 6.931097645848172e-05, 'samples': 19631616, 'steps': 38342, 'loss/train': 1.9151735305786133} +02/26/2022 03:13:09 - INFO - codeparrot_training - Step 38343: {'lr': 6.929966869588609e-05, 'samples': 19632128, 'steps': 38343, 'loss/train': 2.281074047088623} +02/26/2022 03:13:12 - INFO - codeparrot_training - Step 38344: {'lr': 6.928836170735328e-05, 'samples': 19632640, 'steps': 38344, 'loss/train': 1.8603179454803467} +02/26/2022 03:13:18 - INFO - codeparrot_training - Step 38345: {'lr': 6.927705549293167e-05, 'samples': 19633152, 'steps': 38345, 'loss/train': 1.8410143852233887} +02/26/2022 03:13:21 - INFO - codeparrot_training - Step 38346: {'lr': 6.926575005266986e-05, 'samples': 19633664, 'steps': 38346, 'loss/train': 2.4325764179229736} +02/26/2022 03:13:27 - INFO - codeparrot_training - Step 38347: {'lr': 6.925444538661618e-05, 'samples': 19634176, 'steps': 38347, 'loss/train': 1.8347617387771606} +02/26/2022 03:13:30 - INFO - codeparrot_training - Step 38348: {'lr': 6.924314149481905e-05, 'samples': 19634688, 'steps': 38348, 'loss/train': 1.1782866716384888} +02/26/2022 03:13:37 - INFO - codeparrot_training - Step 38349: {'lr': 6.923183837732694e-05, 'samples': 19635200, 'steps': 38349, 'loss/train': 1.8457951545715332} +02/26/2022 03:13:40 - INFO - codeparrot_training - Step 38350: {'lr': 6.922053603418812e-05, 'samples': 19635712, 'steps': 38350, 'loss/train': 2.0619657039642334} +02/26/2022 03:13:46 - INFO - codeparrot_training - Step 38351: {'lr': 6.920923446545121e-05, 'samples': 19636224, 'steps': 38351, 'loss/train': 2.1893832683563232} +02/26/2022 03:13:49 - INFO - codeparrot_training - Step 38352: {'lr': 6.919793367116453e-05, 'samples': 19636736, 'steps': 38352, 'loss/train': 1.5401129722595215} +02/26/2022 03:13:55 - INFO - codeparrot_training - Step 38353: {'lr': 6.918663365137651e-05, 'samples': 19637248, 'steps': 38353, 'loss/train': 0.9590820074081421} +02/26/2022 03:13:58 - INFO - codeparrot_training - Step 38354: {'lr': 6.917533440613543e-05, 'samples': 19637760, 'steps': 38354, 'loss/train': 1.5230873823165894} +02/26/2022 03:14:04 - INFO - codeparrot_training - Step 38355: {'lr': 6.91640359354899e-05, 'samples': 19638272, 'steps': 38355, 'loss/train': 1.3341290950775146} +02/26/2022 03:14:07 - INFO - codeparrot_training - Step 38356: {'lr': 6.91527382394882e-05, 'samples': 19638784, 'steps': 38356, 'loss/train': 1.6489259004592896} +02/26/2022 03:14:13 - INFO - codeparrot_training - Step 38357: {'lr': 6.914144131817876e-05, 'samples': 19639296, 'steps': 38357, 'loss/train': 1.5889368057250977} +02/26/2022 03:14:16 - INFO - codeparrot_training - Step 38358: {'lr': 6.913014517160986e-05, 'samples': 19639808, 'steps': 38358, 'loss/train': 2.0269086360931396} +02/26/2022 03:14:23 - INFO - codeparrot_training - Step 38359: {'lr': 6.911884979983007e-05, 'samples': 19640320, 'steps': 38359, 'loss/train': 2.6325814723968506} +02/26/2022 03:14:26 - INFO - codeparrot_training - Step 38360: {'lr': 6.91075552028877e-05, 'samples': 19640832, 'steps': 38360, 'loss/train': 1.1975805759429932} +02/26/2022 03:14:31 - INFO - codeparrot_training - Step 38361: {'lr': 6.909626138083114e-05, 'samples': 19641344, 'steps': 38361, 'loss/train': 1.8384859561920166} +02/26/2022 03:14:35 - INFO - codeparrot_training - Step 38362: {'lr': 6.908496833370865e-05, 'samples': 19641856, 'steps': 38362, 'loss/train': 3.091197967529297} +02/26/2022 03:14:41 - INFO - codeparrot_training - Step 38363: {'lr': 6.907367606156878e-05, 'samples': 19642368, 'steps': 38363, 'loss/train': 0.1851411908864975} +02/26/2022 03:14:44 - INFO - codeparrot_training - Step 38364: {'lr': 6.906238456445977e-05, 'samples': 19642880, 'steps': 38364, 'loss/train': 2.2467594146728516} +02/26/2022 03:14:50 - INFO - codeparrot_training - Step 38365: {'lr': 6.905109384243019e-05, 'samples': 19643392, 'steps': 38365, 'loss/train': 1.6727991104125977} +02/26/2022 03:14:53 - INFO - codeparrot_training - Step 38366: {'lr': 6.903980389552814e-05, 'samples': 19643904, 'steps': 38366, 'loss/train': 2.3676037788391113} +02/26/2022 03:14:59 - INFO - codeparrot_training - Step 38367: {'lr': 6.902851472380215e-05, 'samples': 19644416, 'steps': 38367, 'loss/train': 1.8005988597869873} +02/26/2022 03:15:02 - INFO - codeparrot_training - Step 38368: {'lr': 6.901722632730048e-05, 'samples': 19644928, 'steps': 38368, 'loss/train': 1.013195514678955} +02/26/2022 03:15:08 - INFO - codeparrot_training - Step 38369: {'lr': 6.900593870607169e-05, 'samples': 19645440, 'steps': 38369, 'loss/train': 1.7053675651550293} +02/26/2022 03:15:12 - INFO - codeparrot_training - Step 38370: {'lr': 6.899465186016385e-05, 'samples': 19645952, 'steps': 38370, 'loss/train': 0.2534477710723877} +02/26/2022 03:15:17 - INFO - codeparrot_training - Step 38371: {'lr': 6.898336578962549e-05, 'samples': 19646464, 'steps': 38371, 'loss/train': 0.800690233707428} +02/26/2022 03:15:21 - INFO - codeparrot_training - Step 38372: {'lr': 6.897208049450488e-05, 'samples': 19646976, 'steps': 38372, 'loss/train': 0.7948448061943054} +02/26/2022 03:15:26 - INFO - codeparrot_training - Step 38373: {'lr': 6.896079597485053e-05, 'samples': 19647488, 'steps': 38373, 'loss/train': 1.2068716287612915} +02/26/2022 03:15:30 - INFO - codeparrot_training - Step 38374: {'lr': 6.894951223071046e-05, 'samples': 19648000, 'steps': 38374, 'loss/train': 0.7735446691513062} +02/26/2022 03:15:35 - INFO - codeparrot_training - Step 38375: {'lr': 6.893822926213331e-05, 'samples': 19648512, 'steps': 38375, 'loss/train': 1.6190383434295654} +02/26/2022 03:15:39 - INFO - codeparrot_training - Step 38376: {'lr': 6.892694706916719e-05, 'samples': 19649024, 'steps': 38376, 'loss/train': 0.7150295972824097} +02/26/2022 03:15:44 - INFO - codeparrot_training - Step 38377: {'lr': 6.89156656518606e-05, 'samples': 19649536, 'steps': 38377, 'loss/train': 1.3908824920654297} +02/26/2022 03:15:48 - INFO - codeparrot_training - Step 38378: {'lr': 6.890438501026183e-05, 'samples': 19650048, 'steps': 38378, 'loss/train': 2.4899752140045166} +02/26/2022 03:15:53 - INFO - codeparrot_training - Step 38379: {'lr': 6.889310514441915e-05, 'samples': 19650560, 'steps': 38379, 'loss/train': 0.7606871724128723} +02/26/2022 03:15:57 - INFO - codeparrot_training - Step 38380: {'lr': 6.888182605438082e-05, 'samples': 19651072, 'steps': 38380, 'loss/train': 0.705439567565918} +02/26/2022 03:16:03 - INFO - codeparrot_training - Step 38381: {'lr': 6.887054774019533e-05, 'samples': 19651584, 'steps': 38381, 'loss/train': 4.246715545654297} +02/26/2022 03:16:07 - INFO - codeparrot_training - Step 38382: {'lr': 6.885927020191088e-05, 'samples': 19652096, 'steps': 38382, 'loss/train': 8.242523193359375} +02/26/2022 03:16:12 - INFO - codeparrot_training - Step 38383: {'lr': 6.884799343957579e-05, 'samples': 19652608, 'steps': 38383, 'loss/train': 2.509084463119507} +02/26/2022 03:16:16 - INFO - codeparrot_training - Step 38384: {'lr': 6.883671745323833e-05, 'samples': 19653120, 'steps': 38384, 'loss/train': 1.7395373582839966} +02/26/2022 03:16:22 - INFO - codeparrot_training - Step 38385: {'lr': 6.88254422429469e-05, 'samples': 19653632, 'steps': 38385, 'loss/train': 1.5212839841842651} +02/26/2022 03:16:25 - INFO - codeparrot_training - Step 38386: {'lr': 6.881416780874975e-05, 'samples': 19654144, 'steps': 38386, 'loss/train': 0.922737717628479} +02/26/2022 03:16:31 - INFO - codeparrot_training - Step 38387: {'lr': 6.880289415069516e-05, 'samples': 19654656, 'steps': 38387, 'loss/train': 1.8092321157455444} +02/26/2022 03:16:34 - INFO - codeparrot_training - Step 38388: {'lr': 6.879162126883137e-05, 'samples': 19655168, 'steps': 38388, 'loss/train': 1.829150676727295} +02/26/2022 03:16:40 - INFO - codeparrot_training - Step 38389: {'lr': 6.878034916320683e-05, 'samples': 19655680, 'steps': 38389, 'loss/train': 2.053861379623413} +02/26/2022 03:16:44 - INFO - codeparrot_training - Step 38390: {'lr': 6.876907783386971e-05, 'samples': 19656192, 'steps': 38390, 'loss/train': 1.4137603044509888} +02/26/2022 03:16:49 - INFO - codeparrot_training - Step 38391: {'lr': 6.875780728086831e-05, 'samples': 19656704, 'steps': 38391, 'loss/train': 1.724225640296936} +02/26/2022 03:16:53 - INFO - codeparrot_training - Step 38392: {'lr': 6.874653750425083e-05, 'samples': 19657216, 'steps': 38392, 'loss/train': 2.4909112453460693} +02/26/2022 03:16:58 - INFO - codeparrot_training - Step 38393: {'lr': 6.873526850406573e-05, 'samples': 19657728, 'steps': 38393, 'loss/train': 0.9760668277740479} +02/26/2022 03:17:02 - INFO - codeparrot_training - Step 38394: {'lr': 6.872400028036116e-05, 'samples': 19658240, 'steps': 38394, 'loss/train': 2.6618876457214355} +02/26/2022 03:17:08 - INFO - codeparrot_training - Step 38395: {'lr': 6.871273283318541e-05, 'samples': 19658752, 'steps': 38395, 'loss/train': 2.468435049057007} +02/26/2022 03:17:11 - INFO - codeparrot_training - Step 38396: {'lr': 6.870146616258677e-05, 'samples': 19659264, 'steps': 38396, 'loss/train': 1.029135823249817} +02/26/2022 03:17:17 - INFO - codeparrot_training - Step 38397: {'lr': 6.869020026861339e-05, 'samples': 19659776, 'steps': 38397, 'loss/train': 2.4733827114105225} +02/26/2022 03:17:20 - INFO - codeparrot_training - Step 38398: {'lr': 6.867893515131368e-05, 'samples': 19660288, 'steps': 38398, 'loss/train': 0.9131062030792236} +02/26/2022 03:17:26 - INFO - codeparrot_training - Step 38399: {'lr': 6.866767081073586e-05, 'samples': 19660800, 'steps': 38399, 'loss/train': 1.0162612199783325} +02/26/2022 03:17:29 - INFO - codeparrot_training - Step 38400: {'lr': 6.865640724692814e-05, 'samples': 19661312, 'steps': 38400, 'loss/train': 1.7749122381210327} +02/26/2022 03:17:35 - INFO - codeparrot_training - Step 38401: {'lr': 6.864514445993875e-05, 'samples': 19661824, 'steps': 38401, 'loss/train': 1.9093453884124756} +02/26/2022 03:17:38 - INFO - codeparrot_training - Step 38402: {'lr': 6.863388244981602e-05, 'samples': 19662336, 'steps': 38402, 'loss/train': 2.0899407863616943} +02/26/2022 03:17:44 - INFO - codeparrot_training - Step 38403: {'lr': 6.862262121660806e-05, 'samples': 19662848, 'steps': 38403, 'loss/train': 2.282686233520508} +02/26/2022 03:17:47 - INFO - codeparrot_training - Step 38404: {'lr': 6.861136076036337e-05, 'samples': 19663360, 'steps': 38404, 'loss/train': 2.10834002494812} +02/26/2022 03:17:51 - INFO - codeparrot_training - Step 38405: {'lr': 6.860010108112985e-05, 'samples': 19663872, 'steps': 38405, 'loss/train': 2.057204008102417} +02/26/2022 03:17:57 - INFO - codeparrot_training - Step 38406: {'lr': 6.8588842178956e-05, 'samples': 19664384, 'steps': 38406, 'loss/train': 1.6700900793075562} +02/26/2022 03:18:01 - INFO - codeparrot_training - Step 38407: {'lr': 6.857758405388984e-05, 'samples': 19664896, 'steps': 38407, 'loss/train': 2.088494300842285} +02/26/2022 03:18:06 - INFO - codeparrot_training - Step 38408: {'lr': 6.856632670597988e-05, 'samples': 19665408, 'steps': 38408, 'loss/train': 1.6609251499176025} +02/26/2022 03:18:10 - INFO - codeparrot_training - Step 38409: {'lr': 6.855507013527398e-05, 'samples': 19665920, 'steps': 38409, 'loss/train': 1.5301356315612793} +02/26/2022 03:18:15 - INFO - codeparrot_training - Step 38410: {'lr': 6.854381434182063e-05, 'samples': 19666432, 'steps': 38410, 'loss/train': 1.9033960103988647} +02/26/2022 03:18:19 - INFO - codeparrot_training - Step 38411: {'lr': 6.853255932566788e-05, 'samples': 19666944, 'steps': 38411, 'loss/train': 1.6113755702972412} +02/26/2022 03:18:24 - INFO - codeparrot_training - Step 38412: {'lr': 6.85213050868641e-05, 'samples': 19667456, 'steps': 38412, 'loss/train': 2.4330015182495117} +02/26/2022 03:18:30 - INFO - codeparrot_training - Step 38413: {'lr': 6.851005162545746e-05, 'samples': 19667968, 'steps': 38413, 'loss/train': 2.0863029956817627} +02/26/2022 03:18:33 - INFO - codeparrot_training - Step 38414: {'lr': 6.849879894149607e-05, 'samples': 19668480, 'steps': 38414, 'loss/train': 1.26804518699646} +02/26/2022 03:18:39 - INFO - codeparrot_training - Step 38415: {'lr': 6.848754703502815e-05, 'samples': 19668992, 'steps': 38415, 'loss/train': 0.8444098234176636} +02/26/2022 03:18:42 - INFO - codeparrot_training - Step 38416: {'lr': 6.847629590610202e-05, 'samples': 19669504, 'steps': 38416, 'loss/train': 0.7023478746414185} +02/26/2022 03:18:49 - INFO - codeparrot_training - Step 38417: {'lr': 6.846504555476579e-05, 'samples': 19670016, 'steps': 38417, 'loss/train': 1.8845778703689575} +02/26/2022 03:18:52 - INFO - codeparrot_training - Step 38418: {'lr': 6.845379598106766e-05, 'samples': 19670528, 'steps': 38418, 'loss/train': 2.440739393234253} +02/26/2022 03:18:58 - INFO - codeparrot_training - Step 38419: {'lr': 6.844254718505574e-05, 'samples': 19671040, 'steps': 38419, 'loss/train': 1.5760228633880615} +02/26/2022 03:19:01 - INFO - codeparrot_training - Step 38420: {'lr': 6.84312991667784e-05, 'samples': 19671552, 'steps': 38420, 'loss/train': 1.8081988096237183} +02/26/2022 03:19:07 - INFO - codeparrot_training - Step 38421: {'lr': 6.84200519262837e-05, 'samples': 19672064, 'steps': 38421, 'loss/train': 1.5852195024490356} +02/26/2022 03:19:10 - INFO - codeparrot_training - Step 38422: {'lr': 6.840880546361983e-05, 'samples': 19672576, 'steps': 38422, 'loss/train': 2.1679470539093018} +02/26/2022 03:19:16 - INFO - codeparrot_training - Step 38423: {'lr': 6.839755977883491e-05, 'samples': 19673088, 'steps': 38423, 'loss/train': 1.893385410308838} +02/26/2022 03:19:19 - INFO - codeparrot_training - Step 38424: {'lr': 6.838631487197728e-05, 'samples': 19673600, 'steps': 38424, 'loss/train': 1.641092300415039} +02/26/2022 03:19:24 - INFO - codeparrot_training - Step 38425: {'lr': 6.837507074309488e-05, 'samples': 19674112, 'steps': 38425, 'loss/train': 1.9038786888122559} +02/26/2022 03:19:28 - INFO - codeparrot_training - Step 38426: {'lr': 6.836382739223618e-05, 'samples': 19674624, 'steps': 38426, 'loss/train': 1.2102866172790527} +02/26/2022 03:19:34 - INFO - codeparrot_training - Step 38427: {'lr': 6.835258481944904e-05, 'samples': 19675136, 'steps': 38427, 'loss/train': 2.333507537841797} +02/26/2022 03:19:38 - INFO - codeparrot_training - Step 38428: {'lr': 6.834134302478179e-05, 'samples': 19675648, 'steps': 38428, 'loss/train': 2.0154917240142822} +02/26/2022 03:19:43 - INFO - codeparrot_training - Step 38429: {'lr': 6.833010200828255e-05, 'samples': 19676160, 'steps': 38429, 'loss/train': 0.6300233602523804} +02/26/2022 03:19:46 - INFO - codeparrot_training - Step 38430: {'lr': 6.831886176999947e-05, 'samples': 19676672, 'steps': 38430, 'loss/train': 1.9117789268493652} +02/26/2022 03:19:52 - INFO - codeparrot_training - Step 38431: {'lr': 6.830762230998064e-05, 'samples': 19677184, 'steps': 38431, 'loss/train': 1.068660855293274} +02/26/2022 03:19:55 - INFO - codeparrot_training - Step 38432: {'lr': 6.829638362827431e-05, 'samples': 19677696, 'steps': 38432, 'loss/train': 2.11419415473938} +02/26/2022 03:20:01 - INFO - codeparrot_training - Step 38433: {'lr': 6.828514572492859e-05, 'samples': 19678208, 'steps': 38433, 'loss/train': 1.270612359046936} +02/26/2022 03:20:04 - INFO - codeparrot_training - Step 38434: {'lr': 6.827390859999158e-05, 'samples': 19678720, 'steps': 38434, 'loss/train': 1.7337863445281982} +02/26/2022 03:20:10 - INFO - codeparrot_training - Step 38435: {'lr': 6.826267225351141e-05, 'samples': 19679232, 'steps': 38435, 'loss/train': 1.9830979108810425} +02/26/2022 03:20:13 - INFO - codeparrot_training - Step 38436: {'lr': 6.825143668553626e-05, 'samples': 19679744, 'steps': 38436, 'loss/train': 2.1001436710357666} +02/26/2022 03:20:19 - INFO - codeparrot_training - Step 38437: {'lr': 6.82402018961143e-05, 'samples': 19680256, 'steps': 38437, 'loss/train': 1.7360002994537354} +02/26/2022 03:20:22 - INFO - codeparrot_training - Step 38438: {'lr': 6.82289678852935e-05, 'samples': 19680768, 'steps': 38438, 'loss/train': 1.8273926973342896} +02/26/2022 03:20:28 - INFO - codeparrot_training - Step 38439: {'lr': 6.821773465312216e-05, 'samples': 19681280, 'steps': 38439, 'loss/train': 1.8329812288284302} +02/26/2022 03:20:31 - INFO - codeparrot_training - Step 38440: {'lr': 6.820650219964833e-05, 'samples': 19681792, 'steps': 38440, 'loss/train': 0.7322726249694824} +02/26/2022 03:20:37 - INFO - codeparrot_training - Step 38441: {'lr': 6.819527052492011e-05, 'samples': 19682304, 'steps': 38441, 'loss/train': 0.5114310383796692} +02/26/2022 03:20:41 - INFO - codeparrot_training - Step 38442: {'lr': 6.818403962898553e-05, 'samples': 19682816, 'steps': 38442, 'loss/train': 1.5200272798538208} +02/26/2022 03:20:46 - INFO - codeparrot_training - Step 38443: {'lr': 6.817280951189298e-05, 'samples': 19683328, 'steps': 38443, 'loss/train': 1.7517212629318237} +02/26/2022 03:20:50 - INFO - codeparrot_training - Step 38444: {'lr': 6.81615801736902e-05, 'samples': 19683840, 'steps': 38444, 'loss/train': 0.21692833304405212} +02/26/2022 03:20:55 - INFO - codeparrot_training - Step 38445: {'lr': 6.815035161442554e-05, 'samples': 19684352, 'steps': 38445, 'loss/train': 1.6718298196792603} +02/26/2022 03:20:59 - INFO - codeparrot_training - Step 38446: {'lr': 6.813912383414698e-05, 'samples': 19684864, 'steps': 38446, 'loss/train': 2.0770835876464844} +02/26/2022 03:21:04 - INFO - codeparrot_training - Step 38447: {'lr': 6.81278968329028e-05, 'samples': 19685376, 'steps': 38447, 'loss/train': 0.7157784104347229} +02/26/2022 03:21:08 - INFO - codeparrot_training - Step 38448: {'lr': 6.811667061074082e-05, 'samples': 19685888, 'steps': 38448, 'loss/train': 0.8628271818161011} +02/26/2022 03:21:13 - INFO - codeparrot_training - Step 38449: {'lr': 6.810544516770934e-05, 'samples': 19686400, 'steps': 38449, 'loss/train': 1.2255158424377441} +02/26/2022 03:21:19 - INFO - codeparrot_training - Step 38450: {'lr': 6.809422050385628e-05, 'samples': 19686912, 'steps': 38450, 'loss/train': 2.3205976486206055} +02/26/2022 03:21:22 - INFO - codeparrot_training - Step 38451: {'lr': 6.80829966192299e-05, 'samples': 19687424, 'steps': 38451, 'loss/train': 1.3617819547653198} +02/26/2022 03:21:29 - INFO - codeparrot_training - Step 38452: {'lr': 6.807177351387823e-05, 'samples': 19687936, 'steps': 38452, 'loss/train': 2.2382023334503174} +02/26/2022 03:21:32 - INFO - codeparrot_training - Step 38453: {'lr': 6.806055118784926e-05, 'samples': 19688448, 'steps': 38453, 'loss/train': 2.1060197353363037} +02/26/2022 03:21:37 - INFO - codeparrot_training - Step 38454: {'lr': 6.804932964119109e-05, 'samples': 19688960, 'steps': 38454, 'loss/train': 2.0379011631011963} +02/26/2022 03:21:41 - INFO - codeparrot_training - Step 38455: {'lr': 6.803810887395187e-05, 'samples': 19689472, 'steps': 38455, 'loss/train': 2.00443696975708} +02/26/2022 03:21:46 - INFO - codeparrot_training - Step 38456: {'lr': 6.802688888617962e-05, 'samples': 19689984, 'steps': 38456, 'loss/train': 2.0512964725494385} +02/26/2022 03:21:50 - INFO - codeparrot_training - Step 38457: {'lr': 6.801566967792239e-05, 'samples': 19690496, 'steps': 38457, 'loss/train': 1.3247833251953125} +02/26/2022 03:21:56 - INFO - codeparrot_training - Step 38458: {'lr': 6.800445124922816e-05, 'samples': 19691008, 'steps': 38458, 'loss/train': 0.9699744582176208} +02/26/2022 03:21:59 - INFO - codeparrot_training - Step 38459: {'lr': 6.799323360014514e-05, 'samples': 19691520, 'steps': 38459, 'loss/train': 1.271215796470642} +02/26/2022 03:22:02 - INFO - codeparrot_training - Step 38460: {'lr': 6.798201673072127e-05, 'samples': 19692032, 'steps': 38460, 'loss/train': 1.1692957878112793} +02/26/2022 03:22:08 - INFO - codeparrot_training - Step 38461: {'lr': 6.797080064100478e-05, 'samples': 19692544, 'steps': 38461, 'loss/train': 3.000379800796509} +02/26/2022 03:22:14 - INFO - codeparrot_training - Step 38462: {'lr': 6.79595853310434e-05, 'samples': 19693056, 'steps': 38462, 'loss/train': 2.173128843307495} +02/26/2022 03:22:18 - INFO - codeparrot_training - Step 38463: {'lr': 6.794837080088545e-05, 'samples': 19693568, 'steps': 38463, 'loss/train': 1.9213277101516724} +02/26/2022 03:22:21 - INFO - codeparrot_training - Step 38464: {'lr': 6.793715705057882e-05, 'samples': 19694080, 'steps': 38464, 'loss/train': 2.5000038146972656} +02/26/2022 03:22:27 - INFO - codeparrot_training - Step 38465: {'lr': 6.792594408017172e-05, 'samples': 19694592, 'steps': 38465, 'loss/train': 2.22418212890625} +02/26/2022 03:22:30 - INFO - codeparrot_training - Step 38466: {'lr': 6.791473188971192e-05, 'samples': 19695104, 'steps': 38466, 'loss/train': 2.945513963699341} +02/26/2022 03:22:36 - INFO - codeparrot_training - Step 38467: {'lr': 6.790352047924766e-05, 'samples': 19695616, 'steps': 38467, 'loss/train': 1.5484987497329712} +02/26/2022 03:22:39 - INFO - codeparrot_training - Step 38468: {'lr': 6.789230984882683e-05, 'samples': 19696128, 'steps': 38468, 'loss/train': 2.054885149002075} +02/26/2022 03:22:45 - INFO - codeparrot_training - Step 38469: {'lr': 6.788109999849765e-05, 'samples': 19696640, 'steps': 38469, 'loss/train': 1.6869285106658936} +02/26/2022 03:22:48 - INFO - codeparrot_training - Step 38470: {'lr': 6.786989092830786e-05, 'samples': 19697152, 'steps': 38470, 'loss/train': 1.016160249710083} +02/26/2022 03:22:54 - INFO - codeparrot_training - Step 38471: {'lr': 6.785868263830572e-05, 'samples': 19697664, 'steps': 38471, 'loss/train': 1.838807463645935} +02/26/2022 03:22:57 - INFO - codeparrot_training - Step 38472: {'lr': 6.784747512853905e-05, 'samples': 19698176, 'steps': 38472, 'loss/train': 1.3608500957489014} +02/26/2022 03:23:04 - INFO - codeparrot_training - Step 38473: {'lr': 6.783626839905605e-05, 'samples': 19698688, 'steps': 38473, 'loss/train': 2.1875054836273193} +02/26/2022 03:23:07 - INFO - codeparrot_training - Step 38474: {'lr': 6.782506244990463e-05, 'samples': 19699200, 'steps': 38474, 'loss/train': 1.6835252046585083} +02/26/2022 03:23:13 - INFO - codeparrot_training - Step 38475: {'lr': 6.78138572811328e-05, 'samples': 19699712, 'steps': 38475, 'loss/train': 0.9680857062339783} +02/26/2022 03:23:16 - INFO - codeparrot_training - Step 38476: {'lr': 6.780265289278852e-05, 'samples': 19700224, 'steps': 38476, 'loss/train': 1.007615089416504} +02/26/2022 03:23:22 - INFO - codeparrot_training - Step 38477: {'lr': 6.779144928491979e-05, 'samples': 19700736, 'steps': 38477, 'loss/train': 0.8837943077087402} +02/26/2022 03:23:25 - INFO - codeparrot_training - Step 38478: {'lr': 6.778024645757469e-05, 'samples': 19701248, 'steps': 38478, 'loss/train': 2.108769655227661} +02/26/2022 03:23:31 - INFO - codeparrot_training - Step 38479: {'lr': 6.776904441080115e-05, 'samples': 19701760, 'steps': 38479, 'loss/train': 2.174123525619507} +02/26/2022 03:23:34 - INFO - codeparrot_training - Step 38480: {'lr': 6.775784314464717e-05, 'samples': 19702272, 'steps': 38480, 'loss/train': 1.1795350313186646} +02/26/2022 03:23:40 - INFO - codeparrot_training - Step 38481: {'lr': 6.774664265916064e-05, 'samples': 19702784, 'steps': 38481, 'loss/train': 2.4828836917877197} +02/26/2022 03:23:43 - INFO - codeparrot_training - Step 38482: {'lr': 6.773544295438968e-05, 'samples': 19703296, 'steps': 38482, 'loss/train': 1.465942621231079} +02/26/2022 03:23:49 - INFO - codeparrot_training - Step 38483: {'lr': 6.772424403038224e-05, 'samples': 19703808, 'steps': 38483, 'loss/train': 2.299922466278076} +02/26/2022 03:23:54 - INFO - codeparrot_training - Step 38484: {'lr': 6.771304588718624e-05, 'samples': 19704320, 'steps': 38484, 'loss/train': 0.9538729786872864} +02/26/2022 03:23:58 - INFO - codeparrot_training - Step 38485: {'lr': 6.77018485248496e-05, 'samples': 19704832, 'steps': 38485, 'loss/train': 0.2449597269296646} +02/26/2022 03:24:04 - INFO - codeparrot_training - Step 38486: {'lr': 6.769065194342042e-05, 'samples': 19705344, 'steps': 38486, 'loss/train': 0.9421229362487793} +02/26/2022 03:24:07 - INFO - codeparrot_training - Step 38487: {'lr': 6.76794561429466e-05, 'samples': 19705856, 'steps': 38487, 'loss/train': 1.514542579650879} +02/26/2022 03:24:13 - INFO - codeparrot_training - Step 38488: {'lr': 6.76682611234761e-05, 'samples': 19706368, 'steps': 38488, 'loss/train': 0.4306022524833679} +02/26/2022 03:24:17 - INFO - codeparrot_training - Step 38489: {'lr': 6.76570668850568e-05, 'samples': 19706880, 'steps': 38489, 'loss/train': 1.4481408596038818} +02/26/2022 03:24:20 - INFO - codeparrot_training - Step 38490: {'lr': 6.764587342773679e-05, 'samples': 19707392, 'steps': 38490, 'loss/train': 1.9651048183441162} +02/26/2022 03:24:26 - INFO - codeparrot_training - Step 38491: {'lr': 6.763468075156395e-05, 'samples': 19707904, 'steps': 38491, 'loss/train': 2.8414618968963623} +02/26/2022 03:24:29 - INFO - codeparrot_training - Step 38492: {'lr': 6.762348885658626e-05, 'samples': 19708416, 'steps': 38492, 'loss/train': 2.0153722763061523} +02/26/2022 03:24:34 - INFO - codeparrot_training - Step 38493: {'lr': 6.761229774285152e-05, 'samples': 19708928, 'steps': 38493, 'loss/train': 2.105882167816162} +02/26/2022 03:24:38 - INFO - codeparrot_training - Step 38494: {'lr': 6.760110741040787e-05, 'samples': 19709440, 'steps': 38494, 'loss/train': 2.6483542919158936} +02/26/2022 03:24:43 - INFO - codeparrot_training - Step 38495: {'lr': 6.758991785930319e-05, 'samples': 19709952, 'steps': 38495, 'loss/train': 2.1674225330352783} +02/26/2022 03:24:47 - INFO - codeparrot_training - Step 38496: {'lr': 6.757872908958535e-05, 'samples': 19710464, 'steps': 38496, 'loss/train': 0.3592943549156189} +02/26/2022 03:24:52 - INFO - codeparrot_training - Step 38497: {'lr': 6.756754110130223e-05, 'samples': 19710976, 'steps': 38497, 'loss/train': 1.817550539970398} +02/26/2022 03:24:56 - INFO - codeparrot_training - Step 38498: {'lr': 6.755635389450191e-05, 'samples': 19711488, 'steps': 38498, 'loss/train': 1.4259891510009766} +02/26/2022 03:25:02 - INFO - codeparrot_training - Step 38499: {'lr': 6.754516746923217e-05, 'samples': 19712000, 'steps': 38499, 'loss/train': 1.8990557193756104} +02/26/2022 03:25:06 - INFO - codeparrot_training - Step 38500: {'lr': 6.753398182554116e-05, 'samples': 19712512, 'steps': 38500, 'loss/train': 1.7087346315383911} +02/26/2022 03:25:11 - INFO - codeparrot_training - Step 38501: {'lr': 6.752279696347646e-05, 'samples': 19713024, 'steps': 38501, 'loss/train': 2.697360038757324} +02/26/2022 03:25:15 - INFO - codeparrot_training - Step 38502: {'lr': 6.751161288308624e-05, 'samples': 19713536, 'steps': 38502, 'loss/train': 2.1709935665130615} +02/26/2022 03:25:20 - INFO - codeparrot_training - Step 38503: {'lr': 6.750042958441824e-05, 'samples': 19714048, 'steps': 38503, 'loss/train': 1.0028451681137085} +02/26/2022 03:25:24 - INFO - codeparrot_training - Step 38504: {'lr': 6.748924706752061e-05, 'samples': 19714560, 'steps': 38504, 'loss/train': 2.146336793899536} +02/26/2022 03:25:29 - INFO - codeparrot_training - Step 38505: {'lr': 6.747806533244093e-05, 'samples': 19715072, 'steps': 38505, 'loss/train': 1.8683357238769531} +02/26/2022 03:25:33 - INFO - codeparrot_training - Step 38506: {'lr': 6.746688437922736e-05, 'samples': 19715584, 'steps': 38506, 'loss/train': 1.897711157798767} +02/26/2022 03:25:38 - INFO - codeparrot_training - Step 38507: {'lr': 6.74557042079276e-05, 'samples': 19716096, 'steps': 38507, 'loss/train': 1.9326940774917603} +02/26/2022 03:25:42 - INFO - codeparrot_training - Step 38508: {'lr': 6.744452481858979e-05, 'samples': 19716608, 'steps': 38508, 'loss/train': 1.3787177801132202} +02/26/2022 03:25:49 - INFO - codeparrot_training - Step 38509: {'lr': 6.743334621126151e-05, 'samples': 19717120, 'steps': 38509, 'loss/train': 2.2313151359558105} +02/26/2022 03:25:52 - INFO - codeparrot_training - Step 38510: {'lr': 6.742216838599091e-05, 'samples': 19717632, 'steps': 38510, 'loss/train': 0.6717408895492554} +02/26/2022 03:25:58 - INFO - codeparrot_training - Step 38511: {'lr': 6.741099134282567e-05, 'samples': 19718144, 'steps': 38511, 'loss/train': 1.9280356168746948} +02/26/2022 03:26:01 - INFO - codeparrot_training - Step 38512: {'lr': 6.739981508181383e-05, 'samples': 19718656, 'steps': 38512, 'loss/train': 1.2840335369110107} +02/26/2022 03:26:07 - INFO - codeparrot_training - Step 38513: {'lr': 6.738863960300324e-05, 'samples': 19719168, 'steps': 38513, 'loss/train': 1.8356081247329712} +02/26/2022 03:26:10 - INFO - codeparrot_training - Step 38514: {'lr': 6.73774649064417e-05, 'samples': 19719680, 'steps': 38514, 'loss/train': 1.203269124031067} +02/26/2022 03:26:16 - INFO - codeparrot_training - Step 38515: {'lr': 6.736629099217703e-05, 'samples': 19720192, 'steps': 38515, 'loss/train': 2.4249298572540283} +02/26/2022 03:26:19 - INFO - codeparrot_training - Step 38516: {'lr': 6.735511786025725e-05, 'samples': 19720704, 'steps': 38516, 'loss/train': 1.4649714231491089} +02/26/2022 03:26:25 - INFO - codeparrot_training - Step 38517: {'lr': 6.734394551073017e-05, 'samples': 19721216, 'steps': 38517, 'loss/train': 2.0018768310546875} +02/26/2022 03:26:28 - INFO - codeparrot_training - Step 38518: {'lr': 6.733277394364363e-05, 'samples': 19721728, 'steps': 38518, 'loss/train': 0.41589176654815674} +02/26/2022 03:26:34 - INFO - codeparrot_training - Step 38519: {'lr': 6.732160315904538e-05, 'samples': 19722240, 'steps': 38519, 'loss/train': 1.5262006521224976} +02/26/2022 03:26:40 - INFO - codeparrot_training - Step 38520: {'lr': 6.731043315698346e-05, 'samples': 19722752, 'steps': 38520, 'loss/train': 1.461841344833374} +02/26/2022 03:26:44 - INFO - codeparrot_training - Step 38521: {'lr': 6.729926393750566e-05, 'samples': 19723264, 'steps': 38521, 'loss/train': 1.5198719501495361} +02/26/2022 03:26:47 - INFO - codeparrot_training - Step 38522: {'lr': 6.728809550065976e-05, 'samples': 19723776, 'steps': 38522, 'loss/train': 0.3158608376979828} +02/26/2022 03:26:52 - INFO - codeparrot_training - Step 38523: {'lr': 6.727692784649367e-05, 'samples': 19724288, 'steps': 38523, 'loss/train': 1.0442678928375244} +02/26/2022 03:26:56 - INFO - codeparrot_training - Step 38524: {'lr': 6.72657609750551e-05, 'samples': 19724800, 'steps': 38524, 'loss/train': 1.4605982303619385} +02/26/2022 03:27:01 - INFO - codeparrot_training - Step 38525: {'lr': 6.72545948863921e-05, 'samples': 19725312, 'steps': 38525, 'loss/train': 2.4296481609344482} +02/26/2022 03:27:05 - INFO - codeparrot_training - Step 38526: {'lr': 6.724342958055236e-05, 'samples': 19725824, 'steps': 38526, 'loss/train': 1.6514232158660889} +02/26/2022 03:27:10 - INFO - codeparrot_training - Step 38527: {'lr': 6.723226505758373e-05, 'samples': 19726336, 'steps': 38527, 'loss/train': 2.0844454765319824} +02/26/2022 03:27:14 - INFO - codeparrot_training - Step 38528: {'lr': 6.722110131753398e-05, 'samples': 19726848, 'steps': 38528, 'loss/train': 1.9466315507888794} +02/26/2022 03:27:20 - INFO - codeparrot_training - Step 38529: {'lr': 6.720993836045105e-05, 'samples': 19727360, 'steps': 38529, 'loss/train': 1.6696027517318726} +02/26/2022 03:27:25 - INFO - codeparrot_training - Step 38530: {'lr': 6.719877618638273e-05, 'samples': 19727872, 'steps': 38530, 'loss/train': 0.8651958107948303} +02/26/2022 03:27:28 - INFO - codeparrot_training - Step 38531: {'lr': 6.71876147953768e-05, 'samples': 19728384, 'steps': 38531, 'loss/train': 1.2277593612670898} +02/26/2022 03:27:34 - INFO - codeparrot_training - Step 38532: {'lr': 6.717645418748097e-05, 'samples': 19728896, 'steps': 38532, 'loss/train': 2.0817205905914307} +02/26/2022 03:27:37 - INFO - codeparrot_training - Step 38533: {'lr': 6.716529436274327e-05, 'samples': 19729408, 'steps': 38533, 'loss/train': 1.5316346883773804} +02/26/2022 03:27:44 - INFO - codeparrot_training - Step 38534: {'lr': 6.715413532121131e-05, 'samples': 19729920, 'steps': 38534, 'loss/train': 0.212492898106575} +02/26/2022 03:27:47 - INFO - codeparrot_training - Step 38535: {'lr': 6.714297706293313e-05, 'samples': 19730432, 'steps': 38535, 'loss/train': 2.2703354358673096} +02/26/2022 03:27:52 - INFO - codeparrot_training - Step 38536: {'lr': 6.71318195879562e-05, 'samples': 19730944, 'steps': 38536, 'loss/train': 2.4443178176879883} +02/26/2022 03:27:56 - INFO - codeparrot_training - Step 38537: {'lr': 6.712066289632856e-05, 'samples': 19731456, 'steps': 38537, 'loss/train': 2.447617530822754} +02/26/2022 03:28:01 - INFO - codeparrot_training - Step 38538: {'lr': 6.710950698809789e-05, 'samples': 19731968, 'steps': 38538, 'loss/train': 1.8363568782806396} +02/26/2022 03:28:05 - INFO - codeparrot_training - Step 38539: {'lr': 6.709835186331214e-05, 'samples': 19732480, 'steps': 38539, 'loss/train': 2.056351900100708} +02/26/2022 03:28:11 - INFO - codeparrot_training - Step 38540: {'lr': 6.708719752201883e-05, 'samples': 19732992, 'steps': 38540, 'loss/train': 1.7019981145858765} +02/26/2022 03:28:14 - INFO - codeparrot_training - Step 38541: {'lr': 6.707604396426595e-05, 'samples': 19733504, 'steps': 38541, 'loss/train': 1.4125553369522095} +02/26/2022 03:28:19 - INFO - codeparrot_training - Step 38542: {'lr': 6.706489119010115e-05, 'samples': 19734016, 'steps': 38542, 'loss/train': 0.6963955163955688} +02/26/2022 03:28:23 - INFO - codeparrot_training - Step 38543: {'lr': 6.705373919957241e-05, 'samples': 19734528, 'steps': 38543, 'loss/train': 2.0790679454803467} +02/26/2022 03:28:29 - INFO - codeparrot_training - Step 38544: {'lr': 6.704258799272722e-05, 'samples': 19735040, 'steps': 38544, 'loss/train': 0.8199334144592285} +02/26/2022 03:28:33 - INFO - codeparrot_training - Step 38545: {'lr': 6.703143756961355e-05, 'samples': 19735552, 'steps': 38545, 'loss/train': 1.4792839288711548} +02/26/2022 03:28:38 - INFO - codeparrot_training - Step 38546: {'lr': 6.702028793027906e-05, 'samples': 19736064, 'steps': 38546, 'loss/train': 1.3455629348754883} +02/26/2022 03:28:42 - INFO - codeparrot_training - Step 38547: {'lr': 6.70091390747716e-05, 'samples': 19736576, 'steps': 38547, 'loss/train': 0.7645719051361084} +02/26/2022 03:28:47 - INFO - codeparrot_training - Step 38548: {'lr': 6.699799100313888e-05, 'samples': 19737088, 'steps': 38548, 'loss/train': 1.2810925245285034} +02/26/2022 03:28:51 - INFO - codeparrot_training - Step 38549: {'lr': 6.698684371542866e-05, 'samples': 19737600, 'steps': 38549, 'loss/train': 1.9323935508728027} +02/26/2022 03:28:56 - INFO - codeparrot_training - Step 38550: {'lr': 6.697569721168861e-05, 'samples': 19738112, 'steps': 38550, 'loss/train': 1.6603186130523682} +02/26/2022 03:29:00 - INFO - codeparrot_training - Step 38551: {'lr': 6.696455149196664e-05, 'samples': 19738624, 'steps': 38551, 'loss/train': 2.3496146202087402} +02/26/2022 03:29:05 - INFO - codeparrot_training - Step 38552: {'lr': 6.695340655631041e-05, 'samples': 19739136, 'steps': 38552, 'loss/train': 1.5190728902816772} +02/26/2022 03:29:09 - INFO - codeparrot_training - Step 38553: {'lr': 6.694226240476767e-05, 'samples': 19739648, 'steps': 38553, 'loss/train': 1.7923954725265503} +02/26/2022 03:29:15 - INFO - codeparrot_training - Step 38554: {'lr': 6.693111903738605e-05, 'samples': 19740160, 'steps': 38554, 'loss/train': 0.9450716376304626} +02/26/2022 03:29:18 - INFO - codeparrot_training - Step 38555: {'lr': 6.691997645421347e-05, 'samples': 19740672, 'steps': 38555, 'loss/train': 1.521878719329834} +02/26/2022 03:29:24 - INFO - codeparrot_training - Step 38556: {'lr': 6.69088346552976e-05, 'samples': 19741184, 'steps': 38556, 'loss/train': 1.3934801816940308} +02/26/2022 03:29:27 - INFO - codeparrot_training - Step 38557: {'lr': 6.689769364068613e-05, 'samples': 19741696, 'steps': 38557, 'loss/train': 1.8056319952011108} +02/26/2022 03:29:33 - INFO - codeparrot_training - Step 38558: {'lr': 6.68865534104267e-05, 'samples': 19742208, 'steps': 38558, 'loss/train': 2.134234666824341} +02/26/2022 03:29:36 - INFO - codeparrot_training - Step 38559: {'lr': 6.687541396456723e-05, 'samples': 19742720, 'steps': 38559, 'loss/train': 2.627307653427124} +02/26/2022 03:29:42 - INFO - codeparrot_training - Step 38560: {'lr': 6.686427530315534e-05, 'samples': 19743232, 'steps': 38560, 'loss/train': 1.8709713220596313} +02/26/2022 03:29:45 - INFO - codeparrot_training - Step 38561: {'lr': 6.685313742623872e-05, 'samples': 19743744, 'steps': 38561, 'loss/train': 2.4307448863983154} +02/26/2022 03:29:51 - INFO - codeparrot_training - Step 38562: {'lr': 6.684200033386506e-05, 'samples': 19744256, 'steps': 38562, 'loss/train': 1.7083773612976074} +02/26/2022 03:29:54 - INFO - codeparrot_training - Step 38563: {'lr': 6.683086402608215e-05, 'samples': 19744768, 'steps': 38563, 'loss/train': 0.7015232443809509} +02/26/2022 03:30:01 - INFO - codeparrot_training - Step 38564: {'lr': 6.681972850293769e-05, 'samples': 19745280, 'steps': 38564, 'loss/train': 1.6064817905426025} +02/26/2022 03:30:04 - INFO - codeparrot_training - Step 38565: {'lr': 6.680859376447934e-05, 'samples': 19745792, 'steps': 38565, 'loss/train': 2.768766403198242} +02/26/2022 03:30:10 - INFO - codeparrot_training - Step 38566: {'lr': 6.679745981075472e-05, 'samples': 19746304, 'steps': 38566, 'loss/train': 1.3902474641799927} +02/26/2022 03:30:13 - INFO - codeparrot_training - Step 38567: {'lr': 6.67863266418117e-05, 'samples': 19746816, 'steps': 38567, 'loss/train': 1.518554925918579} +02/26/2022 03:30:19 - INFO - codeparrot_training - Step 38568: {'lr': 6.677519425769784e-05, 'samples': 19747328, 'steps': 38568, 'loss/train': 2.504375696182251} +02/26/2022 03:30:22 - INFO - codeparrot_training - Step 38569: {'lr': 6.676406265846083e-05, 'samples': 19747840, 'steps': 38569, 'loss/train': 1.2691808938980103} +02/26/2022 03:30:28 - INFO - codeparrot_training - Step 38570: {'lr': 6.675293184414846e-05, 'samples': 19748352, 'steps': 38570, 'loss/train': 1.733219861984253} +02/26/2022 03:30:31 - INFO - codeparrot_training - Step 38571: {'lr': 6.674180181480835e-05, 'samples': 19748864, 'steps': 38571, 'loss/train': 1.622839331626892} +02/26/2022 03:30:37 - INFO - codeparrot_training - Step 38572: {'lr': 6.673067257048815e-05, 'samples': 19749376, 'steps': 38572, 'loss/train': 1.3758234977722168} +02/26/2022 03:30:40 - INFO - codeparrot_training - Step 38573: {'lr': 6.671954411123549e-05, 'samples': 19749888, 'steps': 38573, 'loss/train': 1.2200340032577515} +02/26/2022 03:30:46 - INFO - codeparrot_training - Step 38574: {'lr': 6.670841643709824e-05, 'samples': 19750400, 'steps': 38574, 'loss/train': 1.8557848930358887} +02/26/2022 03:30:49 - INFO - codeparrot_training - Step 38575: {'lr': 6.669728954812379e-05, 'samples': 19750912, 'steps': 38575, 'loss/train': 1.7742339372634888} +02/26/2022 03:30:55 - INFO - codeparrot_training - Step 38576: {'lr': 6.668616344436005e-05, 'samples': 19751424, 'steps': 38576, 'loss/train': 0.9452046751976013} +02/26/2022 03:30:58 - INFO - codeparrot_training - Step 38577: {'lr': 6.667503812585446e-05, 'samples': 19751936, 'steps': 38577, 'loss/train': 1.2546623945236206} +02/26/2022 03:31:04 - INFO - codeparrot_training - Step 38578: {'lr': 6.666391359265497e-05, 'samples': 19752448, 'steps': 38578, 'loss/train': 2.090447187423706} +02/26/2022 03:31:07 - INFO - codeparrot_training - Step 38579: {'lr': 6.665278984480889e-05, 'samples': 19752960, 'steps': 38579, 'loss/train': 2.8809638023376465} +02/26/2022 03:31:13 - INFO - codeparrot_training - Step 38580: {'lr': 6.664166688236411e-05, 'samples': 19753472, 'steps': 38580, 'loss/train': 1.667805790901184} +02/26/2022 03:31:17 - INFO - codeparrot_training - Step 38581: {'lr': 6.663054470536816e-05, 'samples': 19753984, 'steps': 38581, 'loss/train': 1.2165825366973877} +02/26/2022 03:31:22 - INFO - codeparrot_training - Step 38582: {'lr': 6.66194233138688e-05, 'samples': 19754496, 'steps': 38582, 'loss/train': 2.2430546283721924} +02/26/2022 03:31:26 - INFO - codeparrot_training - Step 38583: {'lr': 6.66083027079136e-05, 'samples': 19755008, 'steps': 38583, 'loss/train': 0.7722062468528748} +02/26/2022 03:31:31 - INFO - codeparrot_training - Step 38584: {'lr': 6.659718288755018e-05, 'samples': 19755520, 'steps': 38584, 'loss/train': 1.7943100929260254} +02/26/2022 03:31:35 - INFO - codeparrot_training - Step 38585: {'lr': 6.658606385282612e-05, 'samples': 19756032, 'steps': 38585, 'loss/train': 1.3602079153060913} +02/26/2022 03:31:40 - INFO - codeparrot_training - Step 38586: {'lr': 6.657494560378922e-05, 'samples': 19756544, 'steps': 38586, 'loss/train': 1.8367716073989868} +02/26/2022 03:31:46 - INFO - codeparrot_training - Step 38587: {'lr': 6.656382814048698e-05, 'samples': 19757056, 'steps': 38587, 'loss/train': 1.418237566947937} +02/26/2022 03:31:49 - INFO - codeparrot_training - Step 38588: {'lr': 6.655271146296707e-05, 'samples': 19757568, 'steps': 38588, 'loss/train': 2.427154779434204} +02/26/2022 03:31:56 - INFO - codeparrot_training - Step 38589: {'lr': 6.654159557127701e-05, 'samples': 19758080, 'steps': 38589, 'loss/train': 0.9327219724655151} +02/26/2022 03:31:59 - INFO - codeparrot_training - Step 38590: {'lr': 6.653048046546456e-05, 'samples': 19758592, 'steps': 38590, 'loss/train': 1.7165138721466064} +02/26/2022 03:32:05 - INFO - codeparrot_training - Step 38591: {'lr': 6.65193661455773e-05, 'samples': 19759104, 'steps': 38591, 'loss/train': 2.1705565452575684} +02/26/2022 03:32:08 - INFO - codeparrot_training - Step 38592: {'lr': 6.650825261166282e-05, 'samples': 19759616, 'steps': 38592, 'loss/train': 1.8768551349639893} +02/26/2022 03:32:14 - INFO - codeparrot_training - Step 38593: {'lr': 6.649713986376862e-05, 'samples': 19760128, 'steps': 38593, 'loss/train': 1.4631894826889038} +02/26/2022 03:32:17 - INFO - codeparrot_training - Step 38594: {'lr': 6.64860279019425e-05, 'samples': 19760640, 'steps': 38594, 'loss/train': 2.925553560256958} +02/26/2022 03:32:23 - INFO - codeparrot_training - Step 38595: {'lr': 6.647491672623187e-05, 'samples': 19761152, 'steps': 38595, 'loss/train': 0.7812713980674744} +02/26/2022 03:32:26 - INFO - codeparrot_training - Step 38596: {'lr': 6.646380633668459e-05, 'samples': 19761664, 'steps': 38596, 'loss/train': 1.0813846588134766} +02/26/2022 03:32:32 - INFO - codeparrot_training - Step 38597: {'lr': 6.645269673334792e-05, 'samples': 19762176, 'steps': 38597, 'loss/train': 2.621788740158081} +02/26/2022 03:32:35 - INFO - codeparrot_training - Step 38598: {'lr': 6.64415879162697e-05, 'samples': 19762688, 'steps': 38598, 'loss/train': 1.9680814743041992} +02/26/2022 03:32:41 - INFO - codeparrot_training - Step 38599: {'lr': 6.643047988549733e-05, 'samples': 19763200, 'steps': 38599, 'loss/train': 1.3169771432876587} +02/26/2022 03:32:44 - INFO - codeparrot_training - Step 38600: {'lr': 6.641937264107867e-05, 'samples': 19763712, 'steps': 38600, 'loss/train': 3.1705527305603027} +02/26/2022 03:32:50 - INFO - codeparrot_training - Step 38601: {'lr': 6.640826618306098e-05, 'samples': 19764224, 'steps': 38601, 'loss/train': 1.2211713790893555} +02/26/2022 03:32:54 - INFO - codeparrot_training - Step 38602: {'lr': 6.639716051149203e-05, 'samples': 19764736, 'steps': 38602, 'loss/train': 1.803682565689087} +02/26/2022 03:32:59 - INFO - codeparrot_training - Step 38603: {'lr': 6.638605562641928e-05, 'samples': 19765248, 'steps': 38603, 'loss/train': 2.1569159030914307} +02/26/2022 03:33:03 - INFO - codeparrot_training - Step 38604: {'lr': 6.637495152789052e-05, 'samples': 19765760, 'steps': 38604, 'loss/train': 1.285002589225769} +02/26/2022 03:33:08 - INFO - codeparrot_training - Step 38605: {'lr': 6.636384821595302e-05, 'samples': 19766272, 'steps': 38605, 'loss/train': 1.8323359489440918} +02/26/2022 03:33:12 - INFO - codeparrot_training - Step 38606: {'lr': 6.635274569065452e-05, 'samples': 19766784, 'steps': 38606, 'loss/train': 1.6491860151290894} +02/26/2022 03:33:17 - INFO - codeparrot_training - Step 38607: {'lr': 6.634164395204259e-05, 'samples': 19767296, 'steps': 38607, 'loss/train': 2.204594373703003} +02/26/2022 03:33:21 - INFO - codeparrot_training - Step 38608: {'lr': 6.633054300016465e-05, 'samples': 19767808, 'steps': 38608, 'loss/train': 1.0186845064163208} +02/26/2022 03:33:26 - INFO - codeparrot_training - Step 38609: {'lr': 6.631944283506838e-05, 'samples': 19768320, 'steps': 38609, 'loss/train': 0.9944896101951599} +02/26/2022 03:33:30 - INFO - codeparrot_training - Step 38610: {'lr': 6.630834345680135e-05, 'samples': 19768832, 'steps': 38610, 'loss/train': 1.1949081420898438} +02/26/2022 03:33:36 - INFO - codeparrot_training - Step 38611: {'lr': 6.6297244865411e-05, 'samples': 19769344, 'steps': 38611, 'loss/train': 2.241675853729248} +02/26/2022 03:33:39 - INFO - codeparrot_training - Step 38612: {'lr': 6.628614706094488e-05, 'samples': 19769856, 'steps': 38612, 'loss/train': 1.6453428268432617} +02/26/2022 03:33:45 - INFO - codeparrot_training - Step 38613: {'lr': 6.627505004345061e-05, 'samples': 19770368, 'steps': 38613, 'loss/train': 0.45854154229164124} +02/26/2022 03:33:48 - INFO - codeparrot_training - Step 38614: {'lr': 6.62639538129757e-05, 'samples': 19770880, 'steps': 38614, 'loss/train': 1.6465308666229248} +02/26/2022 03:33:52 - INFO - codeparrot_training - Step 38615: {'lr': 6.625285836956769e-05, 'samples': 19771392, 'steps': 38615, 'loss/train': 1.4277374744415283} +02/26/2022 03:33:58 - INFO - codeparrot_training - Step 38616: {'lr': 6.624176371327401e-05, 'samples': 19771904, 'steps': 38616, 'loss/train': 1.0375969409942627} +02/26/2022 03:34:03 - INFO - codeparrot_training - Step 38617: {'lr': 6.62306698441423e-05, 'samples': 19772416, 'steps': 38617, 'loss/train': 1.7115790843963623} +02/26/2022 03:34:07 - INFO - codeparrot_training - Step 38618: {'lr': 6.62195767622201e-05, 'samples': 19772928, 'steps': 38618, 'loss/train': 2.1650514602661133} +02/26/2022 03:34:12 - INFO - codeparrot_training - Step 38619: {'lr': 6.620848446755485e-05, 'samples': 19773440, 'steps': 38619, 'loss/train': 1.8237920999526978} +02/26/2022 03:34:16 - INFO - codeparrot_training - Step 38620: {'lr': 6.6197392960194e-05, 'samples': 19773952, 'steps': 38620, 'loss/train': 0.21208587288856506} +02/26/2022 03:34:21 - INFO - codeparrot_training - Step 38621: {'lr': 6.618630224018526e-05, 'samples': 19774464, 'steps': 38621, 'loss/train': 1.5871200561523438} +02/26/2022 03:34:25 - INFO - codeparrot_training - Step 38622: {'lr': 6.617521230757603e-05, 'samples': 19774976, 'steps': 38622, 'loss/train': 2.3343801498413086} +02/26/2022 03:34:30 - INFO - codeparrot_training - Step 38623: {'lr': 6.616412316241379e-05, 'samples': 19775488, 'steps': 38623, 'loss/train': 1.4226933717727661} +02/26/2022 03:34:34 - INFO - codeparrot_training - Step 38624: {'lr': 6.615303480474601e-05, 'samples': 19776000, 'steps': 38624, 'loss/train': 1.3573405742645264} +02/26/2022 03:34:39 - INFO - codeparrot_training - Step 38625: {'lr': 6.614194723462036e-05, 'samples': 19776512, 'steps': 38625, 'loss/train': 2.7144830226898193} +02/26/2022 03:34:43 - INFO - codeparrot_training - Step 38626: {'lr': 6.61308604520842e-05, 'samples': 19777024, 'steps': 38626, 'loss/train': 0.4123234152793884} +02/26/2022 03:34:49 - INFO - codeparrot_training - Step 38627: {'lr': 6.611977445718504e-05, 'samples': 19777536, 'steps': 38627, 'loss/train': 1.7759041786193848} +02/26/2022 03:34:52 - INFO - codeparrot_training - Step 38628: {'lr': 6.610868924997033e-05, 'samples': 19778048, 'steps': 38628, 'loss/train': 2.022170305252075} +02/26/2022 03:34:58 - INFO - codeparrot_training - Step 38629: {'lr': 6.609760483048766e-05, 'samples': 19778560, 'steps': 38629, 'loss/train': 2.1668646335601807} +02/26/2022 03:35:01 - INFO - codeparrot_training - Step 38630: {'lr': 6.608652119878436e-05, 'samples': 19779072, 'steps': 38630, 'loss/train': 1.4865700006484985} +02/26/2022 03:35:07 - INFO - codeparrot_training - Step 38631: {'lr': 6.607543835490818e-05, 'samples': 19779584, 'steps': 38631, 'loss/train': 2.052323818206787} +02/26/2022 03:35:10 - INFO - codeparrot_training - Step 38632: {'lr': 6.606435629890628e-05, 'samples': 19780096, 'steps': 38632, 'loss/train': 1.1872520446777344} +02/26/2022 03:35:16 - INFO - codeparrot_training - Step 38633: {'lr': 6.60532750308263e-05, 'samples': 19780608, 'steps': 38633, 'loss/train': 1.5328195095062256} +02/26/2022 03:35:19 - INFO - codeparrot_training - Step 38634: {'lr': 6.604219455071567e-05, 'samples': 19781120, 'steps': 38634, 'loss/train': 2.6282432079315186} +02/26/2022 03:35:25 - INFO - codeparrot_training - Step 38635: {'lr': 6.603111485862195e-05, 'samples': 19781632, 'steps': 38635, 'loss/train': 1.7048457860946655} +02/26/2022 03:35:28 - INFO - codeparrot_training - Step 38636: {'lr': 6.60200359545924e-05, 'samples': 19782144, 'steps': 38636, 'loss/train': 1.3628875017166138} +02/26/2022 03:35:35 - INFO - codeparrot_training - Step 38637: {'lr': 6.600895783867469e-05, 'samples': 19782656, 'steps': 38637, 'loss/train': 1.6989284753799438} +02/26/2022 03:35:38 - INFO - codeparrot_training - Step 38638: {'lr': 6.599788051091606e-05, 'samples': 19783168, 'steps': 38638, 'loss/train': 1.4103751182556152} +02/26/2022 03:35:43 - INFO - codeparrot_training - Step 38639: {'lr': 6.598680397136428e-05, 'samples': 19783680, 'steps': 38639, 'loss/train': 1.1829496622085571} +02/26/2022 03:35:47 - INFO - codeparrot_training - Step 38640: {'lr': 6.597572822006642e-05, 'samples': 19784192, 'steps': 38640, 'loss/train': 0.5303569436073303} +02/26/2022 03:35:52 - INFO - codeparrot_training - Step 38641: {'lr': 6.596465325707019e-05, 'samples': 19784704, 'steps': 38641, 'loss/train': 0.8118969202041626} +02/26/2022 03:35:56 - INFO - codeparrot_training - Step 38642: {'lr': 6.595357908242289e-05, 'samples': 19785216, 'steps': 38642, 'loss/train': 1.6326771974563599} +02/26/2022 03:36:02 - INFO - codeparrot_training - Step 38643: {'lr': 6.594250569617204e-05, 'samples': 19785728, 'steps': 38643, 'loss/train': 2.5719337463378906} +02/26/2022 03:36:05 - INFO - codeparrot_training - Step 38644: {'lr': 6.59314330983651e-05, 'samples': 19786240, 'steps': 38644, 'loss/train': 0.7581230401992798} +02/26/2022 03:36:11 - INFO - codeparrot_training - Step 38645: {'lr': 6.592036128904944e-05, 'samples': 19786752, 'steps': 38645, 'loss/train': 0.7914933562278748} +02/26/2022 03:36:14 - INFO - codeparrot_training - Step 38646: {'lr': 6.590929026827241e-05, 'samples': 19787264, 'steps': 38646, 'loss/train': 1.3831466436386108} +02/26/2022 03:36:21 - INFO - codeparrot_training - Step 38647: {'lr': 6.589822003608162e-05, 'samples': 19787776, 'steps': 38647, 'loss/train': 2.1867780685424805} +02/26/2022 03:36:24 - INFO - codeparrot_training - Step 38648: {'lr': 6.58871505925244e-05, 'samples': 19788288, 'steps': 38648, 'loss/train': 2.6343843936920166} +02/26/2022 03:36:30 - INFO - codeparrot_training - Step 38649: {'lr': 6.587608193764816e-05, 'samples': 19788800, 'steps': 38649, 'loss/train': 3.540714740753174} +02/26/2022 03:36:33 - INFO - codeparrot_training - Step 38650: {'lr': 6.586501407150022e-05, 'samples': 19789312, 'steps': 38650, 'loss/train': 0.4508006274700165} +02/26/2022 03:36:39 - INFO - codeparrot_training - Step 38651: {'lr': 6.58539469941282e-05, 'samples': 19789824, 'steps': 38651, 'loss/train': 2.018789052963257} +02/26/2022 03:36:42 - INFO - codeparrot_training - Step 38652: {'lr': 6.584288070557937e-05, 'samples': 19790336, 'steps': 38652, 'loss/train': 3.4998269081115723} +02/26/2022 03:36:48 - INFO - codeparrot_training - Step 38653: {'lr': 6.583181520590117e-05, 'samples': 19790848, 'steps': 38653, 'loss/train': 1.9903764724731445} +02/26/2022 03:36:52 - INFO - codeparrot_training - Step 38654: {'lr': 6.5820750495141e-05, 'samples': 19791360, 'steps': 38654, 'loss/train': 1.8902126550674438} +02/26/2022 03:36:57 - INFO - codeparrot_training - Step 38655: {'lr': 6.580968657334616e-05, 'samples': 19791872, 'steps': 38655, 'loss/train': 2.3107526302337646} +02/26/2022 03:37:01 - INFO - codeparrot_training - Step 38656: {'lr': 6.579862344056422e-05, 'samples': 19792384, 'steps': 38656, 'loss/train': 1.2620282173156738} +02/26/2022 03:37:07 - INFO - codeparrot_training - Step 38657: {'lr': 6.57875610968425e-05, 'samples': 19792896, 'steps': 38657, 'loss/train': 2.3737082481384277} +02/26/2022 03:37:10 - INFO - codeparrot_training - Step 38658: {'lr': 6.577649954222836e-05, 'samples': 19793408, 'steps': 38658, 'loss/train': 1.1538290977478027} +02/26/2022 03:37:16 - INFO - codeparrot_training - Step 38659: {'lr': 6.576543877676913e-05, 'samples': 19793920, 'steps': 38659, 'loss/train': 1.7753148078918457} +02/26/2022 03:37:19 - INFO - codeparrot_training - Step 38660: {'lr': 6.575437880051233e-05, 'samples': 19794432, 'steps': 38660, 'loss/train': 1.6466093063354492} +02/26/2022 03:37:25 - INFO - codeparrot_training - Step 38661: {'lr': 6.574331961350527e-05, 'samples': 19794944, 'steps': 38661, 'loss/train': 2.5419349670410156} +02/26/2022 03:37:28 - INFO - codeparrot_training - Step 38662: {'lr': 6.573226121579532e-05, 'samples': 19795456, 'steps': 38662, 'loss/train': 0.5497141480445862} +02/26/2022 03:37:36 - INFO - codeparrot_training - Step 38663: {'lr': 6.572120360742977e-05, 'samples': 19795968, 'steps': 38663, 'loss/train': 1.6821372509002686} +02/26/2022 03:37:40 - INFO - codeparrot_training - Step 38664: {'lr': 6.571014678845617e-05, 'samples': 19796480, 'steps': 38664, 'loss/train': 2.0252134799957275} +02/26/2022 03:37:45 - INFO - codeparrot_training - Step 38665: {'lr': 6.569909075892175e-05, 'samples': 19796992, 'steps': 38665, 'loss/train': 1.8512320518493652} +02/26/2022 03:37:49 - INFO - codeparrot_training - Step 38666: {'lr': 6.568803551887392e-05, 'samples': 19797504, 'steps': 38666, 'loss/train': 1.83315110206604} +02/26/2022 03:37:54 - INFO - codeparrot_training - Step 38667: {'lr': 6.567698106835992e-05, 'samples': 19798016, 'steps': 38667, 'loss/train': 1.727878451347351} +02/26/2022 03:37:58 - INFO - codeparrot_training - Step 38668: {'lr': 6.566592740742733e-05, 'samples': 19798528, 'steps': 38668, 'loss/train': 1.367841124534607} +02/26/2022 03:38:03 - INFO - codeparrot_training - Step 38669: {'lr': 6.565487453612327e-05, 'samples': 19799040, 'steps': 38669, 'loss/train': 1.0969486236572266} +02/26/2022 03:38:07 - INFO - codeparrot_training - Step 38670: {'lr': 6.564382245449532e-05, 'samples': 19799552, 'steps': 38670, 'loss/train': 2.2816412448883057} +02/26/2022 03:38:12 - INFO - codeparrot_training - Step 38671: {'lr': 6.563277116259056e-05, 'samples': 19800064, 'steps': 38671, 'loss/train': 1.8742378950119019} +02/26/2022 03:38:16 - INFO - codeparrot_training - Step 38672: {'lr': 6.562172066045655e-05, 'samples': 19800576, 'steps': 38672, 'loss/train': 0.9214587807655334} +02/26/2022 03:38:23 - INFO - codeparrot_training - Step 38673: {'lr': 6.561067094814046e-05, 'samples': 19801088, 'steps': 38673, 'loss/train': 1.4929498434066772} +02/26/2022 03:38:27 - INFO - codeparrot_training - Step 38674: {'lr': 6.559962202568986e-05, 'samples': 19801600, 'steps': 38674, 'loss/train': 1.0426241159439087} +02/26/2022 03:38:32 - INFO - codeparrot_training - Step 38675: {'lr': 6.558857389315179e-05, 'samples': 19802112, 'steps': 38675, 'loss/train': 1.5233253240585327} +02/26/2022 03:38:36 - INFO - codeparrot_training - Step 38676: {'lr': 6.557752655057376e-05, 'samples': 19802624, 'steps': 38676, 'loss/train': 2.088609457015991} +02/26/2022 03:38:41 - INFO - codeparrot_training - Step 38677: {'lr': 6.556647999800298e-05, 'samples': 19803136, 'steps': 38677, 'loss/train': 2.1287267208099365} +02/26/2022 03:38:45 - INFO - codeparrot_training - Step 38678: {'lr': 6.55554342354869e-05, 'samples': 19803648, 'steps': 38678, 'loss/train': 1.4118505716323853} +02/26/2022 03:38:50 - INFO - codeparrot_training - Step 38679: {'lr': 6.554438926307279e-05, 'samples': 19804160, 'steps': 38679, 'loss/train': 2.1947858333587646} +02/26/2022 03:38:54 - INFO - codeparrot_training - Step 38680: {'lr': 6.553334508080793e-05, 'samples': 19804672, 'steps': 38680, 'loss/train': 1.3291409015655518} +02/26/2022 03:38:59 - INFO - codeparrot_training - Step 38681: {'lr': 6.55223016887396e-05, 'samples': 19805184, 'steps': 38681, 'loss/train': 1.111159086227417} +02/26/2022 03:39:03 - INFO - codeparrot_training - Step 38682: {'lr': 6.551125908691519e-05, 'samples': 19805696, 'steps': 38682, 'loss/train': 1.48469078540802} +02/26/2022 03:39:10 - INFO - codeparrot_training - Step 38683: {'lr': 6.550021727538196e-05, 'samples': 19806208, 'steps': 38683, 'loss/train': 1.2997806072235107} +02/26/2022 03:39:13 - INFO - codeparrot_training - Step 38684: {'lr': 6.548917625418727e-05, 'samples': 19806720, 'steps': 38684, 'loss/train': 1.4496510028839111} +02/26/2022 03:39:19 - INFO - codeparrot_training - Step 38685: {'lr': 6.547813602337824e-05, 'samples': 19807232, 'steps': 38685, 'loss/train': 2.0880749225616455} +02/26/2022 03:39:23 - INFO - codeparrot_training - Step 38686: {'lr': 6.546709658300234e-05, 'samples': 19807744, 'steps': 38686, 'loss/train': 1.9977792501449585} +02/26/2022 03:39:28 - INFO - codeparrot_training - Step 38687: {'lr': 6.545605793310686e-05, 'samples': 19808256, 'steps': 38687, 'loss/train': 2.467320680618286} +02/26/2022 03:39:31 - INFO - codeparrot_training - Step 38688: {'lr': 6.544502007373898e-05, 'samples': 19808768, 'steps': 38688, 'loss/train': 3.4030721187591553} +02/26/2022 03:39:37 - INFO - codeparrot_training - Step 38689: {'lr': 6.543398300494597e-05, 'samples': 19809280, 'steps': 38689, 'loss/train': 0.6142285466194153} +02/26/2022 03:39:41 - INFO - codeparrot_training - Step 38690: {'lr': 6.542294672677526e-05, 'samples': 19809792, 'steps': 38690, 'loss/train': 2.4969725608825684} +02/26/2022 03:39:46 - INFO - codeparrot_training - Step 38691: {'lr': 6.541191123927401e-05, 'samples': 19810304, 'steps': 38691, 'loss/train': 1.7564287185668945} +02/26/2022 03:39:50 - INFO - codeparrot_training - Step 38692: {'lr': 6.540087654248956e-05, 'samples': 19810816, 'steps': 38692, 'loss/train': 2.1521451473236084} +02/26/2022 03:39:57 - INFO - codeparrot_training - Step 38693: {'lr': 6.538984263646902e-05, 'samples': 19811328, 'steps': 38693, 'loss/train': 1.4548927545547485} +02/26/2022 03:40:00 - INFO - codeparrot_training - Step 38694: {'lr': 6.537880952125985e-05, 'samples': 19811840, 'steps': 38694, 'loss/train': 1.353824496269226} +02/26/2022 03:40:06 - INFO - codeparrot_training - Step 38695: {'lr': 6.536777719690926e-05, 'samples': 19812352, 'steps': 38695, 'loss/train': 2.5916013717651367} +02/26/2022 03:40:09 - INFO - codeparrot_training - Step 38696: {'lr': 6.535674566346448e-05, 'samples': 19812864, 'steps': 38696, 'loss/train': 0.9589845538139343} +02/26/2022 03:40:15 - INFO - codeparrot_training - Step 38697: {'lr': 6.534571492097269e-05, 'samples': 19813376, 'steps': 38697, 'loss/train': 1.6400796175003052} +02/26/2022 03:40:18 - INFO - codeparrot_training - Step 38698: {'lr': 6.53346849694813e-05, 'samples': 19813888, 'steps': 38698, 'loss/train': 2.89313006401062} +02/26/2022 03:40:24 - INFO - codeparrot_training - Step 38699: {'lr': 6.532365580903748e-05, 'samples': 19814400, 'steps': 38699, 'loss/train': 2.332109212875366} +02/26/2022 03:40:27 - INFO - codeparrot_training - Step 38700: {'lr': 6.531262743968849e-05, 'samples': 19814912, 'steps': 38700, 'loss/train': 1.483180284500122} +02/26/2022 03:40:33 - INFO - codeparrot_training - Step 38701: {'lr': 6.530159986148154e-05, 'samples': 19815424, 'steps': 38701, 'loss/train': 0.9306517243385315} +02/26/2022 03:40:36 - INFO - codeparrot_training - Step 38702: {'lr': 6.529057307446381e-05, 'samples': 19815936, 'steps': 38702, 'loss/train': 2.1577022075653076} +02/26/2022 03:40:42 - INFO - codeparrot_training - Step 38703: {'lr': 6.527954707868273e-05, 'samples': 19816448, 'steps': 38703, 'loss/train': 1.1545403003692627} +02/26/2022 03:40:45 - INFO - codeparrot_training - Step 38704: {'lr': 6.52685218741853e-05, 'samples': 19816960, 'steps': 38704, 'loss/train': 2.672415018081665} +02/26/2022 03:40:51 - INFO - codeparrot_training - Step 38705: {'lr': 6.525749746101902e-05, 'samples': 19817472, 'steps': 38705, 'loss/train': 1.1697603464126587} +02/26/2022 03:40:56 - INFO - codeparrot_training - Step 38706: {'lr': 6.52464738392308e-05, 'samples': 19817984, 'steps': 38706, 'loss/train': 2.028974771499634} +02/26/2022 03:41:00 - INFO - codeparrot_training - Step 38707: {'lr': 6.52354510088681e-05, 'samples': 19818496, 'steps': 38707, 'loss/train': 2.1986300945281982} +02/26/2022 03:41:07 - INFO - codeparrot_training - Step 38708: {'lr': 6.522442896997801e-05, 'samples': 19819008, 'steps': 38708, 'loss/train': 1.463073492050171} +02/26/2022 03:41:11 - INFO - codeparrot_training - Step 38709: {'lr': 6.521340772260791e-05, 'samples': 19819520, 'steps': 38709, 'loss/train': 1.7746306657791138} +02/26/2022 03:41:16 - INFO - codeparrot_training - Step 38710: {'lr': 6.520238726680477e-05, 'samples': 19820032, 'steps': 38710, 'loss/train': 1.5199174880981445} +02/26/2022 03:41:20 - INFO - codeparrot_training - Step 38711: {'lr': 6.519136760261598e-05, 'samples': 19820544, 'steps': 38711, 'loss/train': 1.934628963470459} +02/26/2022 03:41:25 - INFO - codeparrot_training - Step 38712: {'lr': 6.518034873008863e-05, 'samples': 19821056, 'steps': 38712, 'loss/train': 3.012913942337036} +02/26/2022 03:41:29 - INFO - codeparrot_training - Step 38713: {'lr': 6.516933064927012e-05, 'samples': 19821568, 'steps': 38713, 'loss/train': 2.005026340484619} +02/26/2022 03:41:34 - INFO - codeparrot_training - Step 38714: {'lr': 6.515831336020736e-05, 'samples': 19822080, 'steps': 38714, 'loss/train': 1.9883646965026855} +02/26/2022 03:41:37 - INFO - codeparrot_training - Step 38715: {'lr': 6.514729686294776e-05, 'samples': 19822592, 'steps': 38715, 'loss/train': 1.7896002531051636} +02/26/2022 03:41:43 - INFO - codeparrot_training - Step 38716: {'lr': 6.513628115753837e-05, 'samples': 19823104, 'steps': 38716, 'loss/train': 0.18262216448783875} +02/26/2022 03:41:46 - INFO - codeparrot_training - Step 38717: {'lr': 6.512526624402651e-05, 'samples': 19823616, 'steps': 38717, 'loss/train': 1.976986050605774} +02/26/2022 03:41:54 - INFO - codeparrot_training - Step 38718: {'lr': 6.511425212245933e-05, 'samples': 19824128, 'steps': 38718, 'loss/train': 2.043869733810425} +02/26/2022 03:41:58 - INFO - codeparrot_training - Step 38719: {'lr': 6.510323879288399e-05, 'samples': 19824640, 'steps': 38719, 'loss/train': 1.5984045267105103} +02/26/2022 03:42:01 - INFO - codeparrot_training - Step 38720: {'lr': 6.509222625534755e-05, 'samples': 19825152, 'steps': 38720, 'loss/train': 1.6781357526779175} +02/26/2022 03:42:07 - INFO - codeparrot_training - Step 38721: {'lr': 6.50812145098974e-05, 'samples': 19825664, 'steps': 38721, 'loss/train': 1.5842525959014893} +02/26/2022 03:42:10 - INFO - codeparrot_training - Step 38722: {'lr': 6.507020355658061e-05, 'samples': 19826176, 'steps': 38722, 'loss/train': 0.9933396577835083} +02/26/2022 03:42:16 - INFO - codeparrot_training - Step 38723: {'lr': 6.505919339544435e-05, 'samples': 19826688, 'steps': 38723, 'loss/train': 1.615172028541565} +02/26/2022 03:42:19 - INFO - codeparrot_training - Step 38724: {'lr': 6.50481840265357e-05, 'samples': 19827200, 'steps': 38724, 'loss/train': 0.9877386093139648} +02/26/2022 03:42:25 - INFO - codeparrot_training - Step 38725: {'lr': 6.503717544990198e-05, 'samples': 19827712, 'steps': 38725, 'loss/train': 2.0139565467834473} +02/26/2022 03:42:28 - INFO - codeparrot_training - Step 38726: {'lr': 6.502616766559019e-05, 'samples': 19828224, 'steps': 38726, 'loss/train': 1.6699538230895996} +02/26/2022 03:42:34 - INFO - codeparrot_training - Step 38727: {'lr': 6.501516067364771e-05, 'samples': 19828736, 'steps': 38727, 'loss/train': 1.4177770614624023} +02/26/2022 03:42:37 - INFO - codeparrot_training - Step 38728: {'lr': 6.500415447412139e-05, 'samples': 19829248, 'steps': 38728, 'loss/train': 1.5772100687026978} +02/26/2022 03:42:45 - INFO - codeparrot_training - Step 38729: {'lr': 6.499314906705862e-05, 'samples': 19829760, 'steps': 38729, 'loss/train': 1.6493568420410156} +02/26/2022 03:42:48 - INFO - codeparrot_training - Step 38730: {'lr': 6.498214445250636e-05, 'samples': 19830272, 'steps': 38730, 'loss/train': 0.5779489874839783} +02/26/2022 03:42:54 - INFO - codeparrot_training - Step 38731: {'lr': 6.497114063051198e-05, 'samples': 19830784, 'steps': 38731, 'loss/train': 2.2452361583709717} +02/26/2022 03:42:57 - INFO - codeparrot_training - Step 38732: {'lr': 6.496013760112235e-05, 'samples': 19831296, 'steps': 38732, 'loss/train': 1.1919969320297241} +02/26/2022 03:43:03 - INFO - codeparrot_training - Step 38733: {'lr': 6.494913536438483e-05, 'samples': 19831808, 'steps': 38733, 'loss/train': 2.563559055328369} +02/26/2022 03:43:06 - INFO - codeparrot_training - Step 38734: {'lr': 6.493813392034642e-05, 'samples': 19832320, 'steps': 38734, 'loss/train': 1.249554991722107} +02/26/2022 03:43:12 - INFO - codeparrot_training - Step 38735: {'lr': 6.492713326905428e-05, 'samples': 19832832, 'steps': 38735, 'loss/train': 2.5328257083892822} +02/26/2022 03:43:15 - INFO - codeparrot_training - Step 38736: {'lr': 6.491613341055547e-05, 'samples': 19833344, 'steps': 38736, 'loss/train': 1.0427772998809814} +02/26/2022 03:43:21 - INFO - codeparrot_training - Step 38737: {'lr': 6.490513434489726e-05, 'samples': 19833856, 'steps': 38737, 'loss/train': 2.762497901916504} +02/26/2022 03:43:24 - INFO - codeparrot_training - Step 38738: {'lr': 6.489413607212666e-05, 'samples': 19834368, 'steps': 38738, 'loss/train': 3.5796849727630615} +02/26/2022 03:43:31 - INFO - codeparrot_training - Step 38739: {'lr': 6.488313859229073e-05, 'samples': 19834880, 'steps': 38739, 'loss/train': 1.401711344718933} +02/26/2022 03:43:35 - INFO - codeparrot_training - Step 38740: {'lr': 6.487214190543675e-05, 'samples': 19835392, 'steps': 38740, 'loss/train': 0.5993425846099854} +02/26/2022 03:43:40 - INFO - codeparrot_training - Step 38741: {'lr': 6.486114601161172e-05, 'samples': 19835904, 'steps': 38741, 'loss/train': 1.3723808526992798} +02/26/2022 03:43:44 - INFO - codeparrot_training - Step 38742: {'lr': 6.485015091086275e-05, 'samples': 19836416, 'steps': 38742, 'loss/train': 1.9689902067184448} +02/26/2022 03:43:49 - INFO - codeparrot_training - Step 38743: {'lr': 6.483915660323686e-05, 'samples': 19836928, 'steps': 38743, 'loss/train': 0.9907351136207581} +02/26/2022 03:43:53 - INFO - codeparrot_training - Step 38744: {'lr': 6.482816308878129e-05, 'samples': 19837440, 'steps': 38744, 'loss/train': 1.8297984600067139} +02/26/2022 03:43:58 - INFO - codeparrot_training - Step 38745: {'lr': 6.481717036754308e-05, 'samples': 19837952, 'steps': 38745, 'loss/train': 2.0965633392333984} +02/26/2022 03:44:01 - INFO - codeparrot_training - Step 38746: {'lr': 6.480617843956932e-05, 'samples': 19838464, 'steps': 38746, 'loss/train': 1.1998233795166016} +02/26/2022 03:44:07 - INFO - codeparrot_training - Step 38747: {'lr': 6.479518730490702e-05, 'samples': 19838976, 'steps': 38747, 'loss/train': 1.9072761535644531} +02/26/2022 03:44:10 - INFO - codeparrot_training - Step 38748: {'lr': 6.478419696360346e-05, 'samples': 19839488, 'steps': 38748, 'loss/train': 0.18662342429161072} +02/26/2022 03:44:16 - INFO - codeparrot_training - Step 38749: {'lr': 6.477320741570545e-05, 'samples': 19840000, 'steps': 38749, 'loss/train': 0.6318190097808838} +02/26/2022 03:44:19 - INFO - codeparrot_training - Step 38750: {'lr': 6.476221866126028e-05, 'samples': 19840512, 'steps': 38750, 'loss/train': 1.8449482917785645} +02/26/2022 03:44:27 - INFO - codeparrot_training - Step 38751: {'lr': 6.475123070031485e-05, 'samples': 19841024, 'steps': 38751, 'loss/train': 1.4020644426345825} +02/26/2022 03:44:30 - INFO - codeparrot_training - Step 38752: {'lr': 6.474024353291641e-05, 'samples': 19841536, 'steps': 38752, 'loss/train': 1.1708887815475464} +02/26/2022 03:44:36 - INFO - codeparrot_training - Step 38753: {'lr': 6.472925715911195e-05, 'samples': 19842048, 'steps': 38753, 'loss/train': 1.0398430824279785} +02/26/2022 03:44:39 - INFO - codeparrot_training - Step 38754: {'lr': 6.471827157894852e-05, 'samples': 19842560, 'steps': 38754, 'loss/train': 0.9458532333374023} +02/26/2022 03:44:45 - INFO - codeparrot_training - Step 38755: {'lr': 6.470728679247309e-05, 'samples': 19843072, 'steps': 38755, 'loss/train': 1.241991639137268} +02/26/2022 03:44:48 - INFO - codeparrot_training - Step 38756: {'lr': 6.46963027997329e-05, 'samples': 19843584, 'steps': 38756, 'loss/train': 1.2338367700576782} +02/26/2022 03:44:54 - INFO - codeparrot_training - Step 38757: {'lr': 6.468531960077489e-05, 'samples': 19844096, 'steps': 38757, 'loss/train': 2.082691192626953} +02/26/2022 03:44:57 - INFO - codeparrot_training - Step 38758: {'lr': 6.467433719564613e-05, 'samples': 19844608, 'steps': 38758, 'loss/train': 1.4974420070648193} +02/26/2022 03:45:03 - INFO - codeparrot_training - Step 38759: {'lr': 6.466335558439362e-05, 'samples': 19845120, 'steps': 38759, 'loss/train': 2.7987849712371826} +02/26/2022 03:45:06 - INFO - codeparrot_training - Step 38760: {'lr': 6.465237476706449e-05, 'samples': 19845632, 'steps': 38760, 'loss/train': 2.9598820209503174} +02/26/2022 03:45:12 - INFO - codeparrot_training - Step 38761: {'lr': 6.464139474370573e-05, 'samples': 19846144, 'steps': 38761, 'loss/train': 1.4517033100128174} +02/26/2022 03:45:16 - INFO - codeparrot_training - Step 38762: {'lr': 6.463041551436438e-05, 'samples': 19846656, 'steps': 38762, 'loss/train': 0.6874664425849915} +02/26/2022 03:45:21 - INFO - codeparrot_training - Step 38763: {'lr': 6.46194370790874e-05, 'samples': 19847168, 'steps': 38763, 'loss/train': 2.9032158851623535} +02/26/2022 03:45:25 - INFO - codeparrot_training - Step 38764: {'lr': 6.460845943792195e-05, 'samples': 19847680, 'steps': 38764, 'loss/train': 1.7167894840240479} +02/26/2022 03:45:32 - INFO - codeparrot_training - Step 38765: {'lr': 6.459748259091493e-05, 'samples': 19848192, 'steps': 38765, 'loss/train': 1.9749704599380493} +02/26/2022 03:45:35 - INFO - codeparrot_training - Step 38766: {'lr': 6.458650653811357e-05, 'samples': 19848704, 'steps': 38766, 'loss/train': 0.9659585356712341} +02/26/2022 03:45:41 - INFO - codeparrot_training - Step 38767: {'lr': 6.457553127956458e-05, 'samples': 19849216, 'steps': 38767, 'loss/train': 1.6163103580474854} +02/26/2022 03:45:44 - INFO - codeparrot_training - Step 38768: {'lr': 6.456455681531522e-05, 'samples': 19849728, 'steps': 38768, 'loss/train': 2.5894775390625} +02/26/2022 03:45:50 - INFO - codeparrot_training - Step 38769: {'lr': 6.455358314541235e-05, 'samples': 19850240, 'steps': 38769, 'loss/train': 1.1043782234191895} +02/26/2022 03:45:53 - INFO - codeparrot_training - Step 38770: {'lr': 6.454261026990315e-05, 'samples': 19850752, 'steps': 38770, 'loss/train': 1.5259125232696533} +02/26/2022 03:45:59 - INFO - codeparrot_training - Step 38771: {'lr': 6.453163818883443e-05, 'samples': 19851264, 'steps': 38771, 'loss/train': 1.2306572198867798} +02/26/2022 03:46:03 - INFO - codeparrot_training - Step 38772: {'lr': 6.452066690225331e-05, 'samples': 19851776, 'steps': 38772, 'loss/train': 1.5919548273086548} +02/26/2022 03:46:08 - INFO - codeparrot_training - Step 38773: {'lr': 6.450969641020671e-05, 'samples': 19852288, 'steps': 38773, 'loss/train': 2.2383909225463867} +02/26/2022 03:46:12 - INFO - codeparrot_training - Step 38774: {'lr': 6.449872671274179e-05, 'samples': 19852800, 'steps': 38774, 'loss/train': 0.7657734751701355} +02/26/2022 03:46:19 - INFO - codeparrot_training - Step 38775: {'lr': 6.448775780990529e-05, 'samples': 19853312, 'steps': 38775, 'loss/train': 0.9641997218132019} +02/26/2022 03:46:22 - INFO - codeparrot_training - Step 38776: {'lr': 6.44767897017444e-05, 'samples': 19853824, 'steps': 38776, 'loss/train': 2.39081072807312} +02/26/2022 03:46:28 - INFO - codeparrot_training - Step 38777: {'lr': 6.446582238830597e-05, 'samples': 19854336, 'steps': 38777, 'loss/train': 2.127990484237671} +02/26/2022 03:46:31 - INFO - codeparrot_training - Step 38778: {'lr': 6.445485586963709e-05, 'samples': 19854848, 'steps': 38778, 'loss/train': 2.1040003299713135} +02/26/2022 03:46:37 - INFO - codeparrot_training - Step 38779: {'lr': 6.444389014578473e-05, 'samples': 19855360, 'steps': 38779, 'loss/train': 8.964900970458984} +02/26/2022 03:46:40 - INFO - codeparrot_training - Step 38780: {'lr': 6.443292521679578e-05, 'samples': 19855872, 'steps': 38780, 'loss/train': 0.41744714975357056} +02/26/2022 03:46:46 - INFO - codeparrot_training - Step 38781: {'lr': 6.442196108271727e-05, 'samples': 19856384, 'steps': 38781, 'loss/train': 1.8386110067367554} +02/26/2022 03:46:50 - INFO - codeparrot_training - Step 38782: {'lr': 6.44109977435961e-05, 'samples': 19856896, 'steps': 38782, 'loss/train': 1.5573471784591675} +02/26/2022 03:46:55 - INFO - codeparrot_training - Step 38783: {'lr': 6.440003519947935e-05, 'samples': 19857408, 'steps': 38783, 'loss/train': 1.8448214530944824} +02/26/2022 03:46:59 - INFO - codeparrot_training - Step 38784: {'lr': 6.438907345041389e-05, 'samples': 19857920, 'steps': 38784, 'loss/train': 1.2363420724868774} +02/26/2022 03:47:06 - INFO - codeparrot_training - Step 38785: {'lr': 6.437811249644673e-05, 'samples': 19858432, 'steps': 38785, 'loss/train': 1.7648439407348633} +02/26/2022 03:47:09 - INFO - codeparrot_training - Step 38786: {'lr': 6.43671523376247e-05, 'samples': 19858944, 'steps': 38786, 'loss/train': 1.922467589378357} +02/26/2022 03:47:15 - INFO - codeparrot_training - Step 38787: {'lr': 6.435619297399492e-05, 'samples': 19859456, 'steps': 38787, 'loss/train': 0.22969470918178558} +02/26/2022 03:47:18 - INFO - codeparrot_training - Step 38788: {'lr': 6.434523440560427e-05, 'samples': 19859968, 'steps': 38788, 'loss/train': 1.9244303703308105} +02/26/2022 03:47:24 - INFO - codeparrot_training - Step 38789: {'lr': 6.433427663249969e-05, 'samples': 19860480, 'steps': 38789, 'loss/train': 0.6102625131607056} +02/26/2022 03:47:27 - INFO - codeparrot_training - Step 38790: {'lr': 6.432331965472801e-05, 'samples': 19860992, 'steps': 38790, 'loss/train': 1.2116776704788208} +02/26/2022 03:47:33 - INFO - codeparrot_training - Step 38791: {'lr': 6.431236347233638e-05, 'samples': 19861504, 'steps': 38791, 'loss/train': 1.4490152597427368} +02/26/2022 03:47:36 - INFO - codeparrot_training - Step 38792: {'lr': 6.43014080853716e-05, 'samples': 19862016, 'steps': 38792, 'loss/train': 2.329697370529175} +02/26/2022 03:47:42 - INFO - codeparrot_training - Step 38793: {'lr': 6.429045349388063e-05, 'samples': 19862528, 'steps': 38793, 'loss/train': 1.5675824880599976} +02/26/2022 03:47:45 - INFO - codeparrot_training - Step 38794: {'lr': 6.42794996979103e-05, 'samples': 19863040, 'steps': 38794, 'loss/train': 1.5963491201400757} +02/26/2022 03:47:51 - INFO - codeparrot_training - Step 38795: {'lr': 6.426854669750773e-05, 'samples': 19863552, 'steps': 38795, 'loss/train': 2.4156441688537598} +02/26/2022 03:47:54 - INFO - codeparrot_training - Step 38796: {'lr': 6.42575944927197e-05, 'samples': 19864064, 'steps': 38796, 'loss/train': 0.5700355768203735} +02/26/2022 03:48:01 - INFO - codeparrot_training - Step 38797: {'lr': 6.424664308359315e-05, 'samples': 19864576, 'steps': 38797, 'loss/train': 1.6825120449066162} +02/26/2022 03:48:05 - INFO - codeparrot_training - Step 38798: {'lr': 6.423569247017493e-05, 'samples': 19865088, 'steps': 38798, 'loss/train': 1.7825416326522827} +02/26/2022 03:48:10 - INFO - codeparrot_training - Step 38799: {'lr': 6.42247426525121e-05, 'samples': 19865600, 'steps': 38799, 'loss/train': 1.7090396881103516} +02/26/2022 03:48:14 - INFO - codeparrot_training - Step 38800: {'lr': 6.421379363065141e-05, 'samples': 19866112, 'steps': 38800, 'loss/train': 1.4217395782470703} +02/26/2022 03:48:20 - INFO - codeparrot_training - Step 38801: {'lr': 6.420284540463998e-05, 'samples': 19866624, 'steps': 38801, 'loss/train': 1.579977035522461} +02/26/2022 03:48:23 - INFO - codeparrot_training - Step 38802: {'lr': 6.41918979745244e-05, 'samples': 19867136, 'steps': 38802, 'loss/train': 2.0598113536834717} +02/26/2022 03:48:29 - INFO - codeparrot_training - Step 38803: {'lr': 6.418095134035182e-05, 'samples': 19867648, 'steps': 38803, 'loss/train': 1.0589210987091064} +02/26/2022 03:48:32 - INFO - codeparrot_training - Step 38804: {'lr': 6.417000550216896e-05, 'samples': 19868160, 'steps': 38804, 'loss/train': 0.8834738731384277} +02/26/2022 03:48:37 - INFO - codeparrot_training - Step 38805: {'lr': 6.415906046002293e-05, 'samples': 19868672, 'steps': 38805, 'loss/train': 1.4800336360931396} +02/26/2022 03:48:41 - INFO - codeparrot_training - Step 38806: {'lr': 6.414811621396033e-05, 'samples': 19869184, 'steps': 38806, 'loss/train': 1.513084888458252} +02/26/2022 03:48:48 - INFO - codeparrot_training - Step 38807: {'lr': 6.413717276402828e-05, 'samples': 19869696, 'steps': 38807, 'loss/train': 1.9747583866119385} +02/26/2022 03:48:52 - INFO - codeparrot_training - Step 38808: {'lr': 6.412623011027346e-05, 'samples': 19870208, 'steps': 38808, 'loss/train': 0.9450200796127319} +02/26/2022 03:48:57 - INFO - codeparrot_training - Step 38809: {'lr': 6.411528825274301e-05, 'samples': 19870720, 'steps': 38809, 'loss/train': 1.3941991329193115} +02/26/2022 03:49:01 - INFO - codeparrot_training - Step 38810: {'lr': 6.410434719148347e-05, 'samples': 19871232, 'steps': 38810, 'loss/train': 1.262963891029358} +02/26/2022 03:49:06 - INFO - codeparrot_training - Step 38811: {'lr': 6.409340692654198e-05, 'samples': 19871744, 'steps': 38811, 'loss/train': 2.3142611980438232} +02/26/2022 03:49:10 - INFO - codeparrot_training - Step 38812: {'lr': 6.408246745796523e-05, 'samples': 19872256, 'steps': 38812, 'loss/train': 0.08465367555618286} +02/26/2022 03:49:15 - INFO - codeparrot_training - Step 38813: {'lr': 6.407152878580023e-05, 'samples': 19872768, 'steps': 38813, 'loss/train': 2.168731689453125} +02/26/2022 03:49:19 - INFO - codeparrot_training - Step 38814: {'lr': 6.406059091009373e-05, 'samples': 19873280, 'steps': 38814, 'loss/train': 1.2257672548294067} +02/26/2022 03:49:24 - INFO - codeparrot_training - Step 38815: {'lr': 6.404965383089265e-05, 'samples': 19873792, 'steps': 38815, 'loss/train': 0.5894840359687805} +02/26/2022 03:49:28 - INFO - codeparrot_training - Step 38816: {'lr': 6.403871754824372e-05, 'samples': 19874304, 'steps': 38816, 'loss/train': 0.60886150598526} +02/26/2022 03:49:33 - INFO - codeparrot_training - Step 38817: {'lr': 6.402778206219395e-05, 'samples': 19874816, 'steps': 38817, 'loss/train': 2.5555009841918945} +02/26/2022 03:49:37 - INFO - codeparrot_training - Step 38818: {'lr': 6.401684737279009e-05, 'samples': 19875328, 'steps': 38818, 'loss/train': 2.7031188011169434} +02/26/2022 03:49:42 - INFO - codeparrot_training - Step 38819: {'lr': 6.400591348007904e-05, 'samples': 19875840, 'steps': 38819, 'loss/train': 1.8502089977264404} +02/26/2022 03:49:46 - INFO - codeparrot_training - Step 38820: {'lr': 6.399498038410747e-05, 'samples': 19876352, 'steps': 38820, 'loss/train': 1.0791562795639038} +02/26/2022 03:49:51 - INFO - codeparrot_training - Step 38821: {'lr': 6.398404808492245e-05, 'samples': 19876864, 'steps': 38821, 'loss/train': 1.3779817819595337} +02/26/2022 03:49:55 - INFO - codeparrot_training - Step 38822: {'lr': 6.397311658257071e-05, 'samples': 19877376, 'steps': 38822, 'loss/train': 1.263892650604248} +02/26/2022 03:50:02 - INFO - codeparrot_training - Step 38823: {'lr': 6.396218587709904e-05, 'samples': 19877888, 'steps': 38823, 'loss/train': 1.3508083820343018} +02/26/2022 03:50:05 - INFO - codeparrot_training - Step 38824: {'lr': 6.395125596855425e-05, 'samples': 19878400, 'steps': 38824, 'loss/train': 0.11727475374937057} +02/26/2022 03:50:11 - INFO - codeparrot_training - Step 38825: {'lr': 6.394032685698325e-05, 'samples': 19878912, 'steps': 38825, 'loss/train': 1.6723921298980713} +02/26/2022 03:50:14 - INFO - codeparrot_training - Step 38826: {'lr': 6.392939854243282e-05, 'samples': 19879424, 'steps': 38826, 'loss/train': 2.1133294105529785} +02/26/2022 03:50:20 - INFO - codeparrot_training - Step 38827: {'lr': 6.391847102494976e-05, 'samples': 19879936, 'steps': 38827, 'loss/train': 0.07957497984170914} +02/26/2022 03:50:23 - INFO - codeparrot_training - Step 38828: {'lr': 6.390754430458081e-05, 'samples': 19880448, 'steps': 38828, 'loss/train': 2.9327425956726074} +02/26/2022 03:50:29 - INFO - codeparrot_training - Step 38829: {'lr': 6.389661838137292e-05, 'samples': 19880960, 'steps': 38829, 'loss/train': 1.6273353099822998} +02/26/2022 03:50:32 - INFO - codeparrot_training - Step 38830: {'lr': 6.388569325537283e-05, 'samples': 19881472, 'steps': 38830, 'loss/train': 1.8934136629104614} +02/26/2022 03:50:38 - INFO - codeparrot_training - Step 38831: {'lr': 6.387476892662733e-05, 'samples': 19881984, 'steps': 38831, 'loss/train': 1.2015880346298218} +02/26/2022 03:50:41 - INFO - codeparrot_training - Step 38832: {'lr': 6.38638453951832e-05, 'samples': 19882496, 'steps': 38832, 'loss/train': 1.5802578926086426} +02/26/2022 03:50:48 - INFO - codeparrot_training - Step 38833: {'lr': 6.385292266108719e-05, 'samples': 19883008, 'steps': 38833, 'loss/train': 1.0243046283721924} +02/26/2022 03:50:52 - INFO - codeparrot_training - Step 38834: {'lr': 6.384200072438623e-05, 'samples': 19883520, 'steps': 38834, 'loss/train': 1.5294610261917114} +02/26/2022 03:50:57 - INFO - codeparrot_training - Step 38835: {'lr': 6.383107958512696e-05, 'samples': 19884032, 'steps': 38835, 'loss/train': 1.7044965028762817} +02/26/2022 03:51:01 - INFO - codeparrot_training - Step 38836: {'lr': 6.382015924335636e-05, 'samples': 19884544, 'steps': 38836, 'loss/train': 1.6806957721710205} +02/26/2022 03:51:06 - INFO - codeparrot_training - Step 38837: {'lr': 6.380923969912094e-05, 'samples': 19885056, 'steps': 38837, 'loss/train': 2.737531900405884} +02/26/2022 03:51:10 - INFO - codeparrot_training - Step 38838: {'lr': 6.379832095246767e-05, 'samples': 19885568, 'steps': 38838, 'loss/train': 1.864533543586731} +02/26/2022 03:51:15 - INFO - codeparrot_training - Step 38839: {'lr': 6.378740300344324e-05, 'samples': 19886080, 'steps': 38839, 'loss/train': 1.286806583404541} +02/26/2022 03:51:19 - INFO - codeparrot_training - Step 38840: {'lr': 6.377648585209455e-05, 'samples': 19886592, 'steps': 38840, 'loss/train': 0.8436279892921448} +02/26/2022 03:51:24 - INFO - codeparrot_training - Step 38841: {'lr': 6.376556949846813e-05, 'samples': 19887104, 'steps': 38841, 'loss/train': 2.421673536300659} +02/26/2022 03:51:28 - INFO - codeparrot_training - Step 38842: {'lr': 6.375465394261096e-05, 'samples': 19887616, 'steps': 38842, 'loss/train': 1.671796441078186} +02/26/2022 03:51:34 - INFO - codeparrot_training - Step 38843: {'lr': 6.374373918456964e-05, 'samples': 19888128, 'steps': 38843, 'loss/train': 2.339667558670044} +02/26/2022 03:51:38 - INFO - codeparrot_training - Step 38844: {'lr': 6.37328252243911e-05, 'samples': 19888640, 'steps': 38844, 'loss/train': 2.1658670902252197} +02/26/2022 03:51:43 - INFO - codeparrot_training - Step 38845: {'lr': 6.372191206212188e-05, 'samples': 19889152, 'steps': 38845, 'loss/train': 2.45666241645813} +02/26/2022 03:51:48 - INFO - codeparrot_training - Step 38846: {'lr': 6.371099969780891e-05, 'samples': 19889664, 'steps': 38846, 'loss/train': 2.5400333404541016} +02/26/2022 03:51:52 - INFO - codeparrot_training - Step 38847: {'lr': 6.37000881314988e-05, 'samples': 19890176, 'steps': 38847, 'loss/train': 2.4450693130493164} +02/26/2022 03:51:57 - INFO - codeparrot_training - Step 38848: {'lr': 6.368917736323843e-05, 'samples': 19890688, 'steps': 38848, 'loss/train': 1.0211149454116821} +02/26/2022 03:52:01 - INFO - codeparrot_training - Step 38849: {'lr': 6.367826739307445e-05, 'samples': 19891200, 'steps': 38849, 'loss/train': 1.6614383459091187} +02/26/2022 03:52:06 - INFO - codeparrot_training - Step 38850: {'lr': 6.36673582210536e-05, 'samples': 19891712, 'steps': 38850, 'loss/train': 1.6359202861785889} +02/26/2022 03:52:10 - INFO - codeparrot_training - Step 38851: {'lr': 6.365644984722254e-05, 'samples': 19892224, 'steps': 38851, 'loss/train': 1.525418996810913} +02/26/2022 03:52:15 - INFO - codeparrot_training - Step 38852: {'lr': 6.364554227162819e-05, 'samples': 19892736, 'steps': 38852, 'loss/train': 2.3382010459899902} +02/26/2022 03:52:19 - INFO - codeparrot_training - Step 38853: {'lr': 6.363463549431714e-05, 'samples': 19893248, 'steps': 38853, 'loss/train': 1.3372362852096558} +02/26/2022 03:52:25 - INFO - codeparrot_training - Step 38854: {'lr': 6.362372951533613e-05, 'samples': 19893760, 'steps': 38854, 'loss/train': 1.1186985969543457} +02/26/2022 03:52:28 - INFO - codeparrot_training - Step 38855: {'lr': 6.361282433473181e-05, 'samples': 19894272, 'steps': 38855, 'loss/train': 1.403040885925293} +02/26/2022 03:52:33 - INFO - codeparrot_training - Step 38856: {'lr': 6.360191995255104e-05, 'samples': 19894784, 'steps': 38856, 'loss/train': 1.9209054708480835} +02/26/2022 03:52:37 - INFO - codeparrot_training - Step 38857: {'lr': 6.359101636884045e-05, 'samples': 19895296, 'steps': 38857, 'loss/train': 2.063040018081665} +02/26/2022 03:52:43 - INFO - codeparrot_training - Step 38858: {'lr': 6.358011358364676e-05, 'samples': 19895808, 'steps': 38858, 'loss/train': 1.859063982963562} +02/26/2022 03:52:47 - INFO - codeparrot_training - Step 38859: {'lr': 6.356921159701662e-05, 'samples': 19896320, 'steps': 38859, 'loss/train': 1.6190849542617798} +02/26/2022 03:52:52 - INFO - codeparrot_training - Step 38860: {'lr': 6.355831040899682e-05, 'samples': 19896832, 'steps': 38860, 'loss/train': 1.7135318517684937} +02/26/2022 03:52:55 - INFO - codeparrot_training - Step 38861: {'lr': 6.354741001963396e-05, 'samples': 19897344, 'steps': 38861, 'loss/train': 0.18433037400245667} +02/26/2022 03:53:01 - INFO - codeparrot_training - Step 38862: {'lr': 6.353651042897493e-05, 'samples': 19897856, 'steps': 38862, 'loss/train': 1.3983616828918457} +02/26/2022 03:53:05 - INFO - codeparrot_training - Step 38863: {'lr': 6.352561163706613e-05, 'samples': 19898368, 'steps': 38863, 'loss/train': 1.2397453784942627} +02/26/2022 03:53:10 - INFO - codeparrot_training - Step 38864: {'lr': 6.351471364395448e-05, 'samples': 19898880, 'steps': 38864, 'loss/train': 1.0877991914749146} +02/26/2022 03:53:14 - INFO - codeparrot_training - Step 38865: {'lr': 6.350381644968659e-05, 'samples': 19899392, 'steps': 38865, 'loss/train': 1.620319128036499} +02/26/2022 03:53:19 - INFO - codeparrot_training - Step 38866: {'lr': 6.34929200543091e-05, 'samples': 19899904, 'steps': 38866, 'loss/train': 2.918816089630127} +02/26/2022 03:53:23 - INFO - codeparrot_training - Step 38867: {'lr': 6.348202445786866e-05, 'samples': 19900416, 'steps': 38867, 'loss/train': 1.7316852807998657} +02/26/2022 03:53:29 - INFO - codeparrot_training - Step 38868: {'lr': 6.347112966041208e-05, 'samples': 19900928, 'steps': 38868, 'loss/train': 0.8470566868782043} +02/26/2022 03:53:32 - INFO - codeparrot_training - Step 38869: {'lr': 6.346023566198594e-05, 'samples': 19901440, 'steps': 38869, 'loss/train': 1.8697400093078613} +02/26/2022 03:53:38 - INFO - codeparrot_training - Step 38870: {'lr': 6.344934246263692e-05, 'samples': 19901952, 'steps': 38870, 'loss/train': 2.8419699668884277} +02/26/2022 03:53:41 - INFO - codeparrot_training - Step 38871: {'lr': 6.343845006241161e-05, 'samples': 19902464, 'steps': 38871, 'loss/train': 3.0880727767944336} +02/26/2022 03:53:47 - INFO - codeparrot_training - Step 38872: {'lr': 6.342755846135684e-05, 'samples': 19902976, 'steps': 38872, 'loss/train': 1.8982683420181274} +02/26/2022 03:53:50 - INFO - codeparrot_training - Step 38873: {'lr': 6.341666765951912e-05, 'samples': 19903488, 'steps': 38873, 'loss/train': 1.6093734502792358} +02/26/2022 03:53:56 - INFO - codeparrot_training - Step 38874: {'lr': 6.340577765694511e-05, 'samples': 19904000, 'steps': 38874, 'loss/train': 1.942063331604004} +02/26/2022 03:53:59 - INFO - codeparrot_training - Step 38875: {'lr': 6.339488845368155e-05, 'samples': 19904512, 'steps': 38875, 'loss/train': 1.6383899450302124} +02/26/2022 03:54:05 - INFO - codeparrot_training - Step 38876: {'lr': 6.338400004977505e-05, 'samples': 19905024, 'steps': 38876, 'loss/train': 1.677234411239624} +02/26/2022 03:54:08 - INFO - codeparrot_training - Step 38877: {'lr': 6.337311244527221e-05, 'samples': 19905536, 'steps': 38877, 'loss/train': 1.2173211574554443} +02/26/2022 03:54:15 - INFO - codeparrot_training - Step 38878: {'lr': 6.336222564021965e-05, 'samples': 19906048, 'steps': 38878, 'loss/train': 1.966973066329956} +02/26/2022 03:54:18 - INFO - codeparrot_training - Step 38879: {'lr': 6.33513396346642e-05, 'samples': 19906560, 'steps': 38879, 'loss/train': 1.4125511646270752} +02/26/2022 03:54:24 - INFO - codeparrot_training - Step 38880: {'lr': 6.334045442865219e-05, 'samples': 19907072, 'steps': 38880, 'loss/train': 1.6864938735961914} +02/26/2022 03:54:27 - INFO - codeparrot_training - Step 38881: {'lr': 6.332957002223047e-05, 'samples': 19907584, 'steps': 38881, 'loss/train': 2.026339054107666} +02/26/2022 03:54:33 - INFO - codeparrot_training - Step 38882: {'lr': 6.331868641544553e-05, 'samples': 19908096, 'steps': 38882, 'loss/train': 2.478119373321533} +02/26/2022 03:54:37 - INFO - codeparrot_training - Step 38883: {'lr': 6.330780360834418e-05, 'samples': 19908608, 'steps': 38883, 'loss/train': 1.8960620164871216} +02/26/2022 03:54:42 - INFO - codeparrot_training - Step 38884: {'lr': 6.329692160097281e-05, 'samples': 19909120, 'steps': 38884, 'loss/train': 1.472038984298706} +02/26/2022 03:54:46 - INFO - codeparrot_training - Step 38885: {'lr': 6.328604039337818e-05, 'samples': 19909632, 'steps': 38885, 'loss/train': 1.2072947025299072} +02/26/2022 03:54:51 - INFO - codeparrot_training - Step 38886: {'lr': 6.327515998560681e-05, 'samples': 19910144, 'steps': 38886, 'loss/train': 2.57529878616333} +02/26/2022 03:54:55 - INFO - codeparrot_training - Step 38887: {'lr': 6.326428037770545e-05, 'samples': 19910656, 'steps': 38887, 'loss/train': 2.057734251022339} +02/26/2022 03:55:01 - INFO - codeparrot_training - Step 38888: {'lr': 6.325340156972059e-05, 'samples': 19911168, 'steps': 38888, 'loss/train': 1.392457365989685} +02/26/2022 03:55:04 - INFO - codeparrot_training - Step 38889: {'lr': 6.324252356169888e-05, 'samples': 19911680, 'steps': 38889, 'loss/train': 1.569298505783081} +02/26/2022 03:55:10 - INFO - codeparrot_training - Step 38890: {'lr': 6.32316463536868e-05, 'samples': 19912192, 'steps': 38890, 'loss/train': 1.3328437805175781} +02/26/2022 03:55:13 - INFO - codeparrot_training - Step 38891: {'lr': 6.322076994573115e-05, 'samples': 19912704, 'steps': 38891, 'loss/train': 1.5142974853515625} +02/26/2022 03:55:19 - INFO - codeparrot_training - Step 38892: {'lr': 6.320989433787838e-05, 'samples': 19913216, 'steps': 38892, 'loss/train': 1.4834496974945068} +02/26/2022 03:55:22 - INFO - codeparrot_training - Step 38893: {'lr': 6.319901953017515e-05, 'samples': 19913728, 'steps': 38893, 'loss/train': 1.5543599128723145} +02/26/2022 03:55:28 - INFO - codeparrot_training - Step 38894: {'lr': 6.318814552266788e-05, 'samples': 19914240, 'steps': 38894, 'loss/train': 1.092104196548462} +02/26/2022 03:55:33 - INFO - codeparrot_training - Step 38895: {'lr': 6.317727231540338e-05, 'samples': 19914752, 'steps': 38895, 'loss/train': 1.6777210235595703} +02/26/2022 03:55:37 - INFO - codeparrot_training - Step 38896: {'lr': 6.316639990842804e-05, 'samples': 19915264, 'steps': 38896, 'loss/train': 2.6742794513702393} +02/26/2022 03:55:42 - INFO - codeparrot_training - Step 38897: {'lr': 6.315552830178867e-05, 'samples': 19915776, 'steps': 38897, 'loss/train': 1.963529109954834} +02/26/2022 03:55:46 - INFO - codeparrot_training - Step 38898: {'lr': 6.314465749553152e-05, 'samples': 19916288, 'steps': 38898, 'loss/train': 2.05869722366333} +02/26/2022 03:55:51 - INFO - codeparrot_training - Step 38899: {'lr': 6.313378748970344e-05, 'samples': 19916800, 'steps': 38899, 'loss/train': 0.3517754077911377} +02/26/2022 03:55:55 - INFO - codeparrot_training - Step 38900: {'lr': 6.312291828435076e-05, 'samples': 19917312, 'steps': 38900, 'loss/train': 2.547058343887329} +02/26/2022 03:56:01 - INFO - codeparrot_training - Step 38901: {'lr': 6.311204987952033e-05, 'samples': 19917824, 'steps': 38901, 'loss/train': 2.3607535362243652} +02/26/2022 03:56:04 - INFO - codeparrot_training - Step 38902: {'lr': 6.310118227525838e-05, 'samples': 19918336, 'steps': 38902, 'loss/train': 2.202324628829956} +02/26/2022 03:56:08 - INFO - codeparrot_training - Step 38903: {'lr': 6.30903154716117e-05, 'samples': 19918848, 'steps': 38903, 'loss/train': 2.181614875793457} +02/26/2022 03:56:14 - INFO - codeparrot_training - Step 38904: {'lr': 6.307944946862668e-05, 'samples': 19919360, 'steps': 38904, 'loss/train': 1.1483254432678223} +02/26/2022 03:56:20 - INFO - codeparrot_training - Step 38905: {'lr': 6.306858426635006e-05, 'samples': 19919872, 'steps': 38905, 'loss/train': 3.3665950298309326} +02/26/2022 03:56:23 - INFO - codeparrot_training - Step 38906: {'lr': 6.305771986482816e-05, 'samples': 19920384, 'steps': 38906, 'loss/train': 1.4355310201644897} +02/26/2022 03:56:29 - INFO - codeparrot_training - Step 38907: {'lr': 6.304685626410769e-05, 'samples': 19920896, 'steps': 38907, 'loss/train': 1.51449453830719} +02/26/2022 03:56:33 - INFO - codeparrot_training - Step 38908: {'lr': 6.303599346423505e-05, 'samples': 19921408, 'steps': 38908, 'loss/train': 3.7690417766571045} +02/26/2022 03:56:36 - INFO - codeparrot_training - Step 38909: {'lr': 6.302513146525693e-05, 'samples': 19921920, 'steps': 38909, 'loss/train': 1.0974311828613281} +02/26/2022 03:56:42 - INFO - codeparrot_training - Step 38910: {'lr': 6.301427026721975e-05, 'samples': 19922432, 'steps': 38910, 'loss/train': 1.3523627519607544} +02/26/2022 03:56:45 - INFO - codeparrot_training - Step 38911: {'lr': 6.300340987017009e-05, 'samples': 19922944, 'steps': 38911, 'loss/train': 1.7942637205123901} +02/26/2022 03:56:51 - INFO - codeparrot_training - Step 38912: {'lr': 6.299255027415443e-05, 'samples': 19923456, 'steps': 38912, 'loss/train': 7.154319763183594} +02/26/2022 03:56:54 - INFO - codeparrot_training - Step 38913: {'lr': 6.298169147921923e-05, 'samples': 19923968, 'steps': 38913, 'loss/train': 1.2122001647949219} +02/26/2022 03:57:01 - INFO - codeparrot_training - Step 38914: {'lr': 6.297083348541113e-05, 'samples': 19924480, 'steps': 38914, 'loss/train': 1.4609757661819458} +02/26/2022 03:57:04 - INFO - codeparrot_training - Step 38915: {'lr': 6.295997629277661e-05, 'samples': 19924992, 'steps': 38915, 'loss/train': 2.0608909130096436} +02/26/2022 03:57:10 - INFO - codeparrot_training - Step 38916: {'lr': 6.294911990136218e-05, 'samples': 19925504, 'steps': 38916, 'loss/train': 2.5247342586517334} +02/26/2022 03:57:13 - INFO - codeparrot_training - Step 38917: {'lr': 6.293826431121422e-05, 'samples': 19926016, 'steps': 38917, 'loss/train': 2.2232210636138916} +02/26/2022 03:57:19 - INFO - codeparrot_training - Step 38918: {'lr': 6.292740952237943e-05, 'samples': 19926528, 'steps': 38918, 'loss/train': 1.9103516340255737} +02/26/2022 03:57:24 - INFO - codeparrot_training - Step 38919: {'lr': 6.291655553490422e-05, 'samples': 19927040, 'steps': 38919, 'loss/train': 2.00417423248291} +02/26/2022 03:57:28 - INFO - codeparrot_training - Step 38920: {'lr': 6.290570234883505e-05, 'samples': 19927552, 'steps': 38920, 'loss/train': 0.45651569962501526} +02/26/2022 03:57:33 - INFO - codeparrot_training - Step 38921: {'lr': 6.28948499642184e-05, 'samples': 19928064, 'steps': 38921, 'loss/train': 2.1316864490509033} +02/26/2022 03:57:37 - INFO - codeparrot_training - Step 38922: {'lr': 6.288399838110087e-05, 'samples': 19928576, 'steps': 38922, 'loss/train': 1.490264892578125} +02/26/2022 03:57:43 - INFO - codeparrot_training - Step 38923: {'lr': 6.287314759952886e-05, 'samples': 19929088, 'steps': 38923, 'loss/train': 3.206657886505127} +02/26/2022 03:57:46 - INFO - codeparrot_training - Step 38924: {'lr': 6.286229761954887e-05, 'samples': 19929600, 'steps': 38924, 'loss/train': 1.715929627418518} +02/26/2022 03:57:52 - INFO - codeparrot_training - Step 38925: {'lr': 6.28514484412073e-05, 'samples': 19930112, 'steps': 38925, 'loss/train': 1.8856327533721924} +02/26/2022 03:57:55 - INFO - codeparrot_training - Step 38926: {'lr': 6.284060006455078e-05, 'samples': 19930624, 'steps': 38926, 'loss/train': 1.176323413848877} +02/26/2022 03:58:01 - INFO - codeparrot_training - Step 38927: {'lr': 6.28297524896257e-05, 'samples': 19931136, 'steps': 38927, 'loss/train': 1.6909675598144531} +02/26/2022 03:58:04 - INFO - codeparrot_training - Step 38928: {'lr': 6.281890571647852e-05, 'samples': 19931648, 'steps': 38928, 'loss/train': 2.348320960998535} +02/26/2022 03:58:10 - INFO - codeparrot_training - Step 38929: {'lr': 6.280805974515563e-05, 'samples': 19932160, 'steps': 38929, 'loss/train': 1.5610156059265137} +02/26/2022 03:58:13 - INFO - codeparrot_training - Step 38930: {'lr': 6.279721457570367e-05, 'samples': 19932672, 'steps': 38930, 'loss/train': 2.2120895385742188} +02/26/2022 03:58:19 - INFO - codeparrot_training - Step 38931: {'lr': 6.278637020816896e-05, 'samples': 19933184, 'steps': 38931, 'loss/train': 1.5010899305343628} +02/26/2022 03:58:22 - INFO - codeparrot_training - Step 38932: {'lr': 6.277552664259803e-05, 'samples': 19933696, 'steps': 38932, 'loss/train': 1.4336180686950684} +02/26/2022 03:58:29 - INFO - codeparrot_training - Step 38933: {'lr': 6.276468387903719e-05, 'samples': 19934208, 'steps': 38933, 'loss/train': 2.6342320442199707} +02/26/2022 03:58:32 - INFO - codeparrot_training - Step 38934: {'lr': 6.275384191753311e-05, 'samples': 19934720, 'steps': 38934, 'loss/train': 1.445743203163147} +02/26/2022 03:58:37 - INFO - codeparrot_training - Step 38935: {'lr': 6.274300075813199e-05, 'samples': 19935232, 'steps': 38935, 'loss/train': 1.3488141298294067} +02/26/2022 03:58:41 - INFO - codeparrot_training - Step 38936: {'lr': 6.273216040088056e-05, 'samples': 19935744, 'steps': 38936, 'loss/train': 1.3567650318145752} +02/26/2022 03:58:46 - INFO - codeparrot_training - Step 38937: {'lr': 6.272132084582496e-05, 'samples': 19936256, 'steps': 38937, 'loss/train': 1.5761371850967407} +02/26/2022 03:58:50 - INFO - codeparrot_training - Step 38938: {'lr': 6.27104820930118e-05, 'samples': 19936768, 'steps': 38938, 'loss/train': 2.4720654487609863} +02/26/2022 03:58:56 - INFO - codeparrot_training - Step 38939: {'lr': 6.269964414248741e-05, 'samples': 19937280, 'steps': 38939, 'loss/train': 1.7867281436920166} +02/26/2022 03:59:00 - INFO - codeparrot_training - Step 38940: {'lr': 6.26888069942984e-05, 'samples': 19937792, 'steps': 38940, 'loss/train': 1.887107253074646} +02/26/2022 03:59:03 - INFO - codeparrot_training - Step 38941: {'lr': 6.267797064849093e-05, 'samples': 19938304, 'steps': 38941, 'loss/train': 2.723895788192749} +02/26/2022 03:59:09 - INFO - codeparrot_training - Step 38942: {'lr': 6.266713510511163e-05, 'samples': 19938816, 'steps': 38942, 'loss/train': 1.1761444807052612} +02/26/2022 03:59:12 - INFO - codeparrot_training - Step 38943: {'lr': 6.265630036420675e-05, 'samples': 19939328, 'steps': 38943, 'loss/train': 2.514967918395996} +02/26/2022 03:59:18 - INFO - codeparrot_training - Step 38944: {'lr': 6.264546642582289e-05, 'samples': 19939840, 'steps': 38944, 'loss/train': 1.5851999521255493} +02/26/2022 03:59:21 - INFO - codeparrot_training - Step 38945: {'lr': 6.263463329000632e-05, 'samples': 19940352, 'steps': 38945, 'loss/train': 2.5215721130371094} +02/26/2022 03:59:27 - INFO - codeparrot_training - Step 38946: {'lr': 6.26238009568035e-05, 'samples': 19940864, 'steps': 38946, 'loss/train': 2.454012632369995} +02/26/2022 03:59:31 - INFO - codeparrot_training - Step 38947: {'lr': 6.261296942626077e-05, 'samples': 19941376, 'steps': 38947, 'loss/train': 1.1757171154022217} +02/26/2022 03:59:36 - INFO - codeparrot_training - Step 38948: {'lr': 6.260213869842462e-05, 'samples': 19941888, 'steps': 38948, 'loss/train': 1.0435585975646973} +02/26/2022 03:59:40 - INFO - codeparrot_training - Step 38949: {'lr': 6.259130877334143e-05, 'samples': 19942400, 'steps': 38949, 'loss/train': 1.7368721961975098} +02/26/2022 03:59:45 - INFO - codeparrot_training - Step 38950: {'lr': 6.258047965105753e-05, 'samples': 19942912, 'steps': 38950, 'loss/train': 1.3974124193191528} +02/26/2022 03:59:49 - INFO - codeparrot_training - Step 38951: {'lr': 6.25696513316193e-05, 'samples': 19943424, 'steps': 38951, 'loss/train': 1.3515630960464478} +02/26/2022 03:59:55 - INFO - codeparrot_training - Step 38952: {'lr': 6.255882381507324e-05, 'samples': 19943936, 'steps': 38952, 'loss/train': 1.0100599527359009} +02/26/2022 03:59:58 - INFO - codeparrot_training - Step 38953: {'lr': 6.254799710146564e-05, 'samples': 19944448, 'steps': 38953, 'loss/train': 2.2196245193481445} +02/26/2022 04:00:04 - INFO - codeparrot_training - Step 38954: {'lr': 6.25371711908429e-05, 'samples': 19944960, 'steps': 38954, 'loss/train': 1.175177812576294} +02/26/2022 04:00:07 - INFO - codeparrot_training - Step 38955: {'lr': 6.252634608325134e-05, 'samples': 19945472, 'steps': 38955, 'loss/train': 1.796678066253662} +02/26/2022 04:00:11 - INFO - codeparrot_training - Step 38956: {'lr': 6.251552177873742e-05, 'samples': 19945984, 'steps': 38956, 'loss/train': 2.1559677124023438} +02/26/2022 04:00:16 - INFO - codeparrot_training - Step 38957: {'lr': 6.250469827734751e-05, 'samples': 19946496, 'steps': 38957, 'loss/train': 1.7717361450195312} +02/26/2022 04:00:20 - INFO - codeparrot_training - Step 38958: {'lr': 6.249387557912792e-05, 'samples': 19947008, 'steps': 38958, 'loss/train': 2.8185548782348633} +02/26/2022 04:00:25 - INFO - codeparrot_training - Step 38959: {'lr': 6.248305368412502e-05, 'samples': 19947520, 'steps': 38959, 'loss/train': 1.7751221656799316} +02/26/2022 04:00:29 - INFO - codeparrot_training - Step 38960: {'lr': 6.24722325923851e-05, 'samples': 19948032, 'steps': 38960, 'loss/train': 1.2177268266677856} +02/26/2022 04:00:36 - INFO - codeparrot_training - Step 38961: {'lr': 6.246141230395469e-05, 'samples': 19948544, 'steps': 38961, 'loss/train': 2.254542827606201} +02/26/2022 04:00:39 - INFO - codeparrot_training - Step 38962: {'lr': 6.245059281888002e-05, 'samples': 19949056, 'steps': 38962, 'loss/train': 1.8975316286087036} +02/26/2022 04:00:45 - INFO - codeparrot_training - Step 38963: {'lr': 6.243977413720744e-05, 'samples': 19949568, 'steps': 38963, 'loss/train': 1.8330730199813843} +02/26/2022 04:00:48 - INFO - codeparrot_training - Step 38964: {'lr': 6.242895625898326e-05, 'samples': 19950080, 'steps': 38964, 'loss/train': 1.3657501935958862} +02/26/2022 04:00:54 - INFO - codeparrot_training - Step 38965: {'lr': 6.241813918425396e-05, 'samples': 19950592, 'steps': 38965, 'loss/train': 1.5496937036514282} +02/26/2022 04:00:57 - INFO - codeparrot_training - Step 38966: {'lr': 6.240732291306575e-05, 'samples': 19951104, 'steps': 38966, 'loss/train': 1.0134525299072266} +02/26/2022 04:01:03 - INFO - codeparrot_training - Step 38967: {'lr': 6.239650744546502e-05, 'samples': 19951616, 'steps': 38967, 'loss/train': 2.5222418308258057} +02/26/2022 04:01:06 - INFO - codeparrot_training - Step 38968: {'lr': 6.2385692781498e-05, 'samples': 19952128, 'steps': 38968, 'loss/train': 1.680293321609497} +02/26/2022 04:01:12 - INFO - codeparrot_training - Step 38969: {'lr': 6.237487892121118e-05, 'samples': 19952640, 'steps': 38969, 'loss/train': 0.2331373542547226} +02/26/2022 04:01:15 - INFO - codeparrot_training - Step 38970: {'lr': 6.236406586465074e-05, 'samples': 19953152, 'steps': 38970, 'loss/train': 0.7589865922927856} +02/26/2022 04:01:22 - INFO - codeparrot_training - Step 38971: {'lr': 6.235325361186316e-05, 'samples': 19953664, 'steps': 38971, 'loss/train': 1.479731798171997} +02/26/2022 04:01:27 - INFO - codeparrot_training - Step 38972: {'lr': 6.234244216289456e-05, 'samples': 19954176, 'steps': 38972, 'loss/train': 1.619925618171692} +02/26/2022 04:01:31 - INFO - codeparrot_training - Step 38973: {'lr': 6.233163151779143e-05, 'samples': 19954688, 'steps': 38973, 'loss/train': 1.6573783159255981} +02/26/2022 04:01:34 - INFO - codeparrot_training - Step 38974: {'lr': 6.232082167659989e-05, 'samples': 19955200, 'steps': 38974, 'loss/train': 1.2507054805755615} +02/26/2022 04:01:40 - INFO - codeparrot_training - Step 38975: {'lr': 6.23100126393665e-05, 'samples': 19955712, 'steps': 38975, 'loss/train': 0.04629538953304291} +02/26/2022 04:01:45 - INFO - codeparrot_training - Step 38976: {'lr': 6.229920440613729e-05, 'samples': 19956224, 'steps': 38976, 'loss/train': 0.3713911771774292} +02/26/2022 04:01:49 - INFO - codeparrot_training - Step 38977: {'lr': 6.228839697695876e-05, 'samples': 19956736, 'steps': 38977, 'loss/train': 2.4896554946899414} +02/26/2022 04:01:54 - INFO - codeparrot_training - Step 38978: {'lr': 6.227759035187706e-05, 'samples': 19957248, 'steps': 38978, 'loss/train': 2.1101582050323486} +02/26/2022 04:01:58 - INFO - codeparrot_training - Step 38979: {'lr': 6.226678453093867e-05, 'samples': 19957760, 'steps': 38979, 'loss/train': 2.0928194522857666} +02/26/2022 04:02:03 - INFO - codeparrot_training - Step 38980: {'lr': 6.225597951418965e-05, 'samples': 19958272, 'steps': 38980, 'loss/train': 2.3729329109191895} +02/26/2022 04:02:07 - INFO - codeparrot_training - Step 38981: {'lr': 6.224517530167645e-05, 'samples': 19958784, 'steps': 38981, 'loss/train': 1.4953956604003906} +02/26/2022 04:02:13 - INFO - codeparrot_training - Step 38982: {'lr': 6.223437189344525e-05, 'samples': 19959296, 'steps': 38982, 'loss/train': 1.1345945596694946} +02/26/2022 04:02:16 - INFO - codeparrot_training - Step 38983: {'lr': 6.222356928954243e-05, 'samples': 19959808, 'steps': 38983, 'loss/train': 2.1563832759857178} +02/26/2022 04:02:22 - INFO - codeparrot_training - Step 38984: {'lr': 6.221276749001423e-05, 'samples': 19960320, 'steps': 38984, 'loss/train': 1.7778867483139038} +02/26/2022 04:02:25 - INFO - codeparrot_training - Step 38985: {'lr': 6.220196649490689e-05, 'samples': 19960832, 'steps': 38985, 'loss/train': 1.9760615825653076} +02/26/2022 04:02:31 - INFO - codeparrot_training - Step 38986: {'lr': 6.219116630426664e-05, 'samples': 19961344, 'steps': 38986, 'loss/train': 2.253070831298828} +02/26/2022 04:02:34 - INFO - codeparrot_training - Step 38987: {'lr': 6.218036691813986e-05, 'samples': 19961856, 'steps': 38987, 'loss/train': 1.7850995063781738} +02/26/2022 04:02:40 - INFO - codeparrot_training - Step 38988: {'lr': 6.216956833657276e-05, 'samples': 19962368, 'steps': 38988, 'loss/train': 2.5457990169525146} +02/26/2022 04:02:43 - INFO - codeparrot_training - Step 38989: {'lr': 6.215877055961156e-05, 'samples': 19962880, 'steps': 38989, 'loss/train': 0.038928911089897156} +02/26/2022 04:02:49 - INFO - codeparrot_training - Step 38990: {'lr': 6.214797358730248e-05, 'samples': 19963392, 'steps': 38990, 'loss/train': 2.327338457107544} +02/26/2022 04:02:52 - INFO - codeparrot_training - Step 38991: {'lr': 6.213717741969191e-05, 'samples': 19963904, 'steps': 38991, 'loss/train': 1.9290884733200073} +02/26/2022 04:02:58 - INFO - codeparrot_training - Step 38992: {'lr': 6.2126382056826e-05, 'samples': 19964416, 'steps': 38992, 'loss/train': 0.7063797116279602} +02/26/2022 04:03:02 - INFO - codeparrot_training - Step 38993: {'lr': 6.211558749875105e-05, 'samples': 19964928, 'steps': 38993, 'loss/train': 1.392071008682251} +02/26/2022 04:03:07 - INFO - codeparrot_training - Step 38994: {'lr': 6.210479374551314e-05, 'samples': 19965440, 'steps': 38994, 'loss/train': 1.7028536796569824} +02/26/2022 04:03:11 - INFO - codeparrot_training - Step 38995: {'lr': 6.209400079715874e-05, 'samples': 19965952, 'steps': 38995, 'loss/train': 1.382046103477478} +02/26/2022 04:03:16 - INFO - codeparrot_training - Step 38996: {'lr': 6.208320865373396e-05, 'samples': 19966464, 'steps': 38996, 'loss/train': 1.1038291454315186} +02/26/2022 04:03:20 - INFO - codeparrot_training - Step 38997: {'lr': 6.207241731528507e-05, 'samples': 19966976, 'steps': 38997, 'loss/train': 1.7524518966674805} +02/26/2022 04:03:25 - INFO - codeparrot_training - Step 38998: {'lr': 6.206162678185817e-05, 'samples': 19967488, 'steps': 38998, 'loss/train': 1.4853224754333496} +02/26/2022 04:03:29 - INFO - codeparrot_training - Step 38999: {'lr': 6.205083705349965e-05, 'samples': 19968000, 'steps': 38999, 'loss/train': 1.7108924388885498} +02/26/2022 04:03:29 - INFO - codeparrot_training - Evaluating and saving model checkpoint