diff --git "a/log/debug_0.log" "b/log/debug_0.log" --- "a/log/debug_0.log" +++ "b/log/debug_0.log" @@ -45392,3 +45392,7487 @@ Use FP16 precision: False 03/05/2022 00:42:30 - INFO - codeparrot_training - Skipping example with length 520 (seq_length=1024) 03/05/2022 00:42:35 - INFO - codeparrot_training - Step 29999: {'lr': 0.0004571303839073271, 'samples': 15360000, 'steps': 29999, 'loss/train': 1.5493794679641724} 03/05/2022 00:42:35 - INFO - codeparrot_training - Evaluating and saving model checkpoint +03/05/2022 00:42:49 - WARNING - huggingface_hub.repository - Several commits (6) will be pushed upstream. +03/05/2022 00:42:49 - WARNING - huggingface_hub.repository - The progress bars may be unreliable. +03/05/2022 00:43:16 - WARNING - huggingface_hub.repository - To https://huggingface.co/ncoop57/cm_code_clippy + 20b2be6..8908229 glowing-puddle-3 -> glowing-puddle-3 + +03/05/2022 00:43:20 - INFO - codeparrot_training - Step 30000: {'lr': 0.00045712741231096054, 'samples': 15360512, 'steps': 30000, 'loss/train': 1.8289461135864258} +03/05/2022 00:43:20 - INFO - codeparrot_training - Skipping example with length 873 (seq_length=1024) +03/05/2022 00:43:26 - INFO - codeparrot_training - Step 30001: {'lr': 0.0004571244406212656, 'samples': 15361024, 'steps': 30001, 'loss/train': 1.2173447608947754} +03/05/2022 00:43:29 - INFO - codeparrot_training - Step 30002: {'lr': 0.00045712146883824357, 'samples': 15361536, 'steps': 30002, 'loss/train': 1.5588682889938354} +03/05/2022 00:43:29 - INFO - codeparrot_training - Skipping example with length 563 (seq_length=1024) +03/05/2022 00:43:34 - INFO - codeparrot_training - Step 30003: {'lr': 0.00045711849696189585, 'samples': 15362048, 'steps': 30003, 'loss/train': 1.0836864709854126} +03/05/2022 00:43:37 - INFO - codeparrot_training - Step 30004: {'lr': 0.0004571155249922237, 'samples': 15362560, 'steps': 30004, 'loss/train': 1.896442174911499} +03/05/2022 00:43:38 - INFO - codeparrot_training - Skipping example with length 452 (seq_length=1024) +03/05/2022 00:43:42 - INFO - codeparrot_training - Step 30005: {'lr': 0.00045711255292922847, 'samples': 15363072, 'steps': 30005, 'loss/train': 2.269477605819702} +03/05/2022 00:43:45 - INFO - codeparrot_training - Step 30006: {'lr': 0.00045710958077291156, 'samples': 15363584, 'steps': 30006, 'loss/train': 2.0160892009735107} +03/05/2022 00:43:46 - INFO - codeparrot_training - Skipping example with length 149 (seq_length=1024) +03/05/2022 00:43:51 - INFO - codeparrot_training - Step 30007: {'lr': 0.00045710660852327423, 'samples': 15364096, 'steps': 30007, 'loss/train': 1.6335222721099854} +03/05/2022 00:43:54 - INFO - codeparrot_training - Step 30008: {'lr': 0.00045710363618031783, 'samples': 15364608, 'steps': 30008, 'loss/train': 1.1586971282958984} +03/05/2022 00:43:54 - INFO - codeparrot_training - Skipping example with length 942 (seq_length=1024) +03/05/2022 00:43:59 - INFO - codeparrot_training - Step 30009: {'lr': 0.0004571006637440438, 'samples': 15365120, 'steps': 30009, 'loss/train': 1.6179038286209106} +03/05/2022 00:44:02 - INFO - codeparrot_training - Step 30010: {'lr': 0.00045709769121445335, 'samples': 15365632, 'steps': 30010, 'loss/train': 2.0572926998138428} +03/05/2022 00:44:03 - INFO - codeparrot_training - Skipping example with length 559 (seq_length=1024) +03/05/2022 00:44:08 - INFO - codeparrot_training - Step 30011: {'lr': 0.00045709471859154793, 'samples': 15366144, 'steps': 30011, 'loss/train': 1.8443877696990967} +03/05/2022 00:44:11 - INFO - codeparrot_training - Step 30012: {'lr': 0.0004570917458753288, 'samples': 15366656, 'steps': 30012, 'loss/train': 1.659393310546875} +03/05/2022 00:44:12 - INFO - codeparrot_training - Skipping example with length 275 (seq_length=1024) +03/05/2022 00:44:16 - INFO - codeparrot_training - Step 30013: {'lr': 0.00045708877306579733, 'samples': 15367168, 'steps': 30013, 'loss/train': 1.1356165409088135} +03/05/2022 00:44:19 - INFO - codeparrot_training - Step 30014: {'lr': 0.00045708580016295486, 'samples': 15367680, 'steps': 30014, 'loss/train': 1.8352152109146118} +03/05/2022 00:44:20 - INFO - codeparrot_training - Skipping example with length 422 (seq_length=1024) +03/05/2022 00:44:24 - INFO - codeparrot_training - Step 30015: {'lr': 0.0004570828271668027, 'samples': 15368192, 'steps': 30015, 'loss/train': 1.8785282373428345} +03/05/2022 00:44:28 - INFO - codeparrot_training - Step 30016: {'lr': 0.0004570798540773422, 'samples': 15368704, 'steps': 30016, 'loss/train': 1.9754853248596191} +03/05/2022 00:44:28 - INFO - codeparrot_training - Skipping example with length 71 (seq_length=1024) +03/05/2022 00:44:33 - INFO - codeparrot_training - Step 30017: {'lr': 0.0004570768808945748, 'samples': 15369216, 'steps': 30017, 'loss/train': 1.8309119939804077} +03/05/2022 00:44:36 - INFO - codeparrot_training - Step 30018: {'lr': 0.00045707390761850163, 'samples': 15369728, 'steps': 30018, 'loss/train': 2.398773670196533} +03/05/2022 00:44:37 - INFO - codeparrot_training - Skipping example with length 366 (seq_length=1024) +03/05/2022 00:44:41 - INFO - codeparrot_training - Step 30019: {'lr': 0.00045707093424912426, 'samples': 15370240, 'steps': 30019, 'loss/train': 1.9269746541976929} +03/05/2022 00:44:45 - INFO - codeparrot_training - Step 30020: {'lr': 0.00045706796078644386, 'samples': 15370752, 'steps': 30020, 'loss/train': 2.2926995754241943} +03/05/2022 00:44:45 - INFO - codeparrot_training - Skipping example with length 724 (seq_length=1024) +03/05/2022 00:44:50 - INFO - codeparrot_training - Step 30021: {'lr': 0.00045706498723046185, 'samples': 15371264, 'steps': 30021, 'loss/train': 1.957943320274353} +03/05/2022 00:44:53 - INFO - codeparrot_training - Step 30022: {'lr': 0.0004570620135811795, 'samples': 15371776, 'steps': 30022, 'loss/train': 1.5461033582687378} +03/05/2022 00:44:53 - INFO - codeparrot_training - Skipping example with length 633 (seq_length=1024) +03/05/2022 00:44:59 - INFO - codeparrot_training - Step 30023: {'lr': 0.0004570590398385983, 'samples': 15372288, 'steps': 30023, 'loss/train': 1.4753776788711548} +03/05/2022 00:45:02 - INFO - codeparrot_training - Step 30024: {'lr': 0.0004570560660027194, 'samples': 15372800, 'steps': 30024, 'loss/train': 1.3805350065231323} +03/05/2022 00:45:02 - INFO - codeparrot_training - Skipping example with length 106 (seq_length=1024) +03/05/2022 00:45:07 - INFO - codeparrot_training - Step 30025: {'lr': 0.00045705309207354433, 'samples': 15373312, 'steps': 30025, 'loss/train': 1.6123640537261963} +03/05/2022 00:45:10 - INFO - codeparrot_training - Step 30026: {'lr': 0.00045705011805107426, 'samples': 15373824, 'steps': 30026, 'loss/train': 1.850448489189148} +03/05/2022 00:45:10 - INFO - codeparrot_training - Skipping example with length 761 (seq_length=1024) +03/05/2022 00:45:16 - INFO - codeparrot_training - Step 30027: {'lr': 0.00045704714393531064, 'samples': 15374336, 'steps': 30027, 'loss/train': 0.881676971912384} +03/05/2022 00:45:19 - INFO - codeparrot_training - Step 30028: {'lr': 0.00045704416972625474, 'samples': 15374848, 'steps': 30028, 'loss/train': 2.1063857078552246} +03/05/2022 00:45:19 - INFO - codeparrot_training - Skipping example with length 573 (seq_length=1024) +03/05/2022 00:45:24 - INFO - codeparrot_training - Step 30029: {'lr': 0.000457041195423908, 'samples': 15375360, 'steps': 30029, 'loss/train': 0.9632497429847717} +03/05/2022 00:45:28 - INFO - codeparrot_training - Step 30030: {'lr': 0.0004570382210282716, 'samples': 15375872, 'steps': 30030, 'loss/train': 1.6717524528503418} +03/05/2022 00:45:28 - INFO - codeparrot_training - Skipping example with length 501 (seq_length=1024) +03/05/2022 00:45:33 - INFO - codeparrot_training - Step 30031: {'lr': 0.00045703524653934705, 'samples': 15376384, 'steps': 30031, 'loss/train': 1.5573110580444336} +03/05/2022 00:45:36 - INFO - codeparrot_training - Skipping example with length 148 (seq_length=1024) +03/05/2022 00:45:38 - INFO - codeparrot_training - Step 30032: {'lr': 0.0004570322719571355, 'samples': 15376896, 'steps': 30032, 'loss/train': 1.7397286891937256} +03/05/2022 00:45:41 - INFO - codeparrot_training - Step 30033: {'lr': 0.00045702929728163845, 'samples': 15377408, 'steps': 30033, 'loss/train': 1.4734880924224854} +03/05/2022 00:45:44 - INFO - codeparrot_training - Skipping example with length 577 (seq_length=1024) +03/05/2022 00:45:46 - INFO - codeparrot_training - Step 30034: {'lr': 0.00045702632251285727, 'samples': 15377920, 'steps': 30034, 'loss/train': 2.11061954498291} +03/05/2022 00:45:50 - INFO - codeparrot_training - Step 30035: {'lr': 0.0004570233476507931, 'samples': 15378432, 'steps': 30035, 'loss/train': 1.3703136444091797} +03/05/2022 00:45:52 - INFO - codeparrot_training - Skipping example with length 660 (seq_length=1024) +03/05/2022 00:45:55 - INFO - codeparrot_training - Step 30036: {'lr': 0.0004570203726954475, 'samples': 15378944, 'steps': 30036, 'loss/train': 2.3308465480804443} +03/05/2022 00:45:58 - INFO - codeparrot_training - Step 30037: {'lr': 0.0004570173976468217, 'samples': 15379456, 'steps': 30037, 'loss/train': 1.9480481147766113} +03/05/2022 00:46:01 - INFO - codeparrot_training - Step 30038: {'lr': 0.0004570144225049171, 'samples': 15379968, 'steps': 30038, 'loss/train': 0.07623183727264404} +03/05/2022 00:46:02 - INFO - codeparrot_training - Skipping example with length 665 (seq_length=1024) +03/05/2022 00:46:07 - INFO - codeparrot_training - Step 30039: {'lr': 0.00045701144726973487, 'samples': 15380480, 'steps': 30039, 'loss/train': 1.9388179779052734} +03/05/2022 00:46:10 - INFO - codeparrot_training - Step 30040: {'lr': 0.0004570084719412766, 'samples': 15380992, 'steps': 30040, 'loss/train': 2.3384456634521484} +03/05/2022 00:46:10 - INFO - codeparrot_training - Skipping example with length 401 (seq_length=1024) +03/05/2022 00:46:15 - INFO - codeparrot_training - Step 30041: {'lr': 0.00045700549651954344, 'samples': 15381504, 'steps': 30041, 'loss/train': 1.5204285383224487} +03/05/2022 00:46:18 - INFO - codeparrot_training - Step 30042: {'lr': 0.0004570025210045368, 'samples': 15382016, 'steps': 30042, 'loss/train': 1.5184179544448853} +03/05/2022 00:46:19 - INFO - codeparrot_training - Skipping example with length 923 (seq_length=1024) +03/05/2022 00:46:24 - INFO - codeparrot_training - Step 30043: {'lr': 0.00045699954539625803, 'samples': 15382528, 'steps': 30043, 'loss/train': 1.788817048072815} +03/05/2022 00:46:27 - INFO - codeparrot_training - Step 30044: {'lr': 0.0004569965696947085, 'samples': 15383040, 'steps': 30044, 'loss/train': 1.287003517150879} +03/05/2022 00:46:27 - INFO - codeparrot_training - Skipping example with length 267 (seq_length=1024) +03/05/2022 00:46:33 - INFO - codeparrot_training - Step 30045: {'lr': 0.00045699359389988944, 'samples': 15383552, 'steps': 30045, 'loss/train': 1.7901946306228638} +03/05/2022 00:46:36 - INFO - codeparrot_training - Step 30046: {'lr': 0.0004569906180118023, 'samples': 15384064, 'steps': 30046, 'loss/train': 1.7433677911758423} +03/05/2022 00:46:38 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 00:46:41 - INFO - codeparrot_training - Step 30047: {'lr': 0.0004569876420304484, 'samples': 15384576, 'steps': 30047, 'loss/train': 2.262643337249756} +03/05/2022 00:46:44 - INFO - codeparrot_training - Step 30048: {'lr': 0.000456984665955829, 'samples': 15385088, 'steps': 30048, 'loss/train': 1.3046284914016724} +03/05/2022 00:46:46 - INFO - codeparrot_training - Skipping example with length 465 (seq_length=1024) +03/05/2022 00:46:49 - INFO - codeparrot_training - Step 30049: {'lr': 0.00045698168978794553, 'samples': 15385600, 'steps': 30049, 'loss/train': 2.065197467803955} +03/05/2022 00:46:53 - INFO - codeparrot_training - Step 30050: {'lr': 0.0004569787135267993, 'samples': 15386112, 'steps': 30050, 'loss/train': 1.3863437175750732} +03/05/2022 00:46:54 - INFO - codeparrot_training - Skipping example with length 389 (seq_length=1024) +03/05/2022 00:46:58 - INFO - codeparrot_training - Step 30051: {'lr': 0.00045697573717239174, 'samples': 15386624, 'steps': 30051, 'loss/train': 2.091391086578369} +03/05/2022 00:47:01 - INFO - codeparrot_training - Step 30052: {'lr': 0.0004569727607247239, 'samples': 15387136, 'steps': 30052, 'loss/train': 1.4294064044952393} +03/05/2022 00:47:02 - INFO - codeparrot_training - Skipping example with length 513 (seq_length=1024) +03/05/2022 00:47:06 - INFO - codeparrot_training - Step 30053: {'lr': 0.00045696978418379754, 'samples': 15387648, 'steps': 30053, 'loss/train': 2.2440483570098877} +03/05/2022 00:47:09 - INFO - codeparrot_training - Step 30054: {'lr': 0.0004569668075496137, 'samples': 15388160, 'steps': 30054, 'loss/train': 1.721880316734314} +03/05/2022 00:47:10 - INFO - codeparrot_training - Skipping example with length 248 (seq_length=1024) +03/05/2022 00:47:15 - INFO - codeparrot_training - Step 30055: {'lr': 0.00045696383082217387, 'samples': 15388672, 'steps': 30055, 'loss/train': 1.45264732837677} +03/05/2022 00:47:18 - INFO - codeparrot_training - Step 30056: {'lr': 0.00045696085400147925, 'samples': 15389184, 'steps': 30056, 'loss/train': 1.2470375299453735} +03/05/2022 00:47:19 - INFO - codeparrot_training - Skipping example with length 837 (seq_length=1024) +03/05/2022 00:47:23 - INFO - codeparrot_training - Step 30057: {'lr': 0.00045695787708753126, 'samples': 15389696, 'steps': 30057, 'loss/train': 1.4519813060760498} +03/05/2022 00:47:26 - INFO - codeparrot_training - Step 30058: {'lr': 0.0004569549000803313, 'samples': 15390208, 'steps': 30058, 'loss/train': 0.4629649221897125} +03/05/2022 00:47:27 - INFO - codeparrot_training - Skipping example with length 519 (seq_length=1024) +03/05/2022 00:47:31 - INFO - codeparrot_training - Step 30059: {'lr': 0.00045695192297988066, 'samples': 15390720, 'steps': 30059, 'loss/train': 2.955383062362671} +03/05/2022 00:47:35 - INFO - codeparrot_training - Step 30060: {'lr': 0.00045694894578618064, 'samples': 15391232, 'steps': 30060, 'loss/train': 1.5059194564819336} +03/05/2022 00:47:35 - INFO - codeparrot_training - Skipping example with length 35 (seq_length=1024) +03/05/2022 00:47:40 - INFO - codeparrot_training - Step 30061: {'lr': 0.00045694596849923263, 'samples': 15391744, 'steps': 30061, 'loss/train': 1.7649555206298828} +03/05/2022 00:47:43 - INFO - codeparrot_training - Step 30062: {'lr': 0.0004569429911190379, 'samples': 15392256, 'steps': 30062, 'loss/train': 1.6643859148025513} +03/05/2022 00:47:44 - INFO - codeparrot_training - Skipping example with length 788 (seq_length=1024) +03/05/2022 00:47:48 - INFO - codeparrot_training - Step 30063: {'lr': 0.00045694001364559797, 'samples': 15392768, 'steps': 30063, 'loss/train': 1.5236775875091553} +03/05/2022 00:47:52 - INFO - codeparrot_training - Step 30064: {'lr': 0.00045693703607891403, 'samples': 15393280, 'steps': 30064, 'loss/train': 2.0967564582824707} +03/05/2022 00:47:52 - INFO - codeparrot_training - Skipping example with length 308 (seq_length=1024) +03/05/2022 00:47:57 - INFO - codeparrot_training - Step 30065: {'lr': 0.0004569340584189874, 'samples': 15393792, 'steps': 30065, 'loss/train': 1.8825595378875732} +03/05/2022 00:48:00 - INFO - codeparrot_training - Step 30066: {'lr': 0.0004569310806658195, 'samples': 15394304, 'steps': 30066, 'loss/train': 1.6849169731140137} +03/05/2022 00:48:00 - INFO - codeparrot_training - Skipping example with length 528 (seq_length=1024) +03/05/2022 00:48:05 - INFO - codeparrot_training - Step 30067: {'lr': 0.0004569281028194117, 'samples': 15394816, 'steps': 30067, 'loss/train': 2.5284647941589355} +03/05/2022 00:48:09 - INFO - codeparrot_training - Step 30068: {'lr': 0.0004569251248797652, 'samples': 15395328, 'steps': 30068, 'loss/train': 1.8243889808654785} +03/05/2022 00:48:10 - INFO - codeparrot_training - Skipping example with length 557 (seq_length=1024) +03/05/2022 00:48:14 - INFO - codeparrot_training - Step 30069: {'lr': 0.0004569221468468815, 'samples': 15395840, 'steps': 30069, 'loss/train': 0.8982431888580322} +03/05/2022 00:48:17 - INFO - codeparrot_training - Step 30070: {'lr': 0.0004569191687207618, 'samples': 15396352, 'steps': 30070, 'loss/train': 3.1284542083740234} +03/05/2022 00:48:19 - INFO - codeparrot_training - Skipping example with length 1002 (seq_length=1024) +03/05/2022 00:48:23 - INFO - codeparrot_training - Step 30071: {'lr': 0.0004569161905014076, 'samples': 15396864, 'steps': 30071, 'loss/train': 0.5278277397155762} +03/05/2022 00:48:26 - INFO - codeparrot_training - Step 30072: {'lr': 0.0004569132121888201, 'samples': 15397376, 'steps': 30072, 'loss/train': 2.1388659477233887} +03/05/2022 00:48:28 - INFO - codeparrot_training - Skipping example with length 899 (seq_length=1024) +03/05/2022 00:48:31 - INFO - codeparrot_training - Step 30073: {'lr': 0.0004569102337830007, 'samples': 15397888, 'steps': 30073, 'loss/train': 1.5493289232254028} +03/05/2022 00:48:34 - INFO - codeparrot_training - Step 30074: {'lr': 0.00045690725528395077, 'samples': 15398400, 'steps': 30074, 'loss/train': 3.477476119995117} +03/05/2022 00:48:36 - INFO - codeparrot_training - Skipping example with length 724 (seq_length=1024) +03/05/2022 00:48:39 - INFO - codeparrot_training - Step 30075: {'lr': 0.0004569042766916717, 'samples': 15398912, 'steps': 30075, 'loss/train': 1.8774348497390747} +03/05/2022 00:48:43 - INFO - codeparrot_training - Step 30076: {'lr': 0.0004569012980061646, 'samples': 15399424, 'steps': 30076, 'loss/train': 1.8760998249053955} +03/05/2022 00:48:45 - INFO - codeparrot_training - Skipping example with length 712 (seq_length=1024) +03/05/2022 00:48:48 - INFO - codeparrot_training - Step 30077: {'lr': 0.00045689831922743107, 'samples': 15399936, 'steps': 30077, 'loss/train': 1.7275433540344238} +03/05/2022 00:48:51 - INFO - codeparrot_training - Step 30078: {'lr': 0.0004568953403554723, 'samples': 15400448, 'steps': 30078, 'loss/train': 1.9771796464920044} +03/05/2022 00:48:53 - INFO - codeparrot_training - Skipping example with length 68 (seq_length=1024) +03/05/2022 00:48:56 - INFO - codeparrot_training - Step 30079: {'lr': 0.0004568923613902897, 'samples': 15400960, 'steps': 30079, 'loss/train': 1.8651039600372314} +03/05/2022 00:48:59 - INFO - codeparrot_training - Step 30080: {'lr': 0.0004568893823318846, 'samples': 15401472, 'steps': 30080, 'loss/train': 1.0507383346557617} +03/05/2022 00:49:01 - INFO - codeparrot_training - Skipping example with length 1007 (seq_length=1024) +03/05/2022 00:49:05 - INFO - codeparrot_training - Step 30081: {'lr': 0.0004568864031802583, 'samples': 15401984, 'steps': 30081, 'loss/train': 2.374959945678711} +03/05/2022 00:49:08 - INFO - codeparrot_training - Step 30082: {'lr': 0.00045688342393541227, 'samples': 15402496, 'steps': 30082, 'loss/train': 0.5805590152740479} +03/05/2022 00:49:10 - INFO - codeparrot_training - Skipping example with length 266 (seq_length=1024) +03/05/2022 00:49:13 - INFO - codeparrot_training - Step 30083: {'lr': 0.00045688044459734766, 'samples': 15403008, 'steps': 30083, 'loss/train': 1.5638983249664307} +03/05/2022 00:49:16 - INFO - codeparrot_training - Step 30084: {'lr': 0.000456877465166066, 'samples': 15403520, 'steps': 30084, 'loss/train': 0.7802882790565491} +03/05/2022 00:49:18 - INFO - codeparrot_training - Skipping example with length 29 (seq_length=1024) +03/05/2022 00:49:21 - INFO - codeparrot_training - Step 30085: {'lr': 0.0004568744856415685, 'samples': 15404032, 'steps': 30085, 'loss/train': 1.0853203535079956} +03/05/2022 00:49:25 - INFO - codeparrot_training - Step 30086: {'lr': 0.0004568715060238565, 'samples': 15404544, 'steps': 30086, 'loss/train': 1.3193738460540771} +03/05/2022 00:49:26 - INFO - codeparrot_training - Skipping example with length 329 (seq_length=1024) +03/05/2022 00:49:30 - INFO - codeparrot_training - Step 30087: {'lr': 0.0004568685263129315, 'samples': 15405056, 'steps': 30087, 'loss/train': 1.794023871421814} +03/05/2022 00:49:33 - INFO - codeparrot_training - Step 30088: {'lr': 0.00045686554650879464, 'samples': 15405568, 'steps': 30088, 'loss/train': 1.9164760112762451} +03/05/2022 00:49:36 - INFO - codeparrot_training - Skipping example with length 707 (seq_length=1024) +03/05/2022 00:49:38 - INFO - codeparrot_training - Step 30089: {'lr': 0.0004568625666114474, 'samples': 15406080, 'steps': 30089, 'loss/train': 1.6596910953521729} +03/05/2022 00:49:42 - INFO - codeparrot_training - Step 30090: {'lr': 0.00045685958662089113, 'samples': 15406592, 'steps': 30090, 'loss/train': 1.7234231233596802} +03/05/2022 00:49:44 - INFO - codeparrot_training - Skipping example with length 725 (seq_length=1024) +03/05/2022 00:49:47 - INFO - codeparrot_training - Step 30091: {'lr': 0.000456856606537127, 'samples': 15407104, 'steps': 30091, 'loss/train': 2.4382810592651367} +03/05/2022 00:49:50 - INFO - codeparrot_training - Step 30092: {'lr': 0.00045685362636015657, 'samples': 15407616, 'steps': 30092, 'loss/train': 1.4692848920822144} +03/05/2022 00:49:52 - INFO - codeparrot_training - Skipping example with length 280 (seq_length=1024) +03/05/2022 00:49:55 - INFO - codeparrot_training - Step 30093: {'lr': 0.00045685064608998107, 'samples': 15408128, 'steps': 30093, 'loss/train': 1.6077817678451538} +03/05/2022 00:49:58 - INFO - codeparrot_training - Step 30094: {'lr': 0.00045684766572660185, 'samples': 15408640, 'steps': 30094, 'loss/train': 1.5444180965423584} +03/05/2022 00:50:00 - INFO - codeparrot_training - Skipping example with length 245 (seq_length=1024) +03/05/2022 00:50:04 - INFO - codeparrot_training - Step 30095: {'lr': 0.0004568446852700203, 'samples': 15409152, 'steps': 30095, 'loss/train': 1.5687755346298218} +03/05/2022 00:50:07 - INFO - codeparrot_training - Step 30096: {'lr': 0.00045684170472023766, 'samples': 15409664, 'steps': 30096, 'loss/train': 2.0847253799438477} +03/05/2022 00:50:09 - INFO - codeparrot_training - Skipping example with length 365 (seq_length=1024) +03/05/2022 00:50:12 - INFO - codeparrot_training - Step 30097: {'lr': 0.00045683872407725534, 'samples': 15410176, 'steps': 30097, 'loss/train': 2.2411348819732666} +03/05/2022 00:50:15 - INFO - codeparrot_training - Step 30098: {'lr': 0.00045683574334107473, 'samples': 15410688, 'steps': 30098, 'loss/train': 1.59357488155365} +03/05/2022 00:50:19 - INFO - codeparrot_training - Step 30099: {'lr': 0.00045683276251169713, 'samples': 15411200, 'steps': 30099, 'loss/train': 2.1585466861724854} +03/05/2022 00:50:19 - INFO - codeparrot_training - Skipping example with length 883 (seq_length=1024) +03/05/2022 00:50:24 - INFO - codeparrot_training - Step 30100: {'lr': 0.00045682978158912384, 'samples': 15411712, 'steps': 30100, 'loss/train': 0.8039388060569763} +03/05/2022 00:50:27 - INFO - codeparrot_training - Step 30101: {'lr': 0.0004568268005733562, 'samples': 15412224, 'steps': 30101, 'loss/train': 1.82028067111969} +03/05/2022 00:50:27 - INFO - codeparrot_training - Skipping example with length 592 (seq_length=1024) +03/05/2022 00:50:32 - INFO - codeparrot_training - Step 30102: {'lr': 0.0004568238194643958, 'samples': 15412736, 'steps': 30102, 'loss/train': 1.6911276578903198} +03/05/2022 00:50:36 - INFO - codeparrot_training - Step 30103: {'lr': 0.00045682083826224356, 'samples': 15413248, 'steps': 30103, 'loss/train': 1.6601359844207764} +03/05/2022 00:50:36 - INFO - codeparrot_training - Skipping example with length 71 (seq_length=1024) +03/05/2022 00:50:41 - INFO - codeparrot_training - Step 30104: {'lr': 0.00045681785696690113, 'samples': 15413760, 'steps': 30104, 'loss/train': 1.8160486221313477} +03/05/2022 00:50:44 - INFO - codeparrot_training - Step 30105: {'lr': 0.0004568148755783698, 'samples': 15414272, 'steps': 30105, 'loss/train': 1.6059305667877197} +03/05/2022 00:50:46 - INFO - codeparrot_training - Skipping example with length 900 (seq_length=1024) +03/05/2022 00:50:50 - INFO - codeparrot_training - Step 30106: {'lr': 0.00045681189409665083, 'samples': 15414784, 'steps': 30106, 'loss/train': 2.16241717338562} +03/05/2022 00:50:53 - INFO - codeparrot_training - Step 30107: {'lr': 0.00045680891252174557, 'samples': 15415296, 'steps': 30107, 'loss/train': 1.1611987352371216} +03/05/2022 00:50:54 - INFO - codeparrot_training - Skipping example with length 816 (seq_length=1024) +03/05/2022 00:50:58 - INFO - codeparrot_training - Step 30108: {'lr': 0.0004568059308536554, 'samples': 15415808, 'steps': 30108, 'loss/train': 1.2094054222106934} +03/05/2022 00:51:01 - INFO - codeparrot_training - Step 30109: {'lr': 0.00045680294909238175, 'samples': 15416320, 'steps': 30109, 'loss/train': 2.348546266555786} +03/05/2022 00:51:02 - INFO - codeparrot_training - Skipping example with length 789 (seq_length=1024) +03/05/2022 00:51:06 - INFO - codeparrot_training - Step 30110: {'lr': 0.00045679996723792585, 'samples': 15416832, 'steps': 30110, 'loss/train': 1.7360273599624634} +03/05/2022 00:51:10 - INFO - codeparrot_training - Step 30111: {'lr': 0.00045679698529028906, 'samples': 15417344, 'steps': 30111, 'loss/train': 1.3415448665618896} +03/05/2022 00:51:11 - INFO - codeparrot_training - Skipping example with length 87 (seq_length=1024) +03/05/2022 00:51:15 - INFO - codeparrot_training - Step 30112: {'lr': 0.00045679400324947274, 'samples': 15417856, 'steps': 30112, 'loss/train': 1.991532325744629} +03/05/2022 00:51:18 - INFO - codeparrot_training - Step 30113: {'lr': 0.00045679102111547825, 'samples': 15418368, 'steps': 30113, 'loss/train': 1.521023154258728} +03/05/2022 00:51:19 - INFO - codeparrot_training - Skipping example with length 962 (seq_length=1024) +03/05/2022 00:51:23 - INFO - codeparrot_training - Step 30114: {'lr': 0.00045678803888830687, 'samples': 15418880, 'steps': 30114, 'loss/train': 1.7485442161560059} +03/05/2022 00:51:26 - INFO - codeparrot_training - Step 30115: {'lr': 0.0004567850565679601, 'samples': 15419392, 'steps': 30115, 'loss/train': 0.4203520119190216} +03/05/2022 00:51:27 - INFO - codeparrot_training - Skipping example with length 529 (seq_length=1024) +03/05/2022 00:51:32 - INFO - codeparrot_training - Step 30116: {'lr': 0.00045678207415443913, 'samples': 15419904, 'steps': 30116, 'loss/train': 1.745429515838623} +03/05/2022 00:51:35 - INFO - codeparrot_training - Step 30117: {'lr': 0.0004567790916477453, 'samples': 15420416, 'steps': 30117, 'loss/train': 0.867196798324585} +03/05/2022 00:51:36 - INFO - codeparrot_training - Skipping example with length 778 (seq_length=1024) +03/05/2022 00:51:40 - INFO - codeparrot_training - Step 30118: {'lr': 0.00045677610904788004, 'samples': 15420928, 'steps': 30118, 'loss/train': 2.043165445327759} +03/05/2022 00:51:43 - INFO - codeparrot_training - Step 30119: {'lr': 0.00045677312635484466, 'samples': 15421440, 'steps': 30119, 'loss/train': 1.6716259717941284} +03/05/2022 00:51:44 - INFO - codeparrot_training - Skipping example with length 561 (seq_length=1024) +03/05/2022 00:51:49 - INFO - codeparrot_training - Step 30120: {'lr': 0.00045677014356864043, 'samples': 15421952, 'steps': 30120, 'loss/train': 1.5415599346160889} +03/05/2022 00:51:52 - INFO - codeparrot_training - Step 30121: {'lr': 0.0004567671606892688, 'samples': 15422464, 'steps': 30121, 'loss/train': 2.024001121520996} +03/05/2022 00:51:53 - INFO - codeparrot_training - Skipping example with length 824 (seq_length=1024) +03/05/2022 00:51:57 - INFO - codeparrot_training - Step 30122: {'lr': 0.00045676417771673116, 'samples': 15422976, 'steps': 30122, 'loss/train': 1.776038646697998} +03/05/2022 00:52:01 - INFO - codeparrot_training - Step 30123: {'lr': 0.0004567611946510287, 'samples': 15423488, 'steps': 30123, 'loss/train': 2.036388874053955} +03/05/2022 00:52:01 - INFO - codeparrot_training - Skipping example with length 506 (seq_length=1024) +03/05/2022 00:52:06 - INFO - codeparrot_training - Step 30124: {'lr': 0.00045675821149216285, 'samples': 15424000, 'steps': 30124, 'loss/train': 2.1159322261810303} +03/05/2022 00:52:09 - INFO - codeparrot_training - Step 30125: {'lr': 0.00045675522824013495, 'samples': 15424512, 'steps': 30125, 'loss/train': 2.169635534286499} +03/05/2022 00:52:09 - INFO - codeparrot_training - Skipping example with length 862 (seq_length=1024) +03/05/2022 00:52:14 - INFO - codeparrot_training - Step 30126: {'lr': 0.00045675224489494633, 'samples': 15425024, 'steps': 30126, 'loss/train': 1.9738236665725708} +03/05/2022 00:52:17 - INFO - codeparrot_training - Step 30127: {'lr': 0.00045674926145659834, 'samples': 15425536, 'steps': 30127, 'loss/train': 1.6067774295806885} +03/05/2022 00:52:18 - INFO - codeparrot_training - Skipping example with length 971 (seq_length=1024) +03/05/2022 00:52:23 - INFO - codeparrot_training - Step 30128: {'lr': 0.0004567462779250923, 'samples': 15426048, 'steps': 30128, 'loss/train': 1.0786906480789185} +03/05/2022 00:52:26 - INFO - codeparrot_training - Step 30129: {'lr': 0.0004567432943004296, 'samples': 15426560, 'steps': 30129, 'loss/train': 1.6639996767044067} +03/05/2022 00:52:26 - INFO - codeparrot_training - Skipping example with length 431 (seq_length=1024) +03/05/2022 00:52:31 - INFO - codeparrot_training - Step 30130: {'lr': 0.00045674031058261157, 'samples': 15427072, 'steps': 30130, 'loss/train': 0.2703652083873749} +03/05/2022 00:52:34 - INFO - codeparrot_training - Step 30131: {'lr': 0.0004567373267716395, 'samples': 15427584, 'steps': 30131, 'loss/train': 1.8357006311416626} +03/05/2022 00:52:35 - INFO - codeparrot_training - Skipping example with length 607 (seq_length=1024) +03/05/2022 00:52:40 - INFO - codeparrot_training - Step 30132: {'lr': 0.0004567343428675148, 'samples': 15428096, 'steps': 30132, 'loss/train': 0.7730497121810913} +03/05/2022 00:52:43 - INFO - codeparrot_training - Step 30133: {'lr': 0.00045673135887023874, 'samples': 15428608, 'steps': 30133, 'loss/train': 1.355360984802246} +03/05/2022 00:52:43 - INFO - codeparrot_training - Skipping example with length 840 (seq_length=1024) +03/05/2022 00:52:48 - INFO - codeparrot_training - Step 30134: {'lr': 0.0004567283747798128, 'samples': 15429120, 'steps': 30134, 'loss/train': 1.4444273710250854} +03/05/2022 00:52:51 - INFO - codeparrot_training - Step 30135: {'lr': 0.0004567253905962383, 'samples': 15429632, 'steps': 30135, 'loss/train': 1.5038108825683594} +03/05/2022 00:52:52 - INFO - codeparrot_training - Skipping example with length 846 (seq_length=1024) +03/05/2022 00:52:57 - INFO - codeparrot_training - Step 30136: {'lr': 0.00045672240631951645, 'samples': 15430144, 'steps': 30136, 'loss/train': 2.4408342838287354} +03/05/2022 00:53:00 - INFO - codeparrot_training - Step 30137: {'lr': 0.0004567194219496487, 'samples': 15430656, 'steps': 30137, 'loss/train': 0.2602927088737488} +03/05/2022 00:53:01 - INFO - codeparrot_training - Skipping example with length 184 (seq_length=1024) +03/05/2022 00:53:05 - INFO - codeparrot_training - Step 30138: {'lr': 0.0004567164374866363, 'samples': 15431168, 'steps': 30138, 'loss/train': 1.7092548608779907} +03/05/2022 00:53:08 - INFO - codeparrot_training - Step 30139: {'lr': 0.00045671345293048075, 'samples': 15431680, 'steps': 30139, 'loss/train': 1.6997926235198975} +03/05/2022 00:53:09 - INFO - codeparrot_training - Skipping example with length 15 (seq_length=1024) +03/05/2022 00:53:14 - INFO - codeparrot_training - Step 30140: {'lr': 0.00045671046828118324, 'samples': 15432192, 'steps': 30140, 'loss/train': 2.019731044769287} +03/05/2022 00:53:17 - INFO - codeparrot_training - Step 30141: {'lr': 0.0004567074835387452, 'samples': 15432704, 'steps': 30141, 'loss/train': 1.9466673135757446} +03/05/2022 00:53:17 - INFO - codeparrot_training - Skipping example with length 874 (seq_length=1024) +03/05/2022 00:53:22 - INFO - codeparrot_training - Step 30142: {'lr': 0.000456704498703168, 'samples': 15433216, 'steps': 30142, 'loss/train': 1.6673802137374878} +03/05/2022 00:53:25 - INFO - codeparrot_training - Step 30143: {'lr': 0.0004567015137744529, 'samples': 15433728, 'steps': 30143, 'loss/train': 3.781850814819336} +03/05/2022 00:53:26 - INFO - codeparrot_training - Skipping example with length 148 (seq_length=1024) +03/05/2022 00:53:30 - INFO - codeparrot_training - Step 30144: {'lr': 0.00045669852875260134, 'samples': 15434240, 'steps': 30144, 'loss/train': 1.9569998979568481} +03/05/2022 00:53:34 - INFO - codeparrot_training - Step 30145: {'lr': 0.00045669554363761454, 'samples': 15434752, 'steps': 30145, 'loss/train': 1.8220595121383667} +03/05/2022 00:53:34 - INFO - codeparrot_training - Skipping example with length 366 (seq_length=1024) +03/05/2022 00:53:39 - INFO - codeparrot_training - Step 30146: {'lr': 0.0004566925584294939, 'samples': 15435264, 'steps': 30146, 'loss/train': 2.322819948196411} +03/05/2022 00:53:42 - INFO - codeparrot_training - Step 30147: {'lr': 0.00045668957312824086, 'samples': 15435776, 'steps': 30147, 'loss/train': 2.182586669921875} +03/05/2022 00:53:42 - INFO - codeparrot_training - Skipping example with length 73 (seq_length=1024) +03/05/2022 00:53:47 - INFO - codeparrot_training - Step 30148: {'lr': 0.00045668658773385663, 'samples': 15436288, 'steps': 30148, 'loss/train': 0.7960249185562134} +03/05/2022 00:53:51 - INFO - codeparrot_training - Step 30149: {'lr': 0.00045668360224634263, 'samples': 15436800, 'steps': 30149, 'loss/train': 1.796868920326233} +03/05/2022 00:53:51 - INFO - codeparrot_training - Skipping example with length 674 (seq_length=1024) +03/05/2022 00:53:56 - INFO - codeparrot_training - Step 30150: {'lr': 0.00045668061666570027, 'samples': 15437312, 'steps': 30150, 'loss/train': 0.5574421882629395} +03/05/2022 00:53:59 - INFO - codeparrot_training - Skipping example with length 781 (seq_length=1024) +03/05/2022 00:54:01 - INFO - codeparrot_training - Step 30151: {'lr': 0.0004566776309919307, 'samples': 15437824, 'steps': 30151, 'loss/train': 1.5253926515579224} +03/05/2022 00:54:04 - INFO - codeparrot_training - Step 30152: {'lr': 0.0004566746452250354, 'samples': 15438336, 'steps': 30152, 'loss/train': 1.9378290176391602} +03/05/2022 00:54:07 - INFO - codeparrot_training - Skipping example with length 168 (seq_length=1024) +03/05/2022 00:54:09 - INFO - codeparrot_training - Step 30153: {'lr': 0.00045667165936501573, 'samples': 15438848, 'steps': 30153, 'loss/train': 1.9853847026824951} +03/05/2022 00:54:13 - INFO - codeparrot_training - Step 30154: {'lr': 0.000456668673411873, 'samples': 15439360, 'steps': 30154, 'loss/train': 1.8432587385177612} +03/05/2022 00:54:15 - INFO - codeparrot_training - Skipping example with length 910 (seq_length=1024) +03/05/2022 00:54:18 - INFO - codeparrot_training - Step 30155: {'lr': 0.00045666568736560853, 'samples': 15439872, 'steps': 30155, 'loss/train': 2.5243008136749268} +03/05/2022 00:54:21 - INFO - codeparrot_training - Step 30156: {'lr': 0.0004566627012262238, 'samples': 15440384, 'steps': 30156, 'loss/train': 1.9896689653396606} +03/05/2022 00:54:23 - INFO - codeparrot_training - Skipping example with length 921 (seq_length=1024) +03/05/2022 00:54:26 - INFO - codeparrot_training - Step 30157: {'lr': 0.0004566597149937199, 'samples': 15440896, 'steps': 30157, 'loss/train': 1.7000889778137207} +03/05/2022 00:54:29 - INFO - codeparrot_training - Step 30158: {'lr': 0.00045665672866809835, 'samples': 15441408, 'steps': 30158, 'loss/train': 2.9940712451934814} +03/05/2022 00:54:32 - INFO - codeparrot_training - Skipping example with length 613 (seq_length=1024) +03/05/2022 00:54:35 - INFO - codeparrot_training - Step 30159: {'lr': 0.0004566537422493605, 'samples': 15441920, 'steps': 30159, 'loss/train': 1.5751402378082275} +03/05/2022 00:54:38 - INFO - codeparrot_training - Step 30160: {'lr': 0.00045665075573750764, 'samples': 15442432, 'steps': 30160, 'loss/train': 2.1699953079223633} +03/05/2022 00:54:40 - INFO - codeparrot_training - Skipping example with length 668 (seq_length=1024) +03/05/2022 00:54:43 - INFO - codeparrot_training - Step 30161: {'lr': 0.00045664776913254115, 'samples': 15442944, 'steps': 30161, 'loss/train': 1.7363845109939575} +03/05/2022 00:54:46 - INFO - codeparrot_training - Step 30162: {'lr': 0.0004566447824344624, 'samples': 15443456, 'steps': 30162, 'loss/train': 1.8542977571487427} +03/05/2022 00:54:48 - INFO - codeparrot_training - Skipping example with length 502 (seq_length=1024) +03/05/2022 00:54:52 - INFO - codeparrot_training - Step 30163: {'lr': 0.00045664179564327266, 'samples': 15443968, 'steps': 30163, 'loss/train': 2.0066847801208496} +03/05/2022 00:54:55 - INFO - codeparrot_training - Step 30164: {'lr': 0.00045663880875897325, 'samples': 15444480, 'steps': 30164, 'loss/train': 1.7360237836837769} +03/05/2022 00:54:57 - INFO - codeparrot_training - Skipping example with length 820 (seq_length=1024) +03/05/2022 00:55:00 - INFO - codeparrot_training - Step 30165: {'lr': 0.00045663582178156564, 'samples': 15444992, 'steps': 30165, 'loss/train': 1.1062883138656616} +03/05/2022 00:55:03 - INFO - codeparrot_training - Step 30166: {'lr': 0.00045663283471105115, 'samples': 15445504, 'steps': 30166, 'loss/train': 1.268115758895874} +03/05/2022 00:55:05 - INFO - codeparrot_training - Skipping example with length 806 (seq_length=1024) +03/05/2022 00:55:09 - INFO - codeparrot_training - Step 30167: {'lr': 0.00045662984754743106, 'samples': 15446016, 'steps': 30167, 'loss/train': 2.4817821979522705} +03/05/2022 00:55:12 - INFO - codeparrot_training - Step 30168: {'lr': 0.00045662686029070674, 'samples': 15446528, 'steps': 30168, 'loss/train': 1.5153189897537231} +03/05/2022 00:55:14 - INFO - codeparrot_training - Skipping example with length 40 (seq_length=1024) +03/05/2022 00:55:17 - INFO - codeparrot_training - Step 30169: {'lr': 0.0004566238729408796, 'samples': 15447040, 'steps': 30169, 'loss/train': 2.1652262210845947} +03/05/2022 00:55:20 - INFO - codeparrot_training - Step 30170: {'lr': 0.00045662088549795087, 'samples': 15447552, 'steps': 30170, 'loss/train': 0.12777474522590637} +03/05/2022 00:55:22 - INFO - codeparrot_training - Skipping example with length 781 (seq_length=1024) +03/05/2022 00:55:25 - INFO - codeparrot_training - Step 30171: {'lr': 0.000456617897961922, 'samples': 15448064, 'steps': 30171, 'loss/train': 1.5894675254821777} +03/05/2022 00:55:29 - INFO - codeparrot_training - Step 30172: {'lr': 0.00045661491033279427, 'samples': 15448576, 'steps': 30172, 'loss/train': 2.382303476333618} +03/05/2022 00:55:30 - INFO - codeparrot_training - Skipping example with length 760 (seq_length=1024) +03/05/2022 00:55:34 - INFO - codeparrot_training - Step 30173: {'lr': 0.00045661192261056905, 'samples': 15449088, 'steps': 30173, 'loss/train': 0.10404415428638458} +03/05/2022 00:55:37 - INFO - codeparrot_training - Step 30174: {'lr': 0.00045660893479524767, 'samples': 15449600, 'steps': 30174, 'loss/train': 2.171333074569702} +03/05/2022 00:55:39 - INFO - codeparrot_training - Skipping example with length 363 (seq_length=1024) +03/05/2022 00:55:42 - INFO - codeparrot_training - Step 30175: {'lr': 0.00045660594688683154, 'samples': 15450112, 'steps': 30175, 'loss/train': 0.8810412883758545} +03/05/2022 00:55:46 - INFO - codeparrot_training - Step 30176: {'lr': 0.00045660295888532196, 'samples': 15450624, 'steps': 30176, 'loss/train': 1.6395387649536133} +03/05/2022 00:55:47 - INFO - codeparrot_training - Skipping example with length 395 (seq_length=1024) +03/05/2022 00:55:51 - INFO - codeparrot_training - Step 30177: {'lr': 0.00045659997079072024, 'samples': 15451136, 'steps': 30177, 'loss/train': 1.5356953144073486} +03/05/2022 00:55:54 - INFO - codeparrot_training - Step 30178: {'lr': 0.00045659698260302773, 'samples': 15451648, 'steps': 30178, 'loss/train': 1.5441616773605347} +03/05/2022 00:55:56 - INFO - codeparrot_training - Skipping example with length 257 (seq_length=1024) +03/05/2022 00:55:59 - INFO - codeparrot_training - Step 30179: {'lr': 0.00045659399432224583, 'samples': 15452160, 'steps': 30179, 'loss/train': 1.3203091621398926} +03/05/2022 00:56:02 - INFO - codeparrot_training - Step 30180: {'lr': 0.00045659100594837586, 'samples': 15452672, 'steps': 30180, 'loss/train': 1.2761400938034058} +03/05/2022 00:56:04 - INFO - codeparrot_training - Skipping example with length 214 (seq_length=1024) +03/05/2022 00:56:08 - INFO - codeparrot_training - Step 30181: {'lr': 0.0004565880174814192, 'samples': 15453184, 'steps': 30181, 'loss/train': 1.816937804222107} +03/05/2022 00:56:11 - INFO - codeparrot_training - Step 30182: {'lr': 0.0004565850289213772, 'samples': 15453696, 'steps': 30182, 'loss/train': 0.7331827282905579} +03/05/2022 00:56:13 - INFO - codeparrot_training - Skipping example with length 756 (seq_length=1024) +03/05/2022 00:56:16 - INFO - codeparrot_training - Step 30183: {'lr': 0.0004565820402682511, 'samples': 15454208, 'steps': 30183, 'loss/train': 6.669641017913818} +03/05/2022 00:56:19 - INFO - codeparrot_training - Step 30184: {'lr': 0.00045657905152204236, 'samples': 15454720, 'steps': 30184, 'loss/train': 2.00179123878479} +03/05/2022 00:56:22 - INFO - codeparrot_training - Skipping example with length 318 (seq_length=1024) +03/05/2022 00:56:25 - INFO - codeparrot_training - Step 30185: {'lr': 0.0004565760626827523, 'samples': 15455232, 'steps': 30185, 'loss/train': 1.325749397277832} +03/05/2022 00:56:28 - INFO - codeparrot_training - Step 30186: {'lr': 0.00045657307375038226, 'samples': 15455744, 'steps': 30186, 'loss/train': 1.6459600925445557} +03/05/2022 00:56:31 - INFO - codeparrot_training - Skipping example with length 870 (seq_length=1024) +03/05/2022 00:56:33 - INFO - codeparrot_training - Step 30187: {'lr': 0.00045657008472493356, 'samples': 15456256, 'steps': 30187, 'loss/train': 1.857986330986023} +03/05/2022 00:56:36 - INFO - codeparrot_training - Step 30188: {'lr': 0.0004565670956064075, 'samples': 15456768, 'steps': 30188, 'loss/train': 1.1490070819854736} +03/05/2022 00:56:39 - INFO - codeparrot_training - Skipping example with length 306 (seq_length=1024) +03/05/2022 00:56:42 - INFO - codeparrot_training - Step 30189: {'lr': 0.00045656410639480563, 'samples': 15457280, 'steps': 30189, 'loss/train': 1.8654168844223022} +03/05/2022 00:56:45 - INFO - codeparrot_training - Step 30190: {'lr': 0.00045656111709012906, 'samples': 15457792, 'steps': 30190, 'loss/train': 1.9297715425491333} +03/05/2022 00:56:48 - INFO - codeparrot_training - Step 30191: {'lr': 0.00045655812769237927, 'samples': 15458304, 'steps': 30191, 'loss/train': 1.1933776140213013} +03/05/2022 00:56:48 - INFO - codeparrot_training - Skipping example with length 468 (seq_length=1024) +03/05/2022 00:56:53 - INFO - codeparrot_training - Step 30192: {'lr': 0.00045655513820155755, 'samples': 15458816, 'steps': 30192, 'loss/train': 2.049964427947998} +03/05/2022 00:56:57 - INFO - codeparrot_training - Step 30193: {'lr': 0.00045655214861766525, 'samples': 15459328, 'steps': 30193, 'loss/train': 1.4200948476791382} +03/05/2022 00:56:57 - INFO - codeparrot_training - Skipping example with length 939 (seq_length=1024) +03/05/2022 00:57:02 - INFO - codeparrot_training - Step 30194: {'lr': 0.0004565491589407038, 'samples': 15459840, 'steps': 30194, 'loss/train': 1.7983677387237549} +03/05/2022 00:57:04 - INFO - codeparrot_training - Skipping example with length 498 (seq_length=1024) +03/05/2022 00:57:07 - INFO - codeparrot_training - Step 30195: {'lr': 0.0004565461691706745, 'samples': 15460352, 'steps': 30195, 'loss/train': 2.2857582569122314} +03/05/2022 00:57:10 - INFO - codeparrot_training - Step 30196: {'lr': 0.0004565431793075786, 'samples': 15460864, 'steps': 30196, 'loss/train': 1.6115623712539673} +03/05/2022 00:57:13 - INFO - codeparrot_training - Skipping example with length 761 (seq_length=1024) +03/05/2022 00:57:15 - INFO - codeparrot_training - Step 30197: {'lr': 0.0004565401893514176, 'samples': 15461376, 'steps': 30197, 'loss/train': 1.582255244255066} +03/05/2022 00:57:19 - INFO - codeparrot_training - Step 30198: {'lr': 0.0004565371993021927, 'samples': 15461888, 'steps': 30198, 'loss/train': 1.1788573265075684} +03/05/2022 00:57:21 - INFO - codeparrot_training - Skipping example with length 894 (seq_length=1024) +03/05/2022 00:57:24 - INFO - codeparrot_training - Step 30199: {'lr': 0.00045653420915990546, 'samples': 15462400, 'steps': 30199, 'loss/train': 1.5279617309570312} +03/05/2022 00:57:27 - INFO - codeparrot_training - Step 30200: {'lr': 0.000456531218924557, 'samples': 15462912, 'steps': 30200, 'loss/train': 0.6642404794692993} +03/05/2022 00:57:29 - INFO - codeparrot_training - Skipping example with length 772 (seq_length=1024) +03/05/2022 00:57:32 - INFO - codeparrot_training - Step 30201: {'lr': 0.0004565282285961488, 'samples': 15463424, 'steps': 30201, 'loss/train': 1.3005342483520508} +03/05/2022 00:57:35 - INFO - codeparrot_training - Step 30202: {'lr': 0.0004565252381746821, 'samples': 15463936, 'steps': 30202, 'loss/train': 1.9071435928344727} +03/05/2022 00:57:38 - INFO - codeparrot_training - Skipping example with length 36 (seq_length=1024) +03/05/2022 00:57:41 - INFO - codeparrot_training - Step 30203: {'lr': 0.0004565222476601584, 'samples': 15464448, 'steps': 30203, 'loss/train': 1.9037094116210938} +03/05/2022 00:57:44 - INFO - codeparrot_training - Step 30204: {'lr': 0.0004565192570525789, 'samples': 15464960, 'steps': 30204, 'loss/train': 0.8617432117462158} +03/05/2022 00:57:46 - INFO - codeparrot_training - Skipping example with length 346 (seq_length=1024) +03/05/2022 00:57:49 - INFO - codeparrot_training - Step 30205: {'lr': 0.00045651626635194497, 'samples': 15465472, 'steps': 30205, 'loss/train': 2.136298418045044} +03/05/2022 00:57:52 - INFO - codeparrot_training - Step 30206: {'lr': 0.0004565132755582581, 'samples': 15465984, 'steps': 30206, 'loss/train': 1.6034797430038452} +03/05/2022 00:57:55 - INFO - codeparrot_training - Skipping example with length 83 (seq_length=1024) +03/05/2022 00:57:58 - INFO - codeparrot_training - Step 30207: {'lr': 0.0004565102846715195, 'samples': 15466496, 'steps': 30207, 'loss/train': 1.116777777671814} +03/05/2022 00:58:01 - INFO - codeparrot_training - Step 30208: {'lr': 0.0004565072936917305, 'samples': 15467008, 'steps': 30208, 'loss/train': 1.985948085784912} +03/05/2022 00:58:03 - INFO - codeparrot_training - Skipping example with length 1003 (seq_length=1024) +03/05/2022 00:58:06 - INFO - codeparrot_training - Step 30209: {'lr': 0.0004565043026188926, 'samples': 15467520, 'steps': 30209, 'loss/train': 2.0067193508148193} +03/05/2022 00:58:09 - INFO - codeparrot_training - Step 30210: {'lr': 0.000456501311453007, 'samples': 15468032, 'steps': 30210, 'loss/train': 2.190906524658203} +03/05/2022 00:58:11 - INFO - codeparrot_training - Skipping example with length 155 (seq_length=1024) +03/05/2022 00:58:14 - INFO - codeparrot_training - Step 30211: {'lr': 0.00045649832019407504, 'samples': 15468544, 'steps': 30211, 'loss/train': 1.8707445859909058} +03/05/2022 00:58:17 - INFO - codeparrot_training - Step 30212: {'lr': 0.0004564953288420982, 'samples': 15469056, 'steps': 30212, 'loss/train': 1.779178261756897} +03/05/2022 00:58:19 - INFO - codeparrot_training - Skipping example with length 718 (seq_length=1024) +03/05/2022 00:58:23 - INFO - codeparrot_training - Step 30213: {'lr': 0.00045649233739707774, 'samples': 15469568, 'steps': 30213, 'loss/train': 2.0264296531677246} +03/05/2022 00:58:26 - INFO - codeparrot_training - Step 30214: {'lr': 0.00045648934585901496, 'samples': 15470080, 'steps': 30214, 'loss/train': 1.3510459661483765} +03/05/2022 00:58:28 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 00:58:31 - INFO - codeparrot_training - Step 30215: {'lr': 0.0004564863542279113, 'samples': 15470592, 'steps': 30215, 'loss/train': 1.4700790643692017} +03/05/2022 00:58:35 - INFO - codeparrot_training - Step 30216: {'lr': 0.0004564833625037681, 'samples': 15471104, 'steps': 30216, 'loss/train': 2.0649003982543945} +03/05/2022 00:58:37 - INFO - codeparrot_training - Skipping example with length 718 (seq_length=1024) +03/05/2022 00:58:40 - INFO - codeparrot_training - Step 30217: {'lr': 0.00045648037068658667, 'samples': 15471616, 'steps': 30217, 'loss/train': 1.567647099494934} +03/05/2022 00:58:43 - INFO - codeparrot_training - Step 30218: {'lr': 0.00045647737877636834, 'samples': 15472128, 'steps': 30218, 'loss/train': 1.7761714458465576} +03/05/2022 00:58:45 - INFO - codeparrot_training - Skipping example with length 399 (seq_length=1024) +03/05/2022 00:58:48 - INFO - codeparrot_training - Step 30219: {'lr': 0.0004564743867731145, 'samples': 15472640, 'steps': 30219, 'loss/train': 1.7921855449676514} +03/05/2022 00:58:51 - INFO - codeparrot_training - Step 30220: {'lr': 0.0004564713946768265, 'samples': 15473152, 'steps': 30220, 'loss/train': 2.465643882751465} +03/05/2022 00:58:54 - INFO - codeparrot_training - Skipping example with length 648 (seq_length=1024) +03/05/2022 00:58:57 - INFO - codeparrot_training - Step 30221: {'lr': 0.0004564684024875057, 'samples': 15473664, 'steps': 30221, 'loss/train': 1.6221206188201904} +03/05/2022 00:59:00 - INFO - codeparrot_training - Step 30222: {'lr': 0.0004564654102051534, 'samples': 15474176, 'steps': 30222, 'loss/train': 2.371615409851074} +03/05/2022 00:59:02 - INFO - codeparrot_training - Skipping example with length 391 (seq_length=1024) +03/05/2022 00:59:05 - INFO - codeparrot_training - Step 30223: {'lr': 0.000456462417829771, 'samples': 15474688, 'steps': 30223, 'loss/train': 0.9984307885169983} +03/05/2022 00:59:08 - INFO - codeparrot_training - Step 30224: {'lr': 0.0004564594253613598, 'samples': 15475200, 'steps': 30224, 'loss/train': 1.2560369968414307} +03/05/2022 00:59:10 - INFO - codeparrot_training - Skipping example with length 894 (seq_length=1024) +03/05/2022 00:59:14 - INFO - codeparrot_training - Step 30225: {'lr': 0.0004564564327999211, 'samples': 15475712, 'steps': 30225, 'loss/train': 2.3676202297210693} +03/05/2022 00:59:17 - INFO - codeparrot_training - Step 30226: {'lr': 0.00045645344014545643, 'samples': 15476224, 'steps': 30226, 'loss/train': 1.9876879453659058} +03/05/2022 00:59:19 - INFO - codeparrot_training - Skipping example with length 350 (seq_length=1024) +03/05/2022 00:59:22 - INFO - codeparrot_training - Step 30227: {'lr': 0.00045645044739796694, 'samples': 15476736, 'steps': 30227, 'loss/train': 1.4872524738311768} +03/05/2022 00:59:25 - INFO - codeparrot_training - Step 30228: {'lr': 0.00045644745455745414, 'samples': 15477248, 'steps': 30228, 'loss/train': 0.6331552267074585} +03/05/2022 00:59:31 - INFO - codeparrot_training - Step 30229: {'lr': 0.0004564444616239193, 'samples': 15477760, 'steps': 30229, 'loss/train': 0.2098829746246338} +03/05/2022 00:59:34 - INFO - codeparrot_training - Step 30230: {'lr': 0.0004564414685973637, 'samples': 15478272, 'steps': 30230, 'loss/train': 1.7654131650924683} +03/05/2022 00:59:35 - INFO - codeparrot_training - Skipping example with length 322 (seq_length=1024) +03/05/2022 00:59:39 - INFO - codeparrot_training - Step 30231: {'lr': 0.0004564384754777888, 'samples': 15478784, 'steps': 30231, 'loss/train': 2.1293141841888428} +03/05/2022 00:59:42 - INFO - codeparrot_training - Step 30232: {'lr': 0.00045643548226519587, 'samples': 15479296, 'steps': 30232, 'loss/train': 1.8077073097229004} +03/05/2022 00:59:44 - INFO - codeparrot_training - Skipping example with length 428 (seq_length=1024) +03/05/2022 00:59:48 - INFO - codeparrot_training - Step 30233: {'lr': 0.00045643248895958636, 'samples': 15479808, 'steps': 30233, 'loss/train': 1.1070702075958252} +03/05/2022 00:59:51 - INFO - codeparrot_training - Step 30234: {'lr': 0.00045642949556096146, 'samples': 15480320, 'steps': 30234, 'loss/train': 2.7490386962890625} +03/05/2022 00:59:52 - INFO - codeparrot_training - Skipping example with length 806 (seq_length=1024) +03/05/2022 00:59:56 - INFO - codeparrot_training - Step 30235: {'lr': 0.0004564265020693227, 'samples': 15480832, 'steps': 30235, 'loss/train': 1.2530138492584229} +03/05/2022 00:59:59 - INFO - codeparrot_training - Step 30236: {'lr': 0.0004564235084846713, 'samples': 15481344, 'steps': 30236, 'loss/train': 1.2790501117706299} +03/05/2022 01:00:00 - INFO - codeparrot_training - Skipping example with length 226 (seq_length=1024) +03/05/2022 01:00:04 - INFO - codeparrot_training - Step 30237: {'lr': 0.00045642051480700873, 'samples': 15481856, 'steps': 30237, 'loss/train': 1.438962697982788} +03/05/2022 01:00:08 - INFO - codeparrot_training - Step 30238: {'lr': 0.0004564175210363362, 'samples': 15482368, 'steps': 30238, 'loss/train': 1.755921721458435} +03/05/2022 01:00:09 - INFO - codeparrot_training - Skipping example with length 911 (seq_length=1024) +03/05/2022 01:00:13 - INFO - codeparrot_training - Step 30239: {'lr': 0.00045641452717265507, 'samples': 15482880, 'steps': 30239, 'loss/train': 1.8186254501342773} +03/05/2022 01:00:16 - INFO - codeparrot_training - Step 30240: {'lr': 0.00045641153321596687, 'samples': 15483392, 'steps': 30240, 'loss/train': 1.6997802257537842} +03/05/2022 01:00:17 - INFO - codeparrot_training - Skipping example with length 694 (seq_length=1024) +03/05/2022 01:00:21 - INFO - codeparrot_training - Step 30241: {'lr': 0.0004564085391662727, 'samples': 15483904, 'steps': 30241, 'loss/train': 0.6641673445701599} +03/05/2022 01:00:24 - INFO - codeparrot_training - Step 30242: {'lr': 0.00045640554502357413, 'samples': 15484416, 'steps': 30242, 'loss/train': 1.682521939277649} +03/05/2022 01:00:26 - INFO - codeparrot_training - Skipping example with length 329 (seq_length=1024) +03/05/2022 01:00:30 - INFO - codeparrot_training - Step 30243: {'lr': 0.0004564025507878723, 'samples': 15484928, 'steps': 30243, 'loss/train': 2.0395255088806152} +03/05/2022 01:00:33 - INFO - codeparrot_training - Step 30244: {'lr': 0.00045639955645916875, 'samples': 15485440, 'steps': 30244, 'loss/train': 2.3381590843200684} +03/05/2022 01:00:34 - INFO - codeparrot_training - Skipping example with length 66 (seq_length=1024) +03/05/2022 01:00:38 - INFO - codeparrot_training - Step 30245: {'lr': 0.0004563965620374647, 'samples': 15485952, 'steps': 30245, 'loss/train': 1.1800812482833862} +03/05/2022 01:00:41 - INFO - codeparrot_training - Step 30246: {'lr': 0.0004563935675227615, 'samples': 15486464, 'steps': 30246, 'loss/train': 2.39896559715271} +03/05/2022 01:00:42 - INFO - codeparrot_training - Skipping example with length 149 (seq_length=1024) +03/05/2022 01:00:47 - INFO - codeparrot_training - Step 30247: {'lr': 0.00045639057291506065, 'samples': 15486976, 'steps': 30247, 'loss/train': 1.636587142944336} +03/05/2022 01:00:50 - INFO - codeparrot_training - Step 30248: {'lr': 0.0004563875782143633, 'samples': 15487488, 'steps': 30248, 'loss/train': 2.1304707527160645} +03/05/2022 01:00:51 - INFO - codeparrot_training - Skipping example with length 613 (seq_length=1024) +03/05/2022 01:00:55 - INFO - codeparrot_training - Step 30249: {'lr': 0.000456384583420671, 'samples': 15488000, 'steps': 30249, 'loss/train': 2.1647915840148926} +03/05/2022 01:00:58 - INFO - codeparrot_training - Step 30250: {'lr': 0.0004563815885339849, 'samples': 15488512, 'steps': 30250, 'loss/train': 1.878063678741455} +03/05/2022 01:00:59 - INFO - codeparrot_training - Skipping example with length 361 (seq_length=1024) +03/05/2022 01:01:04 - INFO - codeparrot_training - Step 30251: {'lr': 0.00045637859355430647, 'samples': 15489024, 'steps': 30251, 'loss/train': 1.9763576984405518} +03/05/2022 01:01:07 - INFO - codeparrot_training - Step 30252: {'lr': 0.000456375598481637, 'samples': 15489536, 'steps': 30252, 'loss/train': 2.1009347438812256} +03/05/2022 01:01:07 - INFO - codeparrot_training - Skipping example with length 921 (seq_length=1024) +03/05/2022 01:01:12 - INFO - codeparrot_training - Step 30253: {'lr': 0.00045637260331597793, 'samples': 15490048, 'steps': 30253, 'loss/train': 3.047492742538452} +03/05/2022 01:01:15 - INFO - codeparrot_training - Step 30254: {'lr': 0.00045636960805733054, 'samples': 15490560, 'steps': 30254, 'loss/train': 1.3888639211654663} +03/05/2022 01:01:16 - INFO - codeparrot_training - Skipping example with length 342 (seq_length=1024) +03/05/2022 01:01:21 - INFO - codeparrot_training - Step 30255: {'lr': 0.0004563666127056961, 'samples': 15491072, 'steps': 30255, 'loss/train': 1.5548039674758911} +03/05/2022 01:01:24 - INFO - codeparrot_training - Step 30256: {'lr': 0.0004563636172610761, 'samples': 15491584, 'steps': 30256, 'loss/train': 1.9221271276474} +03/05/2022 01:01:24 - INFO - codeparrot_training - Skipping example with length 662 (seq_length=1024) +03/05/2022 01:01:29 - INFO - codeparrot_training - Step 30257: {'lr': 0.00045636062172347186, 'samples': 15492096, 'steps': 30257, 'loss/train': 1.9878610372543335} +03/05/2022 01:01:32 - INFO - codeparrot_training - Step 30258: {'lr': 0.0004563576260928847, 'samples': 15492608, 'steps': 30258, 'loss/train': 1.368032455444336} +03/05/2022 01:01:32 - INFO - codeparrot_training - Skipping example with length 577 (seq_length=1024) +03/05/2022 01:01:37 - INFO - codeparrot_training - Step 30259: {'lr': 0.000456354630369316, 'samples': 15493120, 'steps': 30259, 'loss/train': 1.535534381866455} +03/05/2022 01:01:40 - INFO - codeparrot_training - Step 30260: {'lr': 0.00045635163455276707, 'samples': 15493632, 'steps': 30260, 'loss/train': 1.5032907724380493} +03/05/2022 01:01:40 - INFO - codeparrot_training - Skipping example with length 596 (seq_length=1024) +03/05/2022 01:01:46 - INFO - codeparrot_training - Step 30261: {'lr': 0.0004563486386432393, 'samples': 15494144, 'steps': 30261, 'loss/train': 1.9104982614517212} +03/05/2022 01:01:49 - INFO - codeparrot_training - Step 30262: {'lr': 0.00045634564264073396, 'samples': 15494656, 'steps': 30262, 'loss/train': 3.494652032852173} +03/05/2022 01:01:49 - INFO - codeparrot_training - Skipping example with length 804 (seq_length=1024) +03/05/2022 01:01:54 - INFO - codeparrot_training - Step 30263: {'lr': 0.0004563426465452525, 'samples': 15495168, 'steps': 30263, 'loss/train': 1.6567870378494263} +03/05/2022 01:01:57 - INFO - codeparrot_training - Step 30264: {'lr': 0.00045633965035679614, 'samples': 15495680, 'steps': 30264, 'loss/train': 1.900291085243225} +03/05/2022 01:01:58 - INFO - codeparrot_training - Skipping example with length 105 (seq_length=1024) +03/05/2022 01:02:03 - INFO - codeparrot_training - Step 30265: {'lr': 0.0004563366540753664, 'samples': 15496192, 'steps': 30265, 'loss/train': 1.5593653917312622} +03/05/2022 01:02:06 - INFO - codeparrot_training - Step 30266: {'lr': 0.00045633365770096456, 'samples': 15496704, 'steps': 30266, 'loss/train': 1.4124549627304077} +03/05/2022 01:02:06 - INFO - codeparrot_training - Skipping example with length 175 (seq_length=1024) +03/05/2022 01:02:11 - INFO - codeparrot_training - Step 30267: {'lr': 0.000456330661233592, 'samples': 15497216, 'steps': 30267, 'loss/train': 2.317880153656006} +03/05/2022 01:02:14 - INFO - codeparrot_training - Skipping example with length 310 (seq_length=1024) +03/05/2022 01:02:17 - INFO - codeparrot_training - Step 30268: {'lr': 0.00045632766467324995, 'samples': 15497728, 'steps': 30268, 'loss/train': 1.693334937095642} +03/05/2022 01:02:20 - INFO - codeparrot_training - Step 30269: {'lr': 0.0004563246680199398, 'samples': 15498240, 'steps': 30269, 'loss/train': 1.5191677808761597} +03/05/2022 01:02:22 - INFO - codeparrot_training - Skipping example with length 174 (seq_length=1024) +03/05/2022 01:02:25 - INFO - codeparrot_training - Step 30270: {'lr': 0.000456321671273663, 'samples': 15498752, 'steps': 30270, 'loss/train': 1.4728446006774902} +03/05/2022 01:02:28 - INFO - codeparrot_training - Step 30271: {'lr': 0.00045631867443442084, 'samples': 15499264, 'steps': 30271, 'loss/train': 1.7472803592681885} +03/05/2022 01:02:31 - INFO - codeparrot_training - Skipping example with length 670 (seq_length=1024) +03/05/2022 01:02:34 - INFO - codeparrot_training - Step 30272: {'lr': 0.00045631567750221465, 'samples': 15499776, 'steps': 30272, 'loss/train': 1.2688239812850952} +03/05/2022 01:02:37 - INFO - codeparrot_training - Step 30273: {'lr': 0.0004563126804770458, 'samples': 15500288, 'steps': 30273, 'loss/train': 0.9735040068626404} +03/05/2022 01:02:39 - INFO - codeparrot_training - Skipping example with length 176 (seq_length=1024) +03/05/2022 01:02:42 - INFO - codeparrot_training - Step 30274: {'lr': 0.00045630968335891564, 'samples': 15500800, 'steps': 30274, 'loss/train': 2.2206263542175293} +03/05/2022 01:02:45 - INFO - codeparrot_training - Step 30275: {'lr': 0.00045630668614782553, 'samples': 15501312, 'steps': 30275, 'loss/train': 1.1849333047866821} +03/05/2022 01:02:48 - INFO - codeparrot_training - Skipping example with length 251 (seq_length=1024) +03/05/2022 01:02:50 - INFO - codeparrot_training - Step 30276: {'lr': 0.0004563036888437768, 'samples': 15501824, 'steps': 30276, 'loss/train': 0.4587782919406891} +03/05/2022 01:02:54 - INFO - codeparrot_training - Step 30277: {'lr': 0.0004563006914467709, 'samples': 15502336, 'steps': 30277, 'loss/train': 1.5043517351150513} +03/05/2022 01:02:56 - INFO - codeparrot_training - Skipping example with length 246 (seq_length=1024) +03/05/2022 01:02:59 - INFO - codeparrot_training - Step 30278: {'lr': 0.000456297693956809, 'samples': 15502848, 'steps': 30278, 'loss/train': 1.8949087858200073} +03/05/2022 01:03:02 - INFO - codeparrot_training - Step 30279: {'lr': 0.0004562946963738925, 'samples': 15503360, 'steps': 30279, 'loss/train': 1.8669930696487427} +03/05/2022 01:03:04 - INFO - codeparrot_training - Skipping example with length 267 (seq_length=1024) +03/05/2022 01:03:07 - INFO - codeparrot_training - Step 30280: {'lr': 0.0004562916986980229, 'samples': 15503872, 'steps': 30280, 'loss/train': 1.2581777572631836} +03/05/2022 01:03:10 - INFO - codeparrot_training - Step 30281: {'lr': 0.0004562887009292014, 'samples': 15504384, 'steps': 30281, 'loss/train': 0.9684621691703796} +03/05/2022 01:03:12 - INFO - codeparrot_training - Skipping example with length 841 (seq_length=1024) +03/05/2022 01:03:16 - INFO - codeparrot_training - Step 30282: {'lr': 0.0004562857030674293, 'samples': 15504896, 'steps': 30282, 'loss/train': 1.1793482303619385} +03/05/2022 01:03:19 - INFO - codeparrot_training - Step 30283: {'lr': 0.0004562827051127082, 'samples': 15505408, 'steps': 30283, 'loss/train': 1.6133840084075928} +03/05/2022 01:03:21 - INFO - codeparrot_training - Skipping example with length 49 (seq_length=1024) +03/05/2022 01:03:24 - INFO - codeparrot_training - Step 30284: {'lr': 0.0004562797070650392, 'samples': 15505920, 'steps': 30284, 'loss/train': 1.7075990438461304} +03/05/2022 01:03:27 - INFO - codeparrot_training - Step 30285: {'lr': 0.00045627670892442376, 'samples': 15506432, 'steps': 30285, 'loss/train': 1.4524474143981934} +03/05/2022 01:03:29 - INFO - codeparrot_training - Skipping example with length 812 (seq_length=1024) +03/05/2022 01:03:32 - INFO - codeparrot_training - Step 30286: {'lr': 0.0004562737106908632, 'samples': 15506944, 'steps': 30286, 'loss/train': 2.1674249172210693} +03/05/2022 01:03:36 - INFO - codeparrot_training - Step 30287: {'lr': 0.00045627071236435896, 'samples': 15507456, 'steps': 30287, 'loss/train': 1.509385585784912} +03/05/2022 01:03:37 - INFO - codeparrot_training - Skipping example with length 637 (seq_length=1024) +03/05/2022 01:03:41 - INFO - codeparrot_training - Step 30288: {'lr': 0.0004562677139449123, 'samples': 15507968, 'steps': 30288, 'loss/train': 2.908494710922241} +03/05/2022 01:03:44 - INFO - codeparrot_training - Step 30289: {'lr': 0.0004562647154325246, 'samples': 15508480, 'steps': 30289, 'loss/train': 2.167825937271118} +03/05/2022 01:03:46 - INFO - codeparrot_training - Skipping example with length 501 (seq_length=1024) +03/05/2022 01:03:49 - INFO - codeparrot_training - Step 30290: {'lr': 0.0004562617168271971, 'samples': 15508992, 'steps': 30290, 'loss/train': 1.6798962354660034} +03/05/2022 01:03:53 - INFO - codeparrot_training - Step 30291: {'lr': 0.0004562587181289314, 'samples': 15509504, 'steps': 30291, 'loss/train': 1.7441438436508179} +03/05/2022 01:03:54 - INFO - codeparrot_training - Skipping example with length 315 (seq_length=1024) +03/05/2022 01:03:58 - INFO - codeparrot_training - Step 30292: {'lr': 0.00045625571933772857, 'samples': 15510016, 'steps': 30292, 'loss/train': 1.9378803968429565} +03/05/2022 01:04:01 - INFO - codeparrot_training - Step 30293: {'lr': 0.0004562527204535902, 'samples': 15510528, 'steps': 30293, 'loss/train': 1.5410722494125366} +03/05/2022 01:04:02 - INFO - codeparrot_training - Skipping example with length 249 (seq_length=1024) +03/05/2022 01:04:06 - INFO - codeparrot_training - Step 30294: {'lr': 0.00045624972147651746, 'samples': 15511040, 'steps': 30294, 'loss/train': 1.4874112606048584} +03/05/2022 01:04:09 - INFO - codeparrot_training - Step 30295: {'lr': 0.00045624672240651183, 'samples': 15511552, 'steps': 30295, 'loss/train': 1.9203979969024658} +03/05/2022 01:04:11 - INFO - codeparrot_training - Skipping example with length 630 (seq_length=1024) +03/05/2022 01:04:15 - INFO - codeparrot_training - Step 30296: {'lr': 0.00045624372324357457, 'samples': 15512064, 'steps': 30296, 'loss/train': 1.7807732820510864} +03/05/2022 01:04:18 - INFO - codeparrot_training - Step 30297: {'lr': 0.0004562407239877071, 'samples': 15512576, 'steps': 30297, 'loss/train': 1.9081791639328003} +03/05/2022 01:04:19 - INFO - codeparrot_training - Skipping example with length 405 (seq_length=1024) +03/05/2022 01:04:23 - INFO - codeparrot_training - Step 30298: {'lr': 0.0004562377246389108, 'samples': 15513088, 'steps': 30298, 'loss/train': 1.4249955415725708} +03/05/2022 01:04:26 - INFO - codeparrot_training - Step 30299: {'lr': 0.00045623472519718683, 'samples': 15513600, 'steps': 30299, 'loss/train': 2.372708559036255} +03/05/2022 01:04:27 - INFO - codeparrot_training - Skipping example with length 726 (seq_length=1024) +03/05/2022 01:04:32 - INFO - codeparrot_training - Step 30300: {'lr': 0.00045623172566253676, 'samples': 15514112, 'steps': 30300, 'loss/train': 2.2095062732696533} +03/05/2022 01:04:35 - INFO - codeparrot_training - Step 30301: {'lr': 0.00045622872603496184, 'samples': 15514624, 'steps': 30301, 'loss/train': 1.9211101531982422} +03/05/2022 01:04:36 - INFO - codeparrot_training - Skipping example with length 890 (seq_length=1024) +03/05/2022 01:04:40 - INFO - codeparrot_training - Step 30302: {'lr': 0.0004562257263144635, 'samples': 15515136, 'steps': 30302, 'loss/train': 1.0406535863876343} +03/05/2022 01:04:43 - INFO - codeparrot_training - Step 30303: {'lr': 0.0004562227265010429, 'samples': 15515648, 'steps': 30303, 'loss/train': 1.2455202341079712} +03/05/2022 01:04:45 - INFO - codeparrot_training - Skipping example with length 171 (seq_length=1024) +03/05/2022 01:04:49 - INFO - codeparrot_training - Step 30304: {'lr': 0.00045621972659470156, 'samples': 15516160, 'steps': 30304, 'loss/train': 2.6532111167907715} +03/05/2022 01:04:52 - INFO - codeparrot_training - Step 30305: {'lr': 0.0004562167265954409, 'samples': 15516672, 'steps': 30305, 'loss/train': 1.954776406288147} +03/05/2022 01:04:54 - INFO - codeparrot_training - Skipping example with length 445 (seq_length=1024) +03/05/2022 01:04:57 - INFO - codeparrot_training - Step 30306: {'lr': 0.000456213726503262, 'samples': 15517184, 'steps': 30306, 'loss/train': 1.7793982028961182} +03/05/2022 01:05:00 - INFO - codeparrot_training - Step 30307: {'lr': 0.0004562107263181665, 'samples': 15517696, 'steps': 30307, 'loss/train': 2.420687675476074} +03/05/2022 01:05:02 - INFO - codeparrot_training - Skipping example with length 792 (seq_length=1024) +03/05/2022 01:05:06 - INFO - codeparrot_training - Step 30308: {'lr': 0.0004562077260401556, 'samples': 15518208, 'steps': 30308, 'loss/train': 1.699628233909607} +03/05/2022 01:05:09 - INFO - codeparrot_training - Step 30309: {'lr': 0.00045620472566923064, 'samples': 15518720, 'steps': 30309, 'loss/train': 1.8189477920532227} +03/05/2022 01:05:10 - INFO - codeparrot_training - Skipping example with length 250 (seq_length=1024) +03/05/2022 01:05:14 - INFO - codeparrot_training - Step 30310: {'lr': 0.0004562017252053931, 'samples': 15519232, 'steps': 30310, 'loss/train': 5.373987197875977} +03/05/2022 01:05:17 - INFO - codeparrot_training - Step 30311: {'lr': 0.0004561987246486442, 'samples': 15519744, 'steps': 30311, 'loss/train': 1.670209527015686} +03/05/2022 01:05:20 - INFO - codeparrot_training - Skipping example with length 411 (seq_length=1024) +03/05/2022 01:05:23 - INFO - codeparrot_training - Step 30312: {'lr': 0.00045619572399898534, 'samples': 15520256, 'steps': 30312, 'loss/train': 1.5850143432617188} +03/05/2022 01:05:26 - INFO - codeparrot_training - Step 30313: {'lr': 0.0004561927232564179, 'samples': 15520768, 'steps': 30313, 'loss/train': 1.8503373861312866} +03/05/2022 01:05:28 - INFO - codeparrot_training - Skipping example with length 914 (seq_length=1024) +03/05/2022 01:05:31 - INFO - codeparrot_training - Step 30314: {'lr': 0.00045618972242094313, 'samples': 15521280, 'steps': 30314, 'loss/train': 1.8182893991470337} +03/05/2022 01:05:34 - INFO - codeparrot_training - Step 30315: {'lr': 0.00045618672149256244, 'samples': 15521792, 'steps': 30315, 'loss/train': 1.4408502578735352} +03/05/2022 01:05:36 - INFO - codeparrot_training - Skipping example with length 443 (seq_length=1024) +03/05/2022 01:05:40 - INFO - codeparrot_training - Step 30316: {'lr': 0.0004561837204712773, 'samples': 15522304, 'steps': 30316, 'loss/train': 1.6367123126983643} +03/05/2022 01:05:43 - INFO - codeparrot_training - Step 30317: {'lr': 0.0004561807193570888, 'samples': 15522816, 'steps': 30317, 'loss/train': 1.8563569784164429} +03/05/2022 01:05:45 - INFO - codeparrot_training - Skipping example with length 11 (seq_length=1024) +03/05/2022 01:05:48 - INFO - codeparrot_training - Step 30318: {'lr': 0.0004561777181499986, 'samples': 15523328, 'steps': 30318, 'loss/train': 1.7057815790176392} +03/05/2022 01:05:51 - INFO - codeparrot_training - Step 30319: {'lr': 0.00045617471685000785, 'samples': 15523840, 'steps': 30319, 'loss/train': 1.831925630569458} +03/05/2022 01:05:53 - INFO - codeparrot_training - Skipping example with length 650 (seq_length=1024) +03/05/2022 01:05:56 - INFO - codeparrot_training - Step 30320: {'lr': 0.00045617171545711793, 'samples': 15524352, 'steps': 30320, 'loss/train': 0.0617365762591362} +03/05/2022 01:06:00 - INFO - codeparrot_training - Step 30321: {'lr': 0.0004561687139713302, 'samples': 15524864, 'steps': 30321, 'loss/train': 1.2955726385116577} +03/05/2022 01:06:01 - INFO - codeparrot_training - Skipping example with length 454 (seq_length=1024) +03/05/2022 01:06:05 - INFO - codeparrot_training - Step 30322: {'lr': 0.00045616571239264614, 'samples': 15525376, 'steps': 30322, 'loss/train': 1.7771223783493042} +03/05/2022 01:06:08 - INFO - codeparrot_training - Step 30323: {'lr': 0.0004561627107210669, 'samples': 15525888, 'steps': 30323, 'loss/train': 1.493330478668213} +03/05/2022 01:06:09 - INFO - codeparrot_training - Skipping example with length 905 (seq_length=1024) +03/05/2022 01:06:13 - INFO - codeparrot_training - Step 30324: {'lr': 0.00045615970895659393, 'samples': 15526400, 'steps': 30324, 'loss/train': 0.9467135667800903} +03/05/2022 01:06:17 - INFO - codeparrot_training - Step 30325: {'lr': 0.00045615670709922855, 'samples': 15526912, 'steps': 30325, 'loss/train': 1.058262825012207} +03/05/2022 01:06:18 - INFO - codeparrot_training - Skipping example with length 848 (seq_length=1024) +03/05/2022 01:06:22 - INFO - codeparrot_training - Step 30326: {'lr': 0.0004561537051489722, 'samples': 15527424, 'steps': 30326, 'loss/train': 1.4175759553909302} +03/05/2022 01:06:25 - INFO - codeparrot_training - Step 30327: {'lr': 0.00045615070310582617, 'samples': 15527936, 'steps': 30327, 'loss/train': 1.2218552827835083} +03/05/2022 01:06:26 - INFO - codeparrot_training - Skipping example with length 284 (seq_length=1024) +03/05/2022 01:06:31 - INFO - codeparrot_training - Step 30328: {'lr': 0.00045614770096979177, 'samples': 15528448, 'steps': 30328, 'loss/train': 1.2990055084228516} +03/05/2022 01:06:34 - INFO - codeparrot_training - Step 30329: {'lr': 0.0004561446987408704, 'samples': 15528960, 'steps': 30329, 'loss/train': 1.965140461921692} +03/05/2022 01:06:36 - INFO - codeparrot_training - Skipping example with length 274 (seq_length=1024) +03/05/2022 01:06:39 - INFO - codeparrot_training - Step 30330: {'lr': 0.00045614169641906344, 'samples': 15529472, 'steps': 30330, 'loss/train': 2.1058785915374756} +03/05/2022 01:06:42 - INFO - codeparrot_training - Step 30331: {'lr': 0.00045613869400437223, 'samples': 15529984, 'steps': 30331, 'loss/train': 1.4208797216415405} +03/05/2022 01:06:45 - INFO - codeparrot_training - Skipping example with length 969 (seq_length=1024) +03/05/2022 01:06:48 - INFO - codeparrot_training - Step 30332: {'lr': 0.000456135691496798, 'samples': 15530496, 'steps': 30332, 'loss/train': 2.1719412803649902} +03/05/2022 01:06:51 - INFO - codeparrot_training - Step 30333: {'lr': 0.0004561326888963423, 'samples': 15531008, 'steps': 30333, 'loss/train': 0.16385029256343842} +03/05/2022 01:06:53 - INFO - codeparrot_training - Skipping example with length 96 (seq_length=1024) +03/05/2022 01:06:56 - INFO - codeparrot_training - Step 30334: {'lr': 0.0004561296862030064, 'samples': 15531520, 'steps': 30334, 'loss/train': 1.8687011003494263} +03/05/2022 01:06:59 - INFO - codeparrot_training - Step 30335: {'lr': 0.00045612668341679164, 'samples': 15532032, 'steps': 30335, 'loss/train': 0.1145060658454895} +03/05/2022 01:07:02 - INFO - codeparrot_training - Skipping example with length 743 (seq_length=1024) +03/05/2022 01:07:05 - INFO - codeparrot_training - Step 30336: {'lr': 0.0004561236805376994, 'samples': 15532544, 'steps': 30336, 'loss/train': 1.8252521753311157} +03/05/2022 01:07:08 - INFO - codeparrot_training - Step 30337: {'lr': 0.00045612067756573097, 'samples': 15533056, 'steps': 30337, 'loss/train': 1.1377383470535278} +03/05/2022 01:07:10 - INFO - codeparrot_training - Skipping example with length 348 (seq_length=1024) +03/05/2022 01:07:13 - INFO - codeparrot_training - Step 30338: {'lr': 0.0004561176745008877, 'samples': 15533568, 'steps': 30338, 'loss/train': 1.4026397466659546} +03/05/2022 01:07:16 - INFO - codeparrot_training - Step 30339: {'lr': 0.000456114671343171, 'samples': 15534080, 'steps': 30339, 'loss/train': 2.222360610961914} +03/05/2022 01:07:18 - INFO - codeparrot_training - Skipping example with length 634 (seq_length=1024) +03/05/2022 01:07:22 - INFO - codeparrot_training - Step 30340: {'lr': 0.00045611166809258227, 'samples': 15534592, 'steps': 30340, 'loss/train': 1.4127634763717651} +03/05/2022 01:07:25 - INFO - codeparrot_training - Step 30341: {'lr': 0.0004561086647491227, 'samples': 15535104, 'steps': 30341, 'loss/train': 1.526201844215393} +03/05/2022 01:07:27 - INFO - codeparrot_training - Skipping example with length 914 (seq_length=1024) +03/05/2022 01:07:30 - INFO - codeparrot_training - Step 30342: {'lr': 0.00045610566131279386, 'samples': 15535616, 'steps': 30342, 'loss/train': 1.739932894706726} +03/05/2022 01:07:33 - INFO - codeparrot_training - Step 30343: {'lr': 0.00045610265778359696, 'samples': 15536128, 'steps': 30343, 'loss/train': 1.7376621961593628} +03/05/2022 01:07:35 - INFO - codeparrot_training - Skipping example with length 430 (seq_length=1024) +03/05/2022 01:07:39 - INFO - codeparrot_training - Step 30344: {'lr': 0.00045609965416153333, 'samples': 15536640, 'steps': 30344, 'loss/train': 1.795729398727417} +03/05/2022 01:07:42 - INFO - codeparrot_training - Step 30345: {'lr': 0.0004560966504466044, 'samples': 15537152, 'steps': 30345, 'loss/train': 1.8292362689971924} +03/05/2022 01:07:44 - INFO - codeparrot_training - Skipping example with length 31 (seq_length=1024) +03/05/2022 01:07:47 - INFO - codeparrot_training - Step 30346: {'lr': 0.00045609364663881153, 'samples': 15537664, 'steps': 30346, 'loss/train': 1.2304362058639526} +03/05/2022 01:07:50 - INFO - codeparrot_training - Step 30347: {'lr': 0.000456090642738156, 'samples': 15538176, 'steps': 30347, 'loss/train': 2.116027355194092} +03/05/2022 01:07:53 - INFO - codeparrot_training - Skipping example with length 178 (seq_length=1024) +03/05/2022 01:07:56 - INFO - codeparrot_training - Step 30348: {'lr': 0.00045608763874463925, 'samples': 15538688, 'steps': 30348, 'loss/train': 0.9933581352233887} +03/05/2022 01:07:59 - INFO - codeparrot_training - Step 30349: {'lr': 0.00045608463465826257, 'samples': 15539200, 'steps': 30349, 'loss/train': 2.2502827644348145} +03/05/2022 01:08:01 - INFO - codeparrot_training - Skipping example with length 424 (seq_length=1024) +03/05/2022 01:08:04 - INFO - codeparrot_training - Step 30350: {'lr': 0.0004560816304790274, 'samples': 15539712, 'steps': 30350, 'loss/train': 2.142665147781372} +03/05/2022 01:08:07 - INFO - codeparrot_training - Step 30351: {'lr': 0.0004560786262069349, 'samples': 15540224, 'steps': 30351, 'loss/train': 2.10463547706604} +03/05/2022 01:08:10 - INFO - codeparrot_training - Skipping example with length 827 (seq_length=1024) +03/05/2022 01:08:13 - INFO - codeparrot_training - Step 30352: {'lr': 0.00045607562184198666, 'samples': 15540736, 'steps': 30352, 'loss/train': 2.174138307571411} +03/05/2022 01:08:16 - INFO - codeparrot_training - Step 30353: {'lr': 0.00045607261738418384, 'samples': 15541248, 'steps': 30353, 'loss/train': 2.0719547271728516} +03/05/2022 01:08:19 - INFO - codeparrot_training - Step 30354: {'lr': 0.00045606961283352793, 'samples': 15541760, 'steps': 30354, 'loss/train': 6.586909294128418} +03/05/2022 01:08:19 - INFO - codeparrot_training - Skipping example with length 749 (seq_length=1024) +03/05/2022 01:08:24 - INFO - codeparrot_training - Step 30355: {'lr': 0.0004560666081900202, 'samples': 15542272, 'steps': 30355, 'loss/train': 1.7161489725112915} +03/05/2022 01:08:27 - INFO - codeparrot_training - Step 30356: {'lr': 0.00045606360345366203, 'samples': 15542784, 'steps': 30356, 'loss/train': 1.4627867937088013} +03/05/2022 01:08:28 - INFO - codeparrot_training - Skipping example with length 599 (seq_length=1024) +03/05/2022 01:08:33 - INFO - codeparrot_training - Step 30357: {'lr': 0.00045606059862445485, 'samples': 15543296, 'steps': 30357, 'loss/train': 1.872009515762329} +03/05/2022 01:08:36 - INFO - codeparrot_training - Step 30358: {'lr': 0.0004560575937023999, 'samples': 15543808, 'steps': 30358, 'loss/train': 1.9575735330581665} +03/05/2022 01:08:36 - INFO - codeparrot_training - Skipping example with length 475 (seq_length=1024) +03/05/2022 01:08:41 - INFO - codeparrot_training - Step 30359: {'lr': 0.0004560545886874986, 'samples': 15544320, 'steps': 30359, 'loss/train': 1.8711278438568115} +03/05/2022 01:08:44 - INFO - codeparrot_training - Skipping example with length 655 (seq_length=1024) +03/05/2022 01:08:46 - INFO - codeparrot_training - Step 30360: {'lr': 0.00045605158357975225, 'samples': 15544832, 'steps': 30360, 'loss/train': 1.4265213012695312} +03/05/2022 01:08:50 - INFO - codeparrot_training - Step 30361: {'lr': 0.00045604857837916224, 'samples': 15545344, 'steps': 30361, 'loss/train': 1.7307380437850952} +03/05/2022 01:08:52 - INFO - codeparrot_training - Skipping example with length 232 (seq_length=1024) +03/05/2022 01:08:55 - INFO - codeparrot_training - Step 30362: {'lr': 0.0004560455730857299, 'samples': 15545856, 'steps': 30362, 'loss/train': 2.065617561340332} +03/05/2022 01:08:58 - INFO - codeparrot_training - Step 30363: {'lr': 0.0004560425676994566, 'samples': 15546368, 'steps': 30363, 'loss/train': 1.6186941862106323} +03/05/2022 01:09:00 - INFO - codeparrot_training - Skipping example with length 653 (seq_length=1024) +03/05/2022 01:09:03 - INFO - codeparrot_training - Step 30364: {'lr': 0.00045603956222034384, 'samples': 15546880, 'steps': 30364, 'loss/train': 1.6865589618682861} +03/05/2022 01:09:06 - INFO - codeparrot_training - Step 30365: {'lr': 0.0004560365566483927, 'samples': 15547392, 'steps': 30365, 'loss/train': 1.2278800010681152} +03/05/2022 01:09:09 - INFO - codeparrot_training - Skipping example with length 645 (seq_length=1024) +03/05/2022 01:09:12 - INFO - codeparrot_training - Step 30366: {'lr': 0.00045603355098360466, 'samples': 15547904, 'steps': 30366, 'loss/train': 1.0190188884735107} +03/05/2022 01:09:15 - INFO - codeparrot_training - Step 30367: {'lr': 0.00045603054522598107, 'samples': 15548416, 'steps': 30367, 'loss/train': 1.727705478668213} +03/05/2022 01:09:17 - INFO - codeparrot_training - Skipping example with length 1022 (seq_length=1024) +03/05/2022 01:09:20 - INFO - codeparrot_training - Step 30368: {'lr': 0.0004560275393755233, 'samples': 15548928, 'steps': 30368, 'loss/train': 1.0315419435501099} +03/05/2022 01:09:23 - INFO - codeparrot_training - Step 30369: {'lr': 0.0004560245334322328, 'samples': 15549440, 'steps': 30369, 'loss/train': 1.7085744142532349} +03/05/2022 01:09:25 - INFO - codeparrot_training - Skipping example with length 681 (seq_length=1024) +03/05/2022 01:09:29 - INFO - codeparrot_training - Step 30370: {'lr': 0.00045602152739611075, 'samples': 15549952, 'steps': 30370, 'loss/train': 1.881314992904663} +03/05/2022 01:09:32 - INFO - codeparrot_training - Step 30371: {'lr': 0.0004560185212671586, 'samples': 15550464, 'steps': 30371, 'loss/train': 1.3301869630813599} +03/05/2022 01:09:34 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 01:09:37 - INFO - codeparrot_training - Step 30372: {'lr': 0.00045601551504537765, 'samples': 15550976, 'steps': 30372, 'loss/train': 2.1871769428253174} +03/05/2022 01:09:40 - INFO - codeparrot_training - Step 30373: {'lr': 0.0004560125087307693, 'samples': 15551488, 'steps': 30373, 'loss/train': 1.5007432699203491} +03/05/2022 01:09:42 - INFO - codeparrot_training - Skipping example with length 382 (seq_length=1024) +03/05/2022 01:09:46 - INFO - codeparrot_training - Step 30374: {'lr': 0.00045600950232333495, 'samples': 15552000, 'steps': 30374, 'loss/train': 0.9763179421424866} +03/05/2022 01:09:49 - INFO - codeparrot_training - Step 30375: {'lr': 0.00045600649582307586, 'samples': 15552512, 'steps': 30375, 'loss/train': 2.0295298099517822} +03/05/2022 01:09:51 - INFO - codeparrot_training - Skipping example with length 705 (seq_length=1024) +03/05/2022 01:09:54 - INFO - codeparrot_training - Step 30376: {'lr': 0.00045600348922999334, 'samples': 15553024, 'steps': 30376, 'loss/train': 2.4519736766815186} +03/05/2022 01:09:57 - INFO - codeparrot_training - Step 30377: {'lr': 0.0004560004825440889, 'samples': 15553536, 'steps': 30377, 'loss/train': 1.318518042564392} +03/05/2022 01:10:00 - INFO - codeparrot_training - Skipping example with length 137 (seq_length=1024) +03/05/2022 01:10:03 - INFO - codeparrot_training - Step 30378: {'lr': 0.0004559974757653639, 'samples': 15554048, 'steps': 30378, 'loss/train': 2.206862688064575} +03/05/2022 01:10:06 - INFO - codeparrot_training - Step 30379: {'lr': 0.0004559944688938195, 'samples': 15554560, 'steps': 30379, 'loss/train': 1.7655829191207886} +03/05/2022 01:10:08 - INFO - codeparrot_training - Skipping example with length 784 (seq_length=1024) +03/05/2022 01:10:11 - INFO - codeparrot_training - Step 30380: {'lr': 0.0004559914619294572, 'samples': 15555072, 'steps': 30380, 'loss/train': 0.25516730546951294} +03/05/2022 01:10:14 - INFO - codeparrot_training - Step 30381: {'lr': 0.00045598845487227835, 'samples': 15555584, 'steps': 30381, 'loss/train': 1.504288911819458} +03/05/2022 01:10:16 - INFO - codeparrot_training - Skipping example with length 552 (seq_length=1024) +03/05/2022 01:10:19 - INFO - codeparrot_training - Step 30382: {'lr': 0.0004559854477222842, 'samples': 15556096, 'steps': 30382, 'loss/train': 1.1959232091903687} +03/05/2022 01:10:23 - INFO - codeparrot_training - Step 30383: {'lr': 0.0004559824404794763, 'samples': 15556608, 'steps': 30383, 'loss/train': 1.766464114189148} +03/05/2022 01:10:25 - INFO - codeparrot_training - Skipping example with length 309 (seq_length=1024) +03/05/2022 01:10:28 - INFO - codeparrot_training - Step 30384: {'lr': 0.0004559794331438558, 'samples': 15557120, 'steps': 30384, 'loss/train': 1.9022656679153442} +03/05/2022 01:10:31 - INFO - codeparrot_training - Step 30385: {'lr': 0.0004559764257154242, 'samples': 15557632, 'steps': 30385, 'loss/train': 1.6189199686050415} +03/05/2022 01:10:33 - INFO - codeparrot_training - Skipping example with length 141 (seq_length=1024) +03/05/2022 01:10:36 - INFO - codeparrot_training - Step 30386: {'lr': 0.0004559734181941828, 'samples': 15558144, 'steps': 30386, 'loss/train': 2.0789079666137695} +03/05/2022 01:10:40 - INFO - codeparrot_training - Step 30387: {'lr': 0.0004559704105801329, 'samples': 15558656, 'steps': 30387, 'loss/train': 1.676277756690979} +03/05/2022 01:10:41 - INFO - codeparrot_training - Skipping example with length 132 (seq_length=1024) +03/05/2022 01:10:45 - INFO - codeparrot_training - Step 30388: {'lr': 0.00045596740287327597, 'samples': 15559168, 'steps': 30388, 'loss/train': 1.4329053163528442} +03/05/2022 01:10:48 - INFO - codeparrot_training - Step 30389: {'lr': 0.0004559643950736133, 'samples': 15559680, 'steps': 30389, 'loss/train': 2.304358959197998} +03/05/2022 01:10:50 - INFO - codeparrot_training - Skipping example with length 729 (seq_length=1024) +03/05/2022 01:10:53 - INFO - codeparrot_training - Step 30390: {'lr': 0.00045596138718114626, 'samples': 15560192, 'steps': 30390, 'loss/train': 1.9810020923614502} +03/05/2022 01:10:56 - INFO - codeparrot_training - Step 30391: {'lr': 0.00045595837919587616, 'samples': 15560704, 'steps': 30391, 'loss/train': 1.020075798034668} +03/05/2022 01:10:58 - INFO - codeparrot_training - Skipping example with length 305 (seq_length=1024) +03/05/2022 01:11:02 - INFO - codeparrot_training - Step 30392: {'lr': 0.0004559553711178044, 'samples': 15561216, 'steps': 30392, 'loss/train': 1.3351904153823853} +03/05/2022 01:11:05 - INFO - codeparrot_training - Step 30393: {'lr': 0.00045595236294693236, 'samples': 15561728, 'steps': 30393, 'loss/train': 2.4174575805664062} +03/05/2022 01:11:06 - INFO - codeparrot_training - Skipping example with length 32 (seq_length=1024) +03/05/2022 01:11:10 - INFO - codeparrot_training - Step 30394: {'lr': 0.00045594935468326137, 'samples': 15562240, 'steps': 30394, 'loss/train': 1.9899287223815918} +03/05/2022 01:11:13 - INFO - codeparrot_training - Step 30395: {'lr': 0.00045594634632679275, 'samples': 15562752, 'steps': 30395, 'loss/train': 1.2670739889144897} +03/05/2022 01:11:15 - INFO - codeparrot_training - Skipping example with length 954 (seq_length=1024) +03/05/2022 01:11:18 - INFO - codeparrot_training - Step 30396: {'lr': 0.0004559433378775278, 'samples': 15563264, 'steps': 30396, 'loss/train': 1.4350285530090332} +03/05/2022 01:11:22 - INFO - codeparrot_training - Step 30397: {'lr': 0.00045594032933546813, 'samples': 15563776, 'steps': 30397, 'loss/train': 1.019887089729309} +03/05/2022 01:11:23 - INFO - codeparrot_training - Skipping example with length 452 (seq_length=1024) +03/05/2022 01:11:27 - INFO - codeparrot_training - Step 30398: {'lr': 0.00045593732070061484, 'samples': 15564288, 'steps': 30398, 'loss/train': 1.8890637159347534} +03/05/2022 01:11:30 - INFO - codeparrot_training - Step 30399: {'lr': 0.00045593431197296934, 'samples': 15564800, 'steps': 30399, 'loss/train': 1.0421630144119263} +03/05/2022 01:11:31 - INFO - codeparrot_training - Skipping example with length 45 (seq_length=1024) +03/05/2022 01:11:35 - INFO - codeparrot_training - Step 30400: {'lr': 0.00045593130315253305, 'samples': 15565312, 'steps': 30400, 'loss/train': 1.8648065328598022} +03/05/2022 01:11:38 - INFO - codeparrot_training - Step 30401: {'lr': 0.0004559282942393073, 'samples': 15565824, 'steps': 30401, 'loss/train': 2.101236581802368} +03/05/2022 01:11:40 - INFO - codeparrot_training - Skipping example with length 759 (seq_length=1024) +03/05/2022 01:11:44 - INFO - codeparrot_training - Step 30402: {'lr': 0.00045592528523329346, 'samples': 15566336, 'steps': 30402, 'loss/train': 1.8022751808166504} +03/05/2022 01:11:47 - INFO - codeparrot_training - Step 30403: {'lr': 0.0004559222761344928, 'samples': 15566848, 'steps': 30403, 'loss/train': 0.08982302248477936} +03/05/2022 01:11:48 - INFO - codeparrot_training - Skipping example with length 945 (seq_length=1024) +03/05/2022 01:11:52 - INFO - codeparrot_training - Step 30404: {'lr': 0.0004559192669429068, 'samples': 15567360, 'steps': 30404, 'loss/train': 1.9577254056930542} +03/05/2022 01:11:55 - INFO - codeparrot_training - Step 30405: {'lr': 0.0004559162576585367, 'samples': 15567872, 'steps': 30405, 'loss/train': 0.6883639097213745} +03/05/2022 01:11:57 - INFO - codeparrot_training - Skipping example with length 639 (seq_length=1024) +03/05/2022 01:12:01 - INFO - codeparrot_training - Step 30406: {'lr': 0.00045591324828138396, 'samples': 15568384, 'steps': 30406, 'loss/train': 1.9827839136123657} +03/05/2022 01:12:04 - INFO - codeparrot_training - Step 30407: {'lr': 0.0004559102388114499, 'samples': 15568896, 'steps': 30407, 'loss/train': 1.9918971061706543} +03/05/2022 01:12:05 - INFO - codeparrot_training - Skipping example with length 78 (seq_length=1024) +03/05/2022 01:12:09 - INFO - codeparrot_training - Step 30408: {'lr': 0.00045590722924873585, 'samples': 15569408, 'steps': 30408, 'loss/train': 1.4455137252807617} +03/05/2022 01:12:12 - INFO - codeparrot_training - Step 30409: {'lr': 0.00045590421959324314, 'samples': 15569920, 'steps': 30409, 'loss/train': 1.2680877447128296} +03/05/2022 01:12:13 - INFO - codeparrot_training - Skipping example with length 669 (seq_length=1024) +03/05/2022 01:12:17 - INFO - codeparrot_training - Step 30410: {'lr': 0.0004559012098449732, 'samples': 15570432, 'steps': 30410, 'loss/train': 0.12951192259788513} +03/05/2022 01:12:21 - INFO - codeparrot_training - Step 30411: {'lr': 0.00045589820000392736, 'samples': 15570944, 'steps': 30411, 'loss/train': 0.05925912410020828} +03/05/2022 01:12:22 - INFO - codeparrot_training - Skipping example with length 20 (seq_length=1024) +03/05/2022 01:12:26 - INFO - codeparrot_training - Step 30412: {'lr': 0.00045589519007010695, 'samples': 15571456, 'steps': 30412, 'loss/train': 2.0319509506225586} +03/05/2022 01:12:29 - INFO - codeparrot_training - Step 30413: {'lr': 0.0004558921800435133, 'samples': 15571968, 'steps': 30413, 'loss/train': 1.633844256401062} +03/05/2022 01:12:30 - INFO - codeparrot_training - Skipping example with length 969 (seq_length=1024) +03/05/2022 01:12:34 - INFO - codeparrot_training - Step 30414: {'lr': 0.00045588916992414784, 'samples': 15572480, 'steps': 30414, 'loss/train': 1.635192632675171} +03/05/2022 01:12:37 - INFO - codeparrot_training - Step 30415: {'lr': 0.0004558861597120119, 'samples': 15572992, 'steps': 30415, 'loss/train': 2.163285493850708} +03/05/2022 01:12:38 - INFO - codeparrot_training - Skipping example with length 885 (seq_length=1024) +03/05/2022 01:12:43 - INFO - codeparrot_training - Step 30416: {'lr': 0.00045588314940710683, 'samples': 15573504, 'steps': 30416, 'loss/train': 1.4755897521972656} +03/05/2022 01:12:46 - INFO - codeparrot_training - Step 30417: {'lr': 0.00045588013900943404, 'samples': 15574016, 'steps': 30417, 'loss/train': 1.805010199546814} +03/05/2022 01:12:46 - INFO - codeparrot_training - Skipping example with length 188 (seq_length=1024) +03/05/2022 01:12:51 - INFO - codeparrot_training - Step 30418: {'lr': 0.0004558771285189948, 'samples': 15574528, 'steps': 30418, 'loss/train': 1.4233644008636475} +03/05/2022 01:12:54 - INFO - codeparrot_training - Step 30419: {'lr': 0.00045587411793579047, 'samples': 15575040, 'steps': 30419, 'loss/train': 1.7176231145858765} +03/05/2022 01:12:55 - INFO - codeparrot_training - Skipping example with length 199 (seq_length=1024) +03/05/2022 01:13:00 - INFO - codeparrot_training - Step 30420: {'lr': 0.0004558711072598225, 'samples': 15575552, 'steps': 30420, 'loss/train': 2.1467010974884033} +03/05/2022 01:13:03 - INFO - codeparrot_training - Step 30421: {'lr': 0.0004558680964910922, 'samples': 15576064, 'steps': 30421, 'loss/train': 0.9580603837966919} +03/05/2022 01:13:03 - INFO - codeparrot_training - Skipping example with length 117 (seq_length=1024) +03/05/2022 01:13:08 - INFO - codeparrot_training - Step 30422: {'lr': 0.0004558650856296008, 'samples': 15576576, 'steps': 30422, 'loss/train': 1.9012800455093384} +03/05/2022 01:13:11 - INFO - codeparrot_training - Step 30423: {'lr': 0.0004558620746753499, 'samples': 15577088, 'steps': 30423, 'loss/train': 1.4355158805847168} +03/05/2022 01:13:12 - INFO - codeparrot_training - Skipping example with length 58 (seq_length=1024) +03/05/2022 01:13:17 - INFO - codeparrot_training - Step 30424: {'lr': 0.00045585906362834063, 'samples': 15577600, 'steps': 30424, 'loss/train': 1.8312486410140991} +03/05/2022 01:13:20 - INFO - codeparrot_training - Step 30425: {'lr': 0.00045585605248857456, 'samples': 15578112, 'steps': 30425, 'loss/train': 1.9815820455551147} +03/05/2022 01:13:21 - INFO - codeparrot_training - Skipping example with length 59 (seq_length=1024) +03/05/2022 01:13:25 - INFO - codeparrot_training - Step 30426: {'lr': 0.00045585304125605276, 'samples': 15578624, 'steps': 30426, 'loss/train': 1.1288591623306274} +03/05/2022 01:13:28 - INFO - codeparrot_training - Step 30427: {'lr': 0.0004558500299307768, 'samples': 15579136, 'steps': 30427, 'loss/train': 1.4727312326431274} +03/05/2022 01:13:29 - INFO - codeparrot_training - Skipping example with length 182 (seq_length=1024) +03/05/2022 01:13:34 - INFO - codeparrot_training - Step 30428: {'lr': 0.00045584701851274814, 'samples': 15579648, 'steps': 30428, 'loss/train': 2.0945613384246826} +03/05/2022 01:13:37 - INFO - codeparrot_training - Step 30429: {'lr': 0.0004558440070019678, 'samples': 15580160, 'steps': 30429, 'loss/train': 4.615679740905762} +03/05/2022 01:13:38 - INFO - codeparrot_training - Skipping example with length 547 (seq_length=1024) +03/05/2022 01:13:42 - INFO - codeparrot_training - Step 30430: {'lr': 0.0004558409953984375, 'samples': 15580672, 'steps': 30430, 'loss/train': 0.47348663210868835} +03/05/2022 01:13:45 - INFO - codeparrot_training - Step 30431: {'lr': 0.00045583798370215837, 'samples': 15581184, 'steps': 30431, 'loss/train': 2.1555707454681396} +03/05/2022 01:13:46 - INFO - codeparrot_training - Skipping example with length 420 (seq_length=1024) +03/05/2022 01:13:50 - INFO - codeparrot_training - Step 30432: {'lr': 0.00045583497191313175, 'samples': 15581696, 'steps': 30432, 'loss/train': 1.8784217834472656} +03/05/2022 01:13:54 - INFO - codeparrot_training - Step 30433: {'lr': 0.00045583196003135906, 'samples': 15582208, 'steps': 30433, 'loss/train': 1.1608339548110962} +03/05/2022 01:13:54 - INFO - codeparrot_training - Skipping example with length 467 (seq_length=1024) +03/05/2022 01:13:59 - INFO - codeparrot_training - Step 30434: {'lr': 0.0004558289480568417, 'samples': 15582720, 'steps': 30434, 'loss/train': 1.743011236190796} +03/05/2022 01:14:02 - INFO - codeparrot_training - Step 30435: {'lr': 0.00045582593598958107, 'samples': 15583232, 'steps': 30435, 'loss/train': 1.3328958749771118} +03/05/2022 01:14:03 - INFO - codeparrot_training - Skipping example with length 794 (seq_length=1024) +03/05/2022 01:14:07 - INFO - codeparrot_training - Step 30436: {'lr': 0.00045582292382957836, 'samples': 15583744, 'steps': 30436, 'loss/train': 3.0934886932373047} +03/05/2022 01:14:10 - INFO - codeparrot_training - Step 30437: {'lr': 0.000455819911576835, 'samples': 15584256, 'steps': 30437, 'loss/train': 0.9609709978103638} +03/05/2022 01:14:11 - INFO - codeparrot_training - Skipping example with length 526 (seq_length=1024) +03/05/2022 01:14:16 - INFO - codeparrot_training - Step 30438: {'lr': 0.00045581689923135247, 'samples': 15584768, 'steps': 30438, 'loss/train': 2.0351412296295166} +03/05/2022 01:14:19 - INFO - codeparrot_training - Step 30439: {'lr': 0.00045581388679313194, 'samples': 15585280, 'steps': 30439, 'loss/train': 1.8427801132202148} +03/05/2022 01:14:19 - INFO - codeparrot_training - Skipping example with length 97 (seq_length=1024) +03/05/2022 01:14:24 - INFO - codeparrot_training - Step 30440: {'lr': 0.0004558108742621748, 'samples': 15585792, 'steps': 30440, 'loss/train': 2.178126811981201} +03/05/2022 01:14:27 - INFO - codeparrot_training - Step 30441: {'lr': 0.00045580786163848254, 'samples': 15586304, 'steps': 30441, 'loss/train': 2.5190231800079346} +03/05/2022 01:14:27 - INFO - codeparrot_training - Skipping example with length 200 (seq_length=1024) +03/05/2022 01:14:32 - INFO - codeparrot_training - Step 30442: {'lr': 0.00045580484892205643, 'samples': 15586816, 'steps': 30442, 'loss/train': 1.1063358783721924} +03/05/2022 01:14:36 - INFO - codeparrot_training - Step 30443: {'lr': 0.0004558018361128978, 'samples': 15587328, 'steps': 30443, 'loss/train': 1.6020057201385498} +03/05/2022 01:14:36 - INFO - codeparrot_training - Skipping example with length 379 (seq_length=1024) +03/05/2022 01:14:41 - INFO - codeparrot_training - Step 30444: {'lr': 0.0004557988232110081, 'samples': 15587840, 'steps': 30444, 'loss/train': 1.659379243850708} +03/05/2022 01:14:44 - INFO - codeparrot_training - Step 30445: {'lr': 0.00045579581021638855, 'samples': 15588352, 'steps': 30445, 'loss/train': 1.114865779876709} +03/05/2022 01:14:44 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 01:14:49 - INFO - codeparrot_training - Step 30446: {'lr': 0.00045579279712904057, 'samples': 15588864, 'steps': 30446, 'loss/train': 1.7532734870910645} +03/05/2022 01:14:52 - INFO - codeparrot_training - Skipping example with length 58 (seq_length=1024) +03/05/2022 01:14:55 - INFO - codeparrot_training - Step 30447: {'lr': 0.00045578978394896565, 'samples': 15589376, 'steps': 30447, 'loss/train': 1.9886479377746582} +03/05/2022 01:14:58 - INFO - codeparrot_training - Step 30448: {'lr': 0.00045578677067616494, 'samples': 15589888, 'steps': 30448, 'loss/train': 1.309191107749939} +03/05/2022 01:15:01 - INFO - codeparrot_training - Step 30449: {'lr': 0.0004557837573106399, 'samples': 15590400, 'steps': 30449, 'loss/train': 2.432729482650757} +03/05/2022 01:15:01 - INFO - codeparrot_training - Skipping example with length 918 (seq_length=1024) +03/05/2022 01:15:06 - INFO - codeparrot_training - Step 30450: {'lr': 0.0004557807438523919, 'samples': 15590912, 'steps': 30450, 'loss/train': 1.957144021987915} +03/05/2022 01:15:10 - INFO - codeparrot_training - Step 30451: {'lr': 0.00045577773030142224, 'samples': 15591424, 'steps': 30451, 'loss/train': 1.6094367504119873} +03/05/2022 01:15:10 - INFO - codeparrot_training - Skipping example with length 174 (seq_length=1024) +03/05/2022 01:15:15 - INFO - codeparrot_training - Step 30452: {'lr': 0.0004557747166577323, 'samples': 15591936, 'steps': 30452, 'loss/train': 1.1868141889572144} +03/05/2022 01:15:18 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 01:15:20 - INFO - codeparrot_training - Step 30453: {'lr': 0.0004557717029213234, 'samples': 15592448, 'steps': 30453, 'loss/train': 1.7298978567123413} +03/05/2022 01:15:23 - INFO - codeparrot_training - Step 30454: {'lr': 0.00045576868909219704, 'samples': 15592960, 'steps': 30454, 'loss/train': 1.0971542596817017} +03/05/2022 01:15:26 - INFO - codeparrot_training - Skipping example with length 576 (seq_length=1024) +03/05/2022 01:15:29 - INFO - codeparrot_training - Step 30455: {'lr': 0.0004557656751703544, 'samples': 15593472, 'steps': 30455, 'loss/train': 0.8508080840110779} +03/05/2022 01:15:32 - INFO - codeparrot_training - Step 30456: {'lr': 0.000455762661155797, 'samples': 15593984, 'steps': 30456, 'loss/train': 1.371014952659607} +03/05/2022 01:15:35 - INFO - codeparrot_training - Skipping example with length 732 (seq_length=1024) +03/05/2022 01:15:37 - INFO - codeparrot_training - Step 30457: {'lr': 0.0004557596470485261, 'samples': 15594496, 'steps': 30457, 'loss/train': 1.753208875656128} +03/05/2022 01:15:40 - INFO - codeparrot_training - Step 30458: {'lr': 0.0004557566328485431, 'samples': 15595008, 'steps': 30458, 'loss/train': 1.8668346405029297} +03/05/2022 01:15:43 - INFO - codeparrot_training - Skipping example with length 458 (seq_length=1024) +03/05/2022 01:15:45 - INFO - codeparrot_training - Step 30459: {'lr': 0.00045575361855584927, 'samples': 15595520, 'steps': 30459, 'loss/train': 1.6284278631210327} +03/05/2022 01:15:49 - INFO - codeparrot_training - Step 30460: {'lr': 0.00045575060417044614, 'samples': 15596032, 'steps': 30460, 'loss/train': 2.095759630203247} +03/05/2022 01:15:51 - INFO - codeparrot_training - Skipping example with length 1023 (seq_length=1024) +03/05/2022 01:15:54 - INFO - codeparrot_training - Step 30461: {'lr': 0.0004557475896923349, 'samples': 15596544, 'steps': 30461, 'loss/train': 1.7722729444503784} +03/05/2022 01:15:57 - INFO - codeparrot_training - Step 30462: {'lr': 0.0004557445751215169, 'samples': 15597056, 'steps': 30462, 'loss/train': 2.435866117477417} +03/05/2022 01:16:00 - INFO - codeparrot_training - Step 30463: {'lr': 0.00045574156045799367, 'samples': 15597568, 'steps': 30463, 'loss/train': 2.07511830329895} +03/05/2022 01:16:00 - INFO - codeparrot_training - Skipping example with length 772 (seq_length=1024) +03/05/2022 01:16:06 - INFO - codeparrot_training - Step 30464: {'lr': 0.0004557385457017664, 'samples': 15598080, 'steps': 30464, 'loss/train': 2.5630083084106445} +03/05/2022 01:16:09 - INFO - codeparrot_training - Step 30465: {'lr': 0.0004557355308528366, 'samples': 15598592, 'steps': 30465, 'loss/train': 2.3153674602508545} +03/05/2022 01:16:10 - INFO - codeparrot_training - Skipping example with length 714 (seq_length=1024) +03/05/2022 01:16:14 - INFO - codeparrot_training - Step 30466: {'lr': 0.00045573251591120545, 'samples': 15599104, 'steps': 30466, 'loss/train': 1.7814710140228271} +03/05/2022 01:16:18 - INFO - codeparrot_training - Step 30467: {'lr': 0.00045572950087687447, 'samples': 15599616, 'steps': 30467, 'loss/train': 2.207195520401001} +03/05/2022 01:16:18 - INFO - codeparrot_training - Skipping example with length 419 (seq_length=1024) +03/05/2022 01:16:23 - INFO - codeparrot_training - Step 30468: {'lr': 0.0004557264857498449, 'samples': 15600128, 'steps': 30468, 'loss/train': 2.0599067211151123} +03/05/2022 01:16:26 - INFO - codeparrot_training - Step 30469: {'lr': 0.0004557234705301182, 'samples': 15600640, 'steps': 30469, 'loss/train': 2.0651638507843018} +03/05/2022 01:16:26 - INFO - codeparrot_training - Skipping example with length 526 (seq_length=1024) +03/05/2022 01:16:31 - INFO - codeparrot_training - Step 30470: {'lr': 0.0004557204552176957, 'samples': 15601152, 'steps': 30470, 'loss/train': 2.6290104389190674} +03/05/2022 01:16:34 - INFO - codeparrot_training - Step 30471: {'lr': 0.0004557174398125786, 'samples': 15601664, 'steps': 30471, 'loss/train': 1.8247712850570679} +03/05/2022 01:16:34 - INFO - codeparrot_training - Skipping example with length 360 (seq_length=1024) +03/05/2022 01:16:40 - INFO - codeparrot_training - Step 30472: {'lr': 0.00045571442431476856, 'samples': 15602176, 'steps': 30472, 'loss/train': 1.9465539455413818} +03/05/2022 01:16:42 - INFO - codeparrot_training - Skipping example with length 520 (seq_length=1024) +03/05/2022 01:16:45 - INFO - codeparrot_training - Step 30473: {'lr': 0.0004557114087242667, 'samples': 15602688, 'steps': 30473, 'loss/train': 1.3080689907073975} +03/05/2022 01:16:48 - INFO - codeparrot_training - Step 30474: {'lr': 0.0004557083930410745, 'samples': 15603200, 'steps': 30474, 'loss/train': 1.3806581497192383} +03/05/2022 01:16:51 - INFO - codeparrot_training - Skipping example with length 901 (seq_length=1024) +03/05/2022 01:16:53 - INFO - codeparrot_training - Step 30475: {'lr': 0.0004557053772651932, 'samples': 15603712, 'steps': 30475, 'loss/train': 1.6152102947235107} +03/05/2022 01:16:57 - INFO - codeparrot_training - Step 30476: {'lr': 0.00045570236139662426, 'samples': 15604224, 'steps': 30476, 'loss/train': 1.8976211547851562} +03/05/2022 01:16:59 - INFO - codeparrot_training - Skipping example with length 951 (seq_length=1024) +03/05/2022 01:17:02 - INFO - codeparrot_training - Step 30477: {'lr': 0.000455699345435369, 'samples': 15604736, 'steps': 30477, 'loss/train': 1.6124889850616455} +03/05/2022 01:17:05 - INFO - codeparrot_training - Step 30478: {'lr': 0.0004556963293814288, 'samples': 15605248, 'steps': 30478, 'loss/train': 2.411875009536743} +03/05/2022 01:17:08 - INFO - codeparrot_training - Skipping example with length 99 (seq_length=1024) +03/05/2022 01:17:10 - INFO - codeparrot_training - Step 30479: {'lr': 0.000455693313234805, 'samples': 15605760, 'steps': 30479, 'loss/train': 1.7829580307006836} +03/05/2022 01:17:14 - INFO - codeparrot_training - Step 30480: {'lr': 0.000455690296995499, 'samples': 15606272, 'steps': 30480, 'loss/train': 3.618541717529297} +03/05/2022 01:17:16 - INFO - codeparrot_training - Skipping example with length 852 (seq_length=1024) +03/05/2022 01:17:19 - INFO - codeparrot_training - Step 30481: {'lr': 0.00045568728066351205, 'samples': 15606784, 'steps': 30481, 'loss/train': 0.8460149168968201} +03/05/2022 01:17:22 - INFO - codeparrot_training - Step 30482: {'lr': 0.0004556842642388457, 'samples': 15607296, 'steps': 30482, 'loss/train': 1.5652014017105103} +03/05/2022 01:17:24 - INFO - codeparrot_training - Skipping example with length 324 (seq_length=1024) +03/05/2022 01:17:27 - INFO - codeparrot_training - Step 30483: {'lr': 0.0004556812477215011, 'samples': 15607808, 'steps': 30483, 'loss/train': 2.0389010906219482} +03/05/2022 01:17:30 - INFO - codeparrot_training - Step 30484: {'lr': 0.0004556782311114798, 'samples': 15608320, 'steps': 30484, 'loss/train': 1.4681047201156616} +03/05/2022 01:17:33 - INFO - codeparrot_training - Skipping example with length 964 (seq_length=1024) +03/05/2022 01:17:36 - INFO - codeparrot_training - Step 30485: {'lr': 0.00045567521440878294, 'samples': 15608832, 'steps': 30485, 'loss/train': 1.9434428215026855} +03/05/2022 01:17:39 - INFO - codeparrot_training - Step 30486: {'lr': 0.000455672197613412, 'samples': 15609344, 'steps': 30486, 'loss/train': 1.3529409170150757} +03/05/2022 01:17:41 - INFO - codeparrot_training - Skipping example with length 996 (seq_length=1024) +03/05/2022 01:17:44 - INFO - codeparrot_training - Step 30487: {'lr': 0.00045566918072536844, 'samples': 15609856, 'steps': 30487, 'loss/train': 2.5418858528137207} +03/05/2022 01:17:48 - INFO - codeparrot_training - Step 30488: {'lr': 0.00045566616374465355, 'samples': 15610368, 'steps': 30488, 'loss/train': 1.7175304889678955} +03/05/2022 01:17:50 - INFO - codeparrot_training - Skipping example with length 560 (seq_length=1024) +03/05/2022 01:17:53 - INFO - codeparrot_training - Step 30489: {'lr': 0.0004556631466712686, 'samples': 15610880, 'steps': 30489, 'loss/train': 1.1236913204193115} +03/05/2022 01:17:56 - INFO - codeparrot_training - Step 30490: {'lr': 0.00045566012950521497, 'samples': 15611392, 'steps': 30490, 'loss/train': 1.595499873161316} +03/05/2022 01:17:58 - INFO - codeparrot_training - Skipping example with length 899 (seq_length=1024) +03/05/2022 01:18:01 - INFO - codeparrot_training - Step 30491: {'lr': 0.0004556571122464941, 'samples': 15611904, 'steps': 30491, 'loss/train': 0.9231150150299072} +03/05/2022 01:18:05 - INFO - codeparrot_training - Step 30492: {'lr': 0.0004556540948951073, 'samples': 15612416, 'steps': 30492, 'loss/train': 1.1141771078109741} +03/05/2022 01:18:07 - INFO - codeparrot_training - Skipping example with length 622 (seq_length=1024) +03/05/2022 01:18:10 - INFO - codeparrot_training - Step 30493: {'lr': 0.00045565107745105594, 'samples': 15612928, 'steps': 30493, 'loss/train': 1.700252652168274} +03/05/2022 01:18:13 - INFO - codeparrot_training - Step 30494: {'lr': 0.00045564805991434135, 'samples': 15613440, 'steps': 30494, 'loss/train': 3.7589571475982666} +03/05/2022 01:18:16 - INFO - codeparrot_training - Step 30495: {'lr': 0.00045564504228496494, 'samples': 15613952, 'steps': 30495, 'loss/train': 1.7340096235275269} +03/05/2022 01:18:16 - INFO - codeparrot_training - Skipping example with length 629 (seq_length=1024) +03/05/2022 01:18:22 - INFO - codeparrot_training - Step 30496: {'lr': 0.0004556420245629281, 'samples': 15614464, 'steps': 30496, 'loss/train': 1.672154188156128} +03/05/2022 01:18:25 - INFO - codeparrot_training - Step 30497: {'lr': 0.00045563900674823205, 'samples': 15614976, 'steps': 30497, 'loss/train': 2.5248501300811768} +03/05/2022 01:18:25 - INFO - codeparrot_training - Skipping example with length 280 (seq_length=1024) +03/05/2022 01:18:30 - INFO - codeparrot_training - Step 30498: {'lr': 0.0004556359888408783, 'samples': 15615488, 'steps': 30498, 'loss/train': 6.580761909484863} +03/05/2022 01:18:33 - INFO - codeparrot_training - Step 30499: {'lr': 0.00045563297084086807, 'samples': 15616000, 'steps': 30499, 'loss/train': 2.007497787475586} +03/05/2022 01:18:34 - INFO - codeparrot_training - Skipping example with length 653 (seq_length=1024) +03/05/2022 01:18:39 - INFO - codeparrot_training - Step 30500: {'lr': 0.00045562995274820285, 'samples': 15616512, 'steps': 30500, 'loss/train': 1.5775742530822754} +03/05/2022 01:18:42 - INFO - codeparrot_training - Step 30501: {'lr': 0.00045562693456288394, 'samples': 15617024, 'steps': 30501, 'loss/train': 1.2036188840866089} +03/05/2022 01:18:42 - INFO - codeparrot_training - Skipping example with length 9 (seq_length=1024) +03/05/2022 01:18:47 - INFO - codeparrot_training - Step 30502: {'lr': 0.00045562391628491274, 'samples': 15617536, 'steps': 30502, 'loss/train': 1.5936039686203003} +03/05/2022 01:18:50 - INFO - codeparrot_training - Step 30503: {'lr': 0.00045562089791429056, 'samples': 15618048, 'steps': 30503, 'loss/train': 3.3216190338134766} +03/05/2022 01:18:51 - INFO - codeparrot_training - Skipping example with length 700 (seq_length=1024) +03/05/2022 01:18:56 - INFO - codeparrot_training - Step 30504: {'lr': 0.00045561787945101875, 'samples': 15618560, 'steps': 30504, 'loss/train': 2.2713258266448975} +03/05/2022 01:18:59 - INFO - codeparrot_training - Step 30505: {'lr': 0.0004556148608950987, 'samples': 15619072, 'steps': 30505, 'loss/train': 2.04522705078125} +03/05/2022 01:19:00 - INFO - codeparrot_training - Skipping example with length 623 (seq_length=1024) +03/05/2022 01:19:04 - INFO - codeparrot_training - Step 30506: {'lr': 0.0004556118422465319, 'samples': 15619584, 'steps': 30506, 'loss/train': 0.8919593095779419} +03/05/2022 01:19:07 - INFO - codeparrot_training - Step 30507: {'lr': 0.00045560882350531936, 'samples': 15620096, 'steps': 30507, 'loss/train': 2.0622689723968506} +03/05/2022 01:19:08 - INFO - codeparrot_training - Skipping example with length 102 (seq_length=1024) +03/05/2022 01:19:12 - INFO - codeparrot_training - Step 30508: {'lr': 0.00045560580467146275, 'samples': 15620608, 'steps': 30508, 'loss/train': 1.3258651494979858} +03/05/2022 01:19:15 - INFO - codeparrot_training - Step 30509: {'lr': 0.00045560278574496334, 'samples': 15621120, 'steps': 30509, 'loss/train': 2.6732876300811768} +03/05/2022 01:19:16 - INFO - codeparrot_training - Skipping example with length 504 (seq_length=1024) +03/05/2022 01:19:21 - INFO - codeparrot_training - Step 30510: {'lr': 0.0004555997667258225, 'samples': 15621632, 'steps': 30510, 'loss/train': 2.1665115356445312} +03/05/2022 01:19:24 - INFO - codeparrot_training - Step 30511: {'lr': 0.0004555967476140416, 'samples': 15622144, 'steps': 30511, 'loss/train': 1.3707630634307861} +03/05/2022 01:19:24 - INFO - codeparrot_training - Skipping example with length 1009 (seq_length=1024) +03/05/2022 01:19:29 - INFO - codeparrot_training - Step 30512: {'lr': 0.00045559372840962186, 'samples': 15622656, 'steps': 30512, 'loss/train': 1.9391942024230957} +03/05/2022 01:19:32 - INFO - codeparrot_training - Step 30513: {'lr': 0.00045559070911256486, 'samples': 15623168, 'steps': 30513, 'loss/train': 1.6365269422531128} +03/05/2022 01:19:34 - INFO - codeparrot_training - Skipping example with length 909 (seq_length=1024) +03/05/2022 01:19:38 - INFO - codeparrot_training - Step 30514: {'lr': 0.00045558768972287183, 'samples': 15623680, 'steps': 30514, 'loss/train': 1.7687983512878418} +03/05/2022 01:19:41 - INFO - codeparrot_training - Step 30515: {'lr': 0.0004555846702405442, 'samples': 15624192, 'steps': 30515, 'loss/train': 1.8858639001846313} +03/05/2022 01:19:42 - INFO - codeparrot_training - Skipping example with length 899 (seq_length=1024) +03/05/2022 01:19:46 - INFO - codeparrot_training - Step 30516: {'lr': 0.0004555816506655832, 'samples': 15624704, 'steps': 30516, 'loss/train': 2.480917453765869} +03/05/2022 01:19:49 - INFO - codeparrot_training - Step 30517: {'lr': 0.00045557863099799034, 'samples': 15625216, 'steps': 30517, 'loss/train': 2.493565082550049} +03/05/2022 01:19:50 - INFO - codeparrot_training - Skipping example with length 650 (seq_length=1024) +03/05/2022 01:19:55 - INFO - codeparrot_training - Step 30518: {'lr': 0.000455575611237767, 'samples': 15625728, 'steps': 30518, 'loss/train': 1.6163883209228516} +03/05/2022 01:19:58 - INFO - codeparrot_training - Step 30519: {'lr': 0.00045557259138491435, 'samples': 15626240, 'steps': 30519, 'loss/train': 2.393575668334961} +03/05/2022 01:19:59 - INFO - codeparrot_training - Skipping example with length 27 (seq_length=1024) +03/05/2022 01:20:03 - INFO - codeparrot_training - Step 30520: {'lr': 0.0004555695714394339, 'samples': 15626752, 'steps': 30520, 'loss/train': 5.482495307922363} +03/05/2022 01:20:06 - INFO - codeparrot_training - Step 30521: {'lr': 0.00045556655140132696, 'samples': 15627264, 'steps': 30521, 'loss/train': 1.679814338684082} +03/05/2022 01:20:07 - INFO - codeparrot_training - Skipping example with length 463 (seq_length=1024) +03/05/2022 01:20:12 - INFO - codeparrot_training - Step 30522: {'lr': 0.00045556353127059493, 'samples': 15627776, 'steps': 30522, 'loss/train': 1.9187484979629517} +03/05/2022 01:20:15 - INFO - codeparrot_training - Step 30523: {'lr': 0.0004555605110472391, 'samples': 15628288, 'steps': 30523, 'loss/train': 3.093512773513794} +03/05/2022 01:20:15 - INFO - codeparrot_training - Skipping example with length 473 (seq_length=1024) +03/05/2022 01:20:20 - INFO - codeparrot_training - Step 30524: {'lr': 0.0004555574907312609, 'samples': 15628800, 'steps': 30524, 'loss/train': 2.110553741455078} +03/05/2022 01:20:23 - INFO - codeparrot_training - Step 30525: {'lr': 0.00045555447032266167, 'samples': 15629312, 'steps': 30525, 'loss/train': 1.5908859968185425} +03/05/2022 01:20:23 - INFO - codeparrot_training - Skipping example with length 53 (seq_length=1024) +03/05/2022 01:20:28 - INFO - codeparrot_training - Step 30526: {'lr': 0.0004555514498214428, 'samples': 15629824, 'steps': 30526, 'loss/train': 1.18439781665802} +03/05/2022 01:20:32 - INFO - codeparrot_training - Step 30527: {'lr': 0.0004555484292276055, 'samples': 15630336, 'steps': 30527, 'loss/train': 1.8635817766189575} +03/05/2022 01:20:32 - INFO - codeparrot_training - Skipping example with length 777 (seq_length=1024) +03/05/2022 01:20:37 - INFO - codeparrot_training - Step 30528: {'lr': 0.0004555454085411514, 'samples': 15630848, 'steps': 30528, 'loss/train': 2.3025524616241455} +03/05/2022 01:20:40 - INFO - codeparrot_training - Step 30529: {'lr': 0.0004555423877620817, 'samples': 15631360, 'steps': 30529, 'loss/train': 6.811587810516357} +03/05/2022 01:20:41 - INFO - codeparrot_training - Skipping example with length 852 (seq_length=1024) +03/05/2022 01:20:46 - INFO - codeparrot_training - Step 30530: {'lr': 0.00045553936689039765, 'samples': 15631872, 'steps': 30530, 'loss/train': 0.7969969511032104} +03/05/2022 01:20:49 - INFO - codeparrot_training - Step 30531: {'lr': 0.00045553634592610084, 'samples': 15632384, 'steps': 30531, 'loss/train': 0.6186039447784424} +03/05/2022 01:20:49 - INFO - codeparrot_training - Skipping example with length 28 (seq_length=1024) +03/05/2022 01:20:54 - INFO - codeparrot_training - Step 30532: {'lr': 0.00045553332486919246, 'samples': 15632896, 'steps': 30532, 'loss/train': 0.7514795064926147} +03/05/2022 01:20:57 - INFO - codeparrot_training - Step 30533: {'lr': 0.000455530303719674, 'samples': 15633408, 'steps': 30533, 'loss/train': 1.7468414306640625} +03/05/2022 01:20:58 - INFO - codeparrot_training - Skipping example with length 730 (seq_length=1024) +03/05/2022 01:21:02 - INFO - codeparrot_training - Step 30534: {'lr': 0.00045552728247754673, 'samples': 15633920, 'steps': 30534, 'loss/train': 1.3344918489456177} +03/05/2022 01:21:06 - INFO - codeparrot_training - Step 30535: {'lr': 0.000455524261142812, 'samples': 15634432, 'steps': 30535, 'loss/train': 1.503164529800415} +03/05/2022 01:21:06 - INFO - codeparrot_training - Skipping example with length 215 (seq_length=1024) +03/05/2022 01:21:11 - INFO - codeparrot_training - Step 30536: {'lr': 0.00045552123971547123, 'samples': 15634944, 'steps': 30536, 'loss/train': 1.4112521409988403} +03/05/2022 01:21:14 - INFO - codeparrot_training - Step 30537: {'lr': 0.00045551821819552575, 'samples': 15635456, 'steps': 30537, 'loss/train': 1.826975703239441} +03/05/2022 01:21:15 - INFO - codeparrot_training - Skipping example with length 492 (seq_length=1024) +03/05/2022 01:21:19 - INFO - codeparrot_training - Step 30538: {'lr': 0.0004555151965829769, 'samples': 15635968, 'steps': 30538, 'loss/train': 0.896876871585846} +03/05/2022 01:21:23 - INFO - codeparrot_training - Step 30539: {'lr': 0.0004555121748778261, 'samples': 15636480, 'steps': 30539, 'loss/train': 1.764379858970642} +03/05/2022 01:21:23 - INFO - codeparrot_training - Skipping example with length 135 (seq_length=1024) +03/05/2022 01:21:28 - INFO - codeparrot_training - Step 30540: {'lr': 0.0004555091530800748, 'samples': 15636992, 'steps': 30540, 'loss/train': 2.457692861557007} +03/05/2022 01:21:31 - INFO - codeparrot_training - Step 30541: {'lr': 0.0004555061311897241, 'samples': 15637504, 'steps': 30541, 'loss/train': 1.7330117225646973} +03/05/2022 01:21:31 - INFO - codeparrot_training - Skipping example with length 727 (seq_length=1024) +03/05/2022 01:21:36 - INFO - codeparrot_training - Step 30542: {'lr': 0.0004555031092067756, 'samples': 15638016, 'steps': 30542, 'loss/train': 1.2393637895584106} +03/05/2022 01:21:39 - INFO - codeparrot_training - Step 30543: {'lr': 0.00045550008713123047, 'samples': 15638528, 'steps': 30543, 'loss/train': 1.5893667936325073} +03/05/2022 01:21:39 - INFO - codeparrot_training - Skipping example with length 189 (seq_length=1024) +03/05/2022 01:21:45 - INFO - codeparrot_training - Step 30544: {'lr': 0.00045549706496309027, 'samples': 15639040, 'steps': 30544, 'loss/train': 2.5014889240264893} +03/05/2022 01:21:48 - INFO - codeparrot_training - Step 30545: {'lr': 0.0004554940427023562, 'samples': 15639552, 'steps': 30545, 'loss/train': 1.3070255517959595} +03/05/2022 01:21:48 - INFO - codeparrot_training - Skipping example with length 908 (seq_length=1024) +03/05/2022 01:21:53 - INFO - codeparrot_training - Step 30546: {'lr': 0.00045549102034902973, 'samples': 15640064, 'steps': 30546, 'loss/train': 1.8866541385650635} +03/05/2022 01:21:56 - INFO - codeparrot_training - Step 30547: {'lr': 0.0004554879979031121, 'samples': 15640576, 'steps': 30547, 'loss/train': 1.5025571584701538} +03/05/2022 01:21:56 - INFO - codeparrot_training - Skipping example with length 585 (seq_length=1024) +03/05/2022 01:22:01 - INFO - codeparrot_training - Step 30548: {'lr': 0.00045548497536460487, 'samples': 15641088, 'steps': 30548, 'loss/train': 1.244983196258545} +03/05/2022 01:22:04 - INFO - codeparrot_training - Step 30549: {'lr': 0.00045548195273350926, 'samples': 15641600, 'steps': 30549, 'loss/train': 1.721570611000061} +03/05/2022 01:22:05 - INFO - codeparrot_training - Skipping example with length 364 (seq_length=1024) +03/05/2022 01:22:10 - INFO - codeparrot_training - Step 30550: {'lr': 0.0004554789300098265, 'samples': 15642112, 'steps': 30550, 'loss/train': 1.398437738418579} +03/05/2022 01:22:13 - INFO - codeparrot_training - Step 30551: {'lr': 0.00045547590719355823, 'samples': 15642624, 'steps': 30551, 'loss/train': 1.5419656038284302} +03/05/2022 01:22:13 - INFO - codeparrot_training - Skipping example with length 796 (seq_length=1024) +03/05/2022 01:22:18 - INFO - codeparrot_training - Step 30552: {'lr': 0.00045547288428470574, 'samples': 15643136, 'steps': 30552, 'loss/train': 1.4432038068771362} +03/05/2022 01:22:21 - INFO - codeparrot_training - Skipping example with length 973 (seq_length=1024) +03/05/2022 01:22:23 - INFO - codeparrot_training - Step 30553: {'lr': 0.0004554698612832703, 'samples': 15643648, 'steps': 30553, 'loss/train': 1.002095103263855} +03/05/2022 01:22:26 - INFO - codeparrot_training - Step 30554: {'lr': 0.00045546683818925327, 'samples': 15644160, 'steps': 30554, 'loss/train': 1.3449985980987549} +03/05/2022 01:22:29 - INFO - codeparrot_training - Skipping example with length 210 (seq_length=1024) +03/05/2022 01:22:32 - INFO - codeparrot_training - Step 30555: {'lr': 0.000455463815002656, 'samples': 15644672, 'steps': 30555, 'loss/train': 0.4842868447303772} +03/05/2022 01:22:35 - INFO - codeparrot_training - Step 30556: {'lr': 0.00045546079172348, 'samples': 15645184, 'steps': 30556, 'loss/train': 1.6641240119934082} +03/05/2022 01:22:38 - INFO - codeparrot_training - Skipping example with length 6 (seq_length=1024) +03/05/2022 01:22:40 - INFO - codeparrot_training - Step 30557: {'lr': 0.00045545776835172647, 'samples': 15645696, 'steps': 30557, 'loss/train': 1.3659201860427856} +03/05/2022 01:22:43 - INFO - codeparrot_training - Step 30558: {'lr': 0.00045545474488739693, 'samples': 15646208, 'steps': 30558, 'loss/train': 1.9520589113235474} +03/05/2022 01:22:46 - INFO - codeparrot_training - Skipping example with length 551 (seq_length=1024) +03/05/2022 01:22:48 - INFO - codeparrot_training - Step 30559: {'lr': 0.0004554517213304926, 'samples': 15646720, 'steps': 30559, 'loss/train': 2.3407187461853027} +03/05/2022 01:22:52 - INFO - codeparrot_training - Step 30560: {'lr': 0.00045544869768101486, 'samples': 15647232, 'steps': 30560, 'loss/train': 1.9165687561035156} +03/05/2022 01:22:54 - INFO - codeparrot_training - Skipping example with length 393 (seq_length=1024) +03/05/2022 01:22:57 - INFO - codeparrot_training - Step 30561: {'lr': 0.0004554456739389652, 'samples': 15647744, 'steps': 30561, 'loss/train': 1.6392617225646973} +03/05/2022 01:23:00 - INFO - codeparrot_training - Step 30562: {'lr': 0.00045544265010434484, 'samples': 15648256, 'steps': 30562, 'loss/train': 1.3429760932922363} +03/05/2022 01:23:02 - INFO - codeparrot_training - Skipping example with length 10 (seq_length=1024) +03/05/2022 01:23:05 - INFO - codeparrot_training - Step 30563: {'lr': 0.0004554396261771552, 'samples': 15648768, 'steps': 30563, 'loss/train': 1.4774656295776367} +03/05/2022 01:23:08 - INFO - codeparrot_training - Step 30564: {'lr': 0.00045543660215739755, 'samples': 15649280, 'steps': 30564, 'loss/train': 1.8188945055007935} +03/05/2022 01:23:11 - INFO - codeparrot_training - Skipping example with length 129 (seq_length=1024) +03/05/2022 01:23:14 - INFO - codeparrot_training - Step 30565: {'lr': 0.00045543357804507344, 'samples': 15649792, 'steps': 30565, 'loss/train': 1.3465498685836792} +03/05/2022 01:23:17 - INFO - codeparrot_training - Step 30566: {'lr': 0.00045543055384018405, 'samples': 15650304, 'steps': 30566, 'loss/train': 1.3827776908874512} +03/05/2022 01:23:19 - INFO - codeparrot_training - Skipping example with length 600 (seq_length=1024) +03/05/2022 01:23:22 - INFO - codeparrot_training - Step 30567: {'lr': 0.0004554275295427309, 'samples': 15650816, 'steps': 30567, 'loss/train': 0.6985491514205933} +03/05/2022 01:23:25 - INFO - codeparrot_training - Step 30568: {'lr': 0.0004554245051527153, 'samples': 15651328, 'steps': 30568, 'loss/train': 1.4645559787750244} +03/05/2022 01:23:27 - INFO - codeparrot_training - Skipping example with length 321 (seq_length=1024) +03/05/2022 01:23:30 - INFO - codeparrot_training - Step 30569: {'lr': 0.0004554214806701384, 'samples': 15651840, 'steps': 30569, 'loss/train': 2.65498685836792} +03/05/2022 01:23:34 - INFO - codeparrot_training - Step 30570: {'lr': 0.000455418456095002, 'samples': 15652352, 'steps': 30570, 'loss/train': 1.0230474472045898} +03/05/2022 01:23:36 - INFO - codeparrot_training - Skipping example with length 375 (seq_length=1024) +03/05/2022 01:23:39 - INFO - codeparrot_training - Step 30571: {'lr': 0.000455415431427307, 'samples': 15652864, 'steps': 30571, 'loss/train': 2.5440292358398438} +03/05/2022 01:23:42 - INFO - codeparrot_training - Step 30572: {'lr': 0.00045541240666705516, 'samples': 15653376, 'steps': 30572, 'loss/train': 0.7069652676582336} +03/05/2022 01:23:45 - INFO - codeparrot_training - Skipping example with length 178 (seq_length=1024) +03/05/2022 01:23:48 - INFO - codeparrot_training - Step 30573: {'lr': 0.0004554093818142475, 'samples': 15653888, 'steps': 30573, 'loss/train': 1.5299464464187622} +03/05/2022 01:23:51 - INFO - codeparrot_training - Step 30574: {'lr': 0.0004554063568688857, 'samples': 15654400, 'steps': 30574, 'loss/train': 2.3961970806121826} +03/05/2022 01:23:54 - INFO - codeparrot_training - Skipping example with length 277 (seq_length=1024) +03/05/2022 01:23:56 - INFO - codeparrot_training - Step 30575: {'lr': 0.0004554033318309708, 'samples': 15654912, 'steps': 30575, 'loss/train': 2.5076241493225098} +03/05/2022 01:23:59 - INFO - codeparrot_training - Step 30576: {'lr': 0.00045540030670050447, 'samples': 15655424, 'steps': 30576, 'loss/train': 0.21987862884998322} +03/05/2022 01:24:02 - INFO - codeparrot_training - Step 30577: {'lr': 0.0004553972814774878, 'samples': 15655936, 'steps': 30577, 'loss/train': 2.0527780055999756} +03/05/2022 01:24:02 - INFO - codeparrot_training - Skipping example with length 717 (seq_length=1024) +03/05/2022 01:24:08 - INFO - codeparrot_training - Step 30578: {'lr': 0.00045539425616192243, 'samples': 15656448, 'steps': 30578, 'loss/train': 1.390587568283081} +03/05/2022 01:24:11 - INFO - codeparrot_training - Step 30579: {'lr': 0.0004553912307538095, 'samples': 15656960, 'steps': 30579, 'loss/train': 1.6003605127334595} +03/05/2022 01:24:11 - INFO - codeparrot_training - Skipping example with length 394 (seq_length=1024) +03/05/2022 01:24:16 - INFO - codeparrot_training - Step 30580: {'lr': 0.0004553882052531504, 'samples': 15657472, 'steps': 30580, 'loss/train': 1.900411605834961} +03/05/2022 01:24:20 - INFO - codeparrot_training - Step 30581: {'lr': 0.00045538517965994663, 'samples': 15657984, 'steps': 30581, 'loss/train': 2.160693645477295} +03/05/2022 01:24:20 - INFO - codeparrot_training - Skipping example with length 444 (seq_length=1024) +03/05/2022 01:24:25 - INFO - codeparrot_training - Step 30582: {'lr': 0.0004553821539741994, 'samples': 15658496, 'steps': 30582, 'loss/train': 1.271679162979126} +03/05/2022 01:24:28 - INFO - codeparrot_training - Step 30583: {'lr': 0.0004553791281959102, 'samples': 15659008, 'steps': 30583, 'loss/train': 2.137972116470337} +03/05/2022 01:24:28 - INFO - codeparrot_training - Skipping example with length 565 (seq_length=1024) +03/05/2022 01:24:34 - INFO - codeparrot_training - Step 30584: {'lr': 0.00045537610232508033, 'samples': 15659520, 'steps': 30584, 'loss/train': 1.634616494178772} +03/05/2022 01:24:37 - INFO - codeparrot_training - Step 30585: {'lr': 0.0004553730763617111, 'samples': 15660032, 'steps': 30585, 'loss/train': 1.8432791233062744} +03/05/2022 01:24:37 - INFO - codeparrot_training - Skipping example with length 1003 (seq_length=1024) +03/05/2022 01:24:42 - INFO - codeparrot_training - Step 30586: {'lr': 0.000455370050305804, 'samples': 15660544, 'steps': 30586, 'loss/train': 2.2213644981384277} +03/05/2022 01:24:45 - INFO - codeparrot_training - Skipping example with length 450 (seq_length=1024) +03/05/2022 01:24:47 - INFO - codeparrot_training - Step 30587: {'lr': 0.0004553670241573603, 'samples': 15661056, 'steps': 30587, 'loss/train': 1.3643492460250854} +03/05/2022 01:24:51 - INFO - codeparrot_training - Step 30588: {'lr': 0.00045536399791638133, 'samples': 15661568, 'steps': 30588, 'loss/train': 0.12203964591026306} +03/05/2022 01:24:53 - INFO - codeparrot_training - Skipping example with length 800 (seq_length=1024) +03/05/2022 01:24:56 - INFO - codeparrot_training - Step 30589: {'lr': 0.0004553609715828686, 'samples': 15662080, 'steps': 30589, 'loss/train': 2.055931568145752} +03/05/2022 01:24:59 - INFO - codeparrot_training - Step 30590: {'lr': 0.00045535794515682334, 'samples': 15662592, 'steps': 30590, 'loss/train': 1.9583996534347534} +03/05/2022 01:25:02 - INFO - codeparrot_training - Skipping example with length 198 (seq_length=1024) +03/05/2022 01:25:04 - INFO - codeparrot_training - Step 30591: {'lr': 0.00045535491863824695, 'samples': 15663104, 'steps': 30591, 'loss/train': 0.9677415490150452} +03/05/2022 01:25:07 - INFO - codeparrot_training - Step 30592: {'lr': 0.0004553518920271408, 'samples': 15663616, 'steps': 30592, 'loss/train': 1.3254523277282715} +03/05/2022 01:25:10 - INFO - codeparrot_training - Skipping example with length 414 (seq_length=1024) +03/05/2022 01:25:13 - INFO - codeparrot_training - Step 30593: {'lr': 0.00045534886532350627, 'samples': 15664128, 'steps': 30593, 'loss/train': 2.040125608444214} +03/05/2022 01:25:16 - INFO - codeparrot_training - Step 30594: {'lr': 0.00045534583852734474, 'samples': 15664640, 'steps': 30594, 'loss/train': 1.9252053499221802} +03/05/2022 01:25:18 - INFO - codeparrot_training - Skipping example with length 682 (seq_length=1024) +03/05/2022 01:25:21 - INFO - codeparrot_training - Step 30595: {'lr': 0.00045534281163865756, 'samples': 15665152, 'steps': 30595, 'loss/train': 1.4463013410568237} +03/05/2022 01:25:24 - INFO - codeparrot_training - Step 30596: {'lr': 0.000455339784657446, 'samples': 15665664, 'steps': 30596, 'loss/train': 1.8405228853225708} +03/05/2022 01:25:26 - INFO - codeparrot_training - Skipping example with length 490 (seq_length=1024) +03/05/2022 01:25:29 - INFO - codeparrot_training - Step 30597: {'lr': 0.0004553367575837115, 'samples': 15666176, 'steps': 30597, 'loss/train': 1.485500693321228} +03/05/2022 01:25:33 - INFO - codeparrot_training - Step 30598: {'lr': 0.00045533373041745545, 'samples': 15666688, 'steps': 30598, 'loss/train': 1.8427996635437012} +03/05/2022 01:25:35 - INFO - codeparrot_training - Skipping example with length 247 (seq_length=1024) +03/05/2022 01:25:38 - INFO - codeparrot_training - Step 30599: {'lr': 0.00045533070315867917, 'samples': 15667200, 'steps': 30599, 'loss/train': 1.323441982269287} +03/05/2022 01:25:41 - INFO - codeparrot_training - Step 30600: {'lr': 0.0004553276758073841, 'samples': 15667712, 'steps': 30600, 'loss/train': 1.608496904373169} +03/05/2022 01:25:43 - INFO - codeparrot_training - Skipping example with length 63 (seq_length=1024) +03/05/2022 01:25:46 - INFO - codeparrot_training - Step 30601: {'lr': 0.00045532464836357155, 'samples': 15668224, 'steps': 30601, 'loss/train': 2.0748708248138428} +03/05/2022 01:25:49 - INFO - codeparrot_training - Step 30602: {'lr': 0.0004553216208272428, 'samples': 15668736, 'steps': 30602, 'loss/train': 1.092337965965271} +03/05/2022 01:25:51 - INFO - codeparrot_training - Skipping example with length 98 (seq_length=1024) +03/05/2022 01:25:55 - INFO - codeparrot_training - Step 30603: {'lr': 0.0004553185931983994, 'samples': 15669248, 'steps': 30603, 'loss/train': 1.4149433374404907} +03/05/2022 01:25:58 - INFO - codeparrot_training - Step 30604: {'lr': 0.00045531556547704255, 'samples': 15669760, 'steps': 30604, 'loss/train': 1.3749829530715942} +03/05/2022 01:26:00 - INFO - codeparrot_training - Skipping example with length 468 (seq_length=1024) +03/05/2022 01:26:03 - INFO - codeparrot_training - Step 30605: {'lr': 0.00045531253766317373, 'samples': 15670272, 'steps': 30605, 'loss/train': 1.5338456630706787} +03/05/2022 01:26:06 - INFO - codeparrot_training - Step 30606: {'lr': 0.0004553095097567942, 'samples': 15670784, 'steps': 30606, 'loss/train': 2.0647571086883545} +03/05/2022 01:26:08 - INFO - codeparrot_training - Skipping example with length 306 (seq_length=1024) +03/05/2022 01:26:11 - INFO - codeparrot_training - Step 30607: {'lr': 0.0004553064817579053, 'samples': 15671296, 'steps': 30607, 'loss/train': 0.8874843716621399} +03/05/2022 01:26:15 - INFO - codeparrot_training - Step 30608: {'lr': 0.0004553034536665086, 'samples': 15671808, 'steps': 30608, 'loss/train': 1.807150959968567} +03/05/2022 01:26:16 - INFO - codeparrot_training - Skipping example with length 266 (seq_length=1024) +03/05/2022 01:26:20 - INFO - codeparrot_training - Step 30609: {'lr': 0.0004553004254826053, 'samples': 15672320, 'steps': 30609, 'loss/train': 1.8416059017181396} +03/05/2022 01:26:23 - INFO - codeparrot_training - Step 30610: {'lr': 0.0004552973972061967, 'samples': 15672832, 'steps': 30610, 'loss/train': 1.0278350114822388} +03/05/2022 01:26:25 - INFO - codeparrot_training - Skipping example with length 217 (seq_length=1024) +03/05/2022 01:26:28 - INFO - codeparrot_training - Step 30611: {'lr': 0.00045529436883728436, 'samples': 15673344, 'steps': 30611, 'loss/train': 1.6898707151412964} +03/05/2022 01:26:32 - INFO - codeparrot_training - Step 30612: {'lr': 0.0004552913403758695, 'samples': 15673856, 'steps': 30612, 'loss/train': 1.1349802017211914} +03/05/2022 01:26:33 - INFO - codeparrot_training - Skipping example with length 404 (seq_length=1024) +03/05/2022 01:26:37 - INFO - codeparrot_training - Step 30613: {'lr': 0.00045528831182195355, 'samples': 15674368, 'steps': 30613, 'loss/train': 1.7550075054168701} +03/05/2022 01:26:40 - INFO - codeparrot_training - Step 30614: {'lr': 0.00045528528317553786, 'samples': 15674880, 'steps': 30614, 'loss/train': 2.2082571983337402} +03/05/2022 01:26:41 - INFO - codeparrot_training - Skipping example with length 935 (seq_length=1024) +03/05/2022 01:26:45 - INFO - codeparrot_training - Step 30615: {'lr': 0.0004552822544366238, 'samples': 15675392, 'steps': 30615, 'loss/train': 1.1485567092895508} +03/05/2022 01:26:48 - INFO - codeparrot_training - Step 30616: {'lr': 0.00045527922560521274, 'samples': 15675904, 'steps': 30616, 'loss/train': 0.07499045878648758} +03/05/2022 01:26:50 - INFO - codeparrot_training - Skipping example with length 492 (seq_length=1024) +03/05/2022 01:26:54 - INFO - codeparrot_training - Step 30617: {'lr': 0.0004552761966813059, 'samples': 15676416, 'steps': 30617, 'loss/train': 1.6735488176345825} +03/05/2022 01:26:57 - INFO - codeparrot_training - Step 30618: {'lr': 0.00045527316766490487, 'samples': 15676928, 'steps': 30618, 'loss/train': 1.7222900390625} +03/05/2022 01:26:58 - INFO - codeparrot_training - Skipping example with length 993 (seq_length=1024) +03/05/2022 01:27:02 - INFO - codeparrot_training - Step 30619: {'lr': 0.000455270138556011, 'samples': 15677440, 'steps': 30619, 'loss/train': 2.4266185760498047} +03/05/2022 01:27:06 - INFO - codeparrot_training - Step 30620: {'lr': 0.00045526710935462543, 'samples': 15677952, 'steps': 30620, 'loss/train': 2.022840976715088} +03/05/2022 01:27:07 - INFO - codeparrot_training - Skipping example with length 511 (seq_length=1024) +03/05/2022 01:27:11 - INFO - codeparrot_training - Step 30621: {'lr': 0.00045526408006074973, 'samples': 15678464, 'steps': 30621, 'loss/train': 1.3902665376663208} +03/05/2022 01:27:14 - INFO - codeparrot_training - Step 30622: {'lr': 0.00045526105067438525, 'samples': 15678976, 'steps': 30622, 'loss/train': 1.7090548276901245} +03/05/2022 01:27:15 - INFO - codeparrot_training - Skipping example with length 51 (seq_length=1024) +03/05/2022 01:27:19 - INFO - codeparrot_training - Step 30623: {'lr': 0.00045525802119553323, 'samples': 15679488, 'steps': 30623, 'loss/train': 1.6807901859283447} +03/05/2022 01:27:22 - INFO - codeparrot_training - Step 30624: {'lr': 0.0004552549916241951, 'samples': 15680000, 'steps': 30624, 'loss/train': 2.7836928367614746} +03/05/2022 01:27:24 - INFO - codeparrot_training - Skipping example with length 313 (seq_length=1024) +03/05/2022 01:27:28 - INFO - codeparrot_training - Step 30625: {'lr': 0.0004552519619603723, 'samples': 15680512, 'steps': 30625, 'loss/train': 1.4765536785125732} +03/05/2022 01:27:31 - INFO - codeparrot_training - Step 30626: {'lr': 0.00045524893220406617, 'samples': 15681024, 'steps': 30626, 'loss/train': 1.6688754558563232} +03/05/2022 01:27:32 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 01:27:36 - INFO - codeparrot_training - Step 30627: {'lr': 0.00045524590235527796, 'samples': 15681536, 'steps': 30627, 'loss/train': 0.10068529099225998} +03/05/2022 01:27:39 - INFO - codeparrot_training - Step 30628: {'lr': 0.0004552428724140091, 'samples': 15682048, 'steps': 30628, 'loss/train': 0.657551646232605} +03/05/2022 01:27:40 - INFO - codeparrot_training - Skipping example with length 80 (seq_length=1024) +03/05/2022 01:27:45 - INFO - codeparrot_training - Step 30629: {'lr': 0.000455239842380261, 'samples': 15682560, 'steps': 30629, 'loss/train': 1.9620801210403442} +03/05/2022 01:27:48 - INFO - codeparrot_training - Step 30630: {'lr': 0.000455236812254035, 'samples': 15683072, 'steps': 30630, 'loss/train': 0.7647385001182556} +03/05/2022 01:27:49 - INFO - codeparrot_training - Skipping example with length 828 (seq_length=1024) +03/05/2022 01:27:53 - INFO - codeparrot_training - Step 30631: {'lr': 0.0004552337820353325, 'samples': 15683584, 'steps': 30631, 'loss/train': 1.2443211078643799} +03/05/2022 01:27:56 - INFO - codeparrot_training - Step 30632: {'lr': 0.00045523075172415476, 'samples': 15684096, 'steps': 30632, 'loss/train': 1.95291006565094} +03/05/2022 01:27:57 - INFO - codeparrot_training - Skipping example with length 672 (seq_length=1024) +03/05/2022 01:28:02 - INFO - codeparrot_training - Step 30633: {'lr': 0.0004552277213205032, 'samples': 15684608, 'steps': 30633, 'loss/train': 1.499145746231079} +03/05/2022 01:28:05 - INFO - codeparrot_training - Step 30634: {'lr': 0.0004552246908243792, 'samples': 15685120, 'steps': 30634, 'loss/train': 1.3935949802398682} +03/05/2022 01:28:05 - INFO - codeparrot_training - Skipping example with length 650 (seq_length=1024) +03/05/2022 01:28:10 - INFO - codeparrot_training - Step 30635: {'lr': 0.00045522166023578413, 'samples': 15685632, 'steps': 30635, 'loss/train': 1.4393086433410645} +03/05/2022 01:28:13 - INFO - codeparrot_training - Step 30636: {'lr': 0.0004552186295547194, 'samples': 15686144, 'steps': 30636, 'loss/train': 1.622164249420166} +03/05/2022 01:28:14 - INFO - codeparrot_training - Skipping example with length 773 (seq_length=1024) +03/05/2022 01:28:18 - INFO - codeparrot_training - Step 30637: {'lr': 0.0004552155987811863, 'samples': 15686656, 'steps': 30637, 'loss/train': 1.506044626235962} +03/05/2022 01:28:22 - INFO - codeparrot_training - Step 30638: {'lr': 0.00045521256791518616, 'samples': 15687168, 'steps': 30638, 'loss/train': 2.505302906036377} +03/05/2022 01:28:22 - INFO - codeparrot_training - Skipping example with length 588 (seq_length=1024) +03/05/2022 01:28:27 - INFO - codeparrot_training - Step 30639: {'lr': 0.0004552095369567205, 'samples': 15687680, 'steps': 30639, 'loss/train': 2.5269901752471924} +03/05/2022 01:28:30 - INFO - codeparrot_training - Step 30640: {'lr': 0.00045520650590579056, 'samples': 15688192, 'steps': 30640, 'loss/train': 0.9382213950157166} +03/05/2022 01:28:31 - INFO - codeparrot_training - Skipping example with length 906 (seq_length=1024) +03/05/2022 01:28:35 - INFO - codeparrot_training - Step 30641: {'lr': 0.00045520347476239763, 'samples': 15688704, 'steps': 30641, 'loss/train': 1.3851901292800903} +03/05/2022 01:28:38 - INFO - codeparrot_training - Step 30642: {'lr': 0.00045520044352654335, 'samples': 15689216, 'steps': 30642, 'loss/train': 2.114215850830078} +03/05/2022 01:28:40 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 01:28:44 - INFO - codeparrot_training - Step 30643: {'lr': 0.0004551974121982288, 'samples': 15689728, 'steps': 30643, 'loss/train': 1.528570294380188} +03/05/2022 01:28:47 - INFO - codeparrot_training - Step 30644: {'lr': 0.00045519438077745543, 'samples': 15690240, 'steps': 30644, 'loss/train': 1.8173609972000122} +03/05/2022 01:28:48 - INFO - codeparrot_training - Skipping example with length 395 (seq_length=1024) +03/05/2022 01:28:52 - INFO - codeparrot_training - Step 30645: {'lr': 0.0004551913492642248, 'samples': 15690752, 'steps': 30645, 'loss/train': 2.14235782623291} +03/05/2022 01:28:55 - INFO - codeparrot_training - Step 30646: {'lr': 0.00045518831765853796, 'samples': 15691264, 'steps': 30646, 'loss/train': 1.9143075942993164} +03/05/2022 01:28:56 - INFO - codeparrot_training - Skipping example with length 121 (seq_length=1024) +03/05/2022 01:29:01 - INFO - codeparrot_training - Step 30647: {'lr': 0.0004551852859603965, 'samples': 15691776, 'steps': 30647, 'loss/train': 1.9740931987762451} +03/05/2022 01:29:04 - INFO - codeparrot_training - Step 30648: {'lr': 0.0004551822541698017, 'samples': 15692288, 'steps': 30648, 'loss/train': 1.8217936754226685} +03/05/2022 01:29:04 - INFO - codeparrot_training - Skipping example with length 798 (seq_length=1024) +03/05/2022 01:29:09 - INFO - codeparrot_training - Step 30649: {'lr': 0.0004551792222867549, 'samples': 15692800, 'steps': 30649, 'loss/train': 0.904915988445282} +03/05/2022 01:29:12 - INFO - codeparrot_training - Step 30650: {'lr': 0.0004551761903112576, 'samples': 15693312, 'steps': 30650, 'loss/train': 1.3376164436340332} +03/05/2022 01:29:13 - INFO - codeparrot_training - Skipping example with length 750 (seq_length=1024) +03/05/2022 01:29:17 - INFO - codeparrot_training - Step 30651: {'lr': 0.000455173158243311, 'samples': 15693824, 'steps': 30651, 'loss/train': 1.5543268918991089} +03/05/2022 01:29:21 - INFO - codeparrot_training - Step 30652: {'lr': 0.0004551701260829166, 'samples': 15694336, 'steps': 30652, 'loss/train': 1.339518427848816} +03/05/2022 01:29:21 - INFO - codeparrot_training - Skipping example with length 431 (seq_length=1024) +03/05/2022 01:29:26 - INFO - codeparrot_training - Step 30653: {'lr': 0.00045516709383007563, 'samples': 15694848, 'steps': 30653, 'loss/train': 2.28776216506958} +03/05/2022 01:29:29 - INFO - codeparrot_training - Step 30654: {'lr': 0.0004551640614847896, 'samples': 15695360, 'steps': 30654, 'loss/train': 1.641797661781311} +03/05/2022 01:29:29 - INFO - codeparrot_training - Skipping example with length 963 (seq_length=1024) +03/05/2022 01:29:34 - INFO - codeparrot_training - Step 30655: {'lr': 0.00045516102904705983, 'samples': 15695872, 'steps': 30655, 'loss/train': 1.7911276817321777} +03/05/2022 01:29:38 - INFO - codeparrot_training - Step 30656: {'lr': 0.0004551579965168876, 'samples': 15696384, 'steps': 30656, 'loss/train': 1.9853310585021973} +03/05/2022 01:29:38 - INFO - codeparrot_training - Skipping example with length 985 (seq_length=1024) +03/05/2022 01:29:43 - INFO - codeparrot_training - Step 30657: {'lr': 0.00045515496389427433, 'samples': 15696896, 'steps': 30657, 'loss/train': 0.0539902038872242} +03/05/2022 01:29:46 - INFO - codeparrot_training - Step 30658: {'lr': 0.0004551519311792215, 'samples': 15697408, 'steps': 30658, 'loss/train': 2.108579158782959} +03/05/2022 01:29:46 - INFO - codeparrot_training - Skipping example with length 698 (seq_length=1024) +03/05/2022 01:29:51 - INFO - codeparrot_training - Step 30659: {'lr': 0.00045514889837173025, 'samples': 15697920, 'steps': 30659, 'loss/train': 2.070024013519287} +03/05/2022 01:29:54 - INFO - codeparrot_training - Step 30660: {'lr': 0.00045514586547180214, 'samples': 15698432, 'steps': 30660, 'loss/train': 1.6773465871810913} +03/05/2022 01:29:55 - INFO - codeparrot_training - Skipping example with length 557 (seq_length=1024) +03/05/2022 01:30:00 - INFO - codeparrot_training - Step 30661: {'lr': 0.0004551428324794385, 'samples': 15698944, 'steps': 30661, 'loss/train': 1.616902470588684} +03/05/2022 01:30:03 - INFO - codeparrot_training - Step 30662: {'lr': 0.00045513979939464056, 'samples': 15699456, 'steps': 30662, 'loss/train': 1.0830869674682617} +03/05/2022 01:30:04 - INFO - codeparrot_training - Skipping example with length 603 (seq_length=1024) +03/05/2022 01:30:09 - INFO - codeparrot_training - Step 30663: {'lr': 0.0004551367662174099, 'samples': 15699968, 'steps': 30663, 'loss/train': 2.3653385639190674} +03/05/2022 01:30:12 - INFO - codeparrot_training - Step 30664: {'lr': 0.0004551337329477477, 'samples': 15700480, 'steps': 30664, 'loss/train': 1.9005095958709717} +03/05/2022 01:30:14 - INFO - codeparrot_training - Skipping example with length 103 (seq_length=1024) +03/05/2022 01:30:17 - INFO - codeparrot_training - Step 30665: {'lr': 0.00045513069958565545, 'samples': 15700992, 'steps': 30665, 'loss/train': 2.3354227542877197} +03/05/2022 01:30:20 - INFO - codeparrot_training - Step 30666: {'lr': 0.00045512766613113457, 'samples': 15701504, 'steps': 30666, 'loss/train': 2.1672818660736084} +03/05/2022 01:30:22 - INFO - codeparrot_training - Skipping example with length 28 (seq_length=1024) +03/05/2022 01:30:26 - INFO - codeparrot_training - Step 30667: {'lr': 0.00045512463258418615, 'samples': 15702016, 'steps': 30667, 'loss/train': 1.9206382036209106} +03/05/2022 01:30:30 - INFO - codeparrot_training - Step 30668: {'lr': 0.00045512159894481183, 'samples': 15702528, 'steps': 30668, 'loss/train': 2.0869898796081543} +03/05/2022 01:30:33 - INFO - codeparrot_training - Step 30669: {'lr': 0.00045511856521301286, 'samples': 15703040, 'steps': 30669, 'loss/train': 2.0879571437835693} +03/05/2022 01:30:35 - INFO - codeparrot_training - Skipping example with length 975 (seq_length=1024) +03/05/2022 01:30:38 - INFO - codeparrot_training - Step 30670: {'lr': 0.0004551155313887906, 'samples': 15703552, 'steps': 30670, 'loss/train': 1.6553771495819092} +03/05/2022 01:30:41 - INFO - codeparrot_training - Step 30671: {'lr': 0.0004551124974721465, 'samples': 15704064, 'steps': 30671, 'loss/train': 2.672435998916626} +03/05/2022 01:30:43 - INFO - codeparrot_training - Skipping example with length 687 (seq_length=1024) +03/05/2022 01:30:47 - INFO - codeparrot_training - Step 30672: {'lr': 0.00045510946346308186, 'samples': 15704576, 'steps': 30672, 'loss/train': 1.914102554321289} +03/05/2022 01:30:50 - INFO - codeparrot_training - Step 30673: {'lr': 0.0004551064293615981, 'samples': 15705088, 'steps': 30673, 'loss/train': 1.2157970666885376} +03/05/2022 01:30:52 - INFO - codeparrot_training - Skipping example with length 336 (seq_length=1024) +03/05/2022 01:30:55 - INFO - codeparrot_training - Step 30674: {'lr': 0.00045510339516769647, 'samples': 15705600, 'steps': 30674, 'loss/train': 1.1249303817749023} +03/05/2022 01:30:58 - INFO - codeparrot_training - Step 30675: {'lr': 0.0004551003608813784, 'samples': 15706112, 'steps': 30675, 'loss/train': 1.545224905014038} +03/05/2022 01:31:00 - INFO - codeparrot_training - Skipping example with length 872 (seq_length=1024) +03/05/2022 01:31:03 - INFO - codeparrot_training - Step 30676: {'lr': 0.00045509732650264535, 'samples': 15706624, 'steps': 30676, 'loss/train': 1.7151719331741333} +03/05/2022 01:31:06 - INFO - codeparrot_training - Step 30677: {'lr': 0.00045509429203149856, 'samples': 15707136, 'steps': 30677, 'loss/train': 1.8859766721725464} +03/05/2022 01:31:08 - INFO - codeparrot_training - Skipping example with length 837 (seq_length=1024) +03/05/2022 01:31:12 - INFO - codeparrot_training - Step 30678: {'lr': 0.00045509125746793946, 'samples': 15707648, 'steps': 30678, 'loss/train': 1.9827067852020264} +03/05/2022 01:31:15 - INFO - codeparrot_training - Step 30679: {'lr': 0.00045508822281196937, 'samples': 15708160, 'steps': 30679, 'loss/train': 2.3717947006225586} +03/05/2022 01:31:16 - INFO - codeparrot_training - Skipping example with length 585 (seq_length=1024) +03/05/2022 01:31:20 - INFO - codeparrot_training - Step 30680: {'lr': 0.0004550851880635898, 'samples': 15708672, 'steps': 30680, 'loss/train': 1.8342174291610718} +03/05/2022 01:31:23 - INFO - codeparrot_training - Step 30681: {'lr': 0.0004550821532228019, 'samples': 15709184, 'steps': 30681, 'loss/train': 1.468177318572998} +03/05/2022 01:31:25 - INFO - codeparrot_training - Skipping example with length 20 (seq_length=1024) +03/05/2022 01:31:29 - INFO - codeparrot_training - Step 30682: {'lr': 0.00045507911828960717, 'samples': 15709696, 'steps': 30682, 'loss/train': 1.5448837280273438} +03/05/2022 01:31:32 - INFO - codeparrot_training - Step 30683: {'lr': 0.000455076083264007, 'samples': 15710208, 'steps': 30683, 'loss/train': 1.6553038358688354} +03/05/2022 01:31:33 - INFO - codeparrot_training - Skipping example with length 621 (seq_length=1024) +03/05/2022 01:31:37 - INFO - codeparrot_training - Step 30684: {'lr': 0.0004550730481460027, 'samples': 15710720, 'steps': 30684, 'loss/train': 1.1296297311782837} +03/05/2022 01:31:40 - INFO - codeparrot_training - Step 30685: {'lr': 0.0004550700129355956, 'samples': 15711232, 'steps': 30685, 'loss/train': 1.7094225883483887} +03/05/2022 01:31:42 - INFO - codeparrot_training - Skipping example with length 371 (seq_length=1024) +03/05/2022 01:31:46 - INFO - codeparrot_training - Step 30686: {'lr': 0.0004550669776327871, 'samples': 15711744, 'steps': 30686, 'loss/train': 1.2141731977462769} +03/05/2022 01:31:49 - INFO - codeparrot_training - Step 30687: {'lr': 0.00045506394223757867, 'samples': 15712256, 'steps': 30687, 'loss/train': 1.1551674604415894} +03/05/2022 01:31:51 - INFO - codeparrot_training - Skipping example with length 712 (seq_length=1024) +03/05/2022 01:31:54 - INFO - codeparrot_training - Step 30688: {'lr': 0.00045506090674997157, 'samples': 15712768, 'steps': 30688, 'loss/train': 2.256469249725342} +03/05/2022 01:31:57 - INFO - codeparrot_training - Step 30689: {'lr': 0.00045505787116996714, 'samples': 15713280, 'steps': 30689, 'loss/train': 1.6092214584350586} +03/05/2022 01:31:59 - INFO - codeparrot_training - Skipping example with length 752 (seq_length=1024) +03/05/2022 01:32:03 - INFO - codeparrot_training - Step 30690: {'lr': 0.0004550548354975669, 'samples': 15713792, 'steps': 30690, 'loss/train': 2.069202184677124} +03/05/2022 01:32:06 - INFO - codeparrot_training - Step 30691: {'lr': 0.000455051799732772, 'samples': 15714304, 'steps': 30691, 'loss/train': 1.7116682529449463} +03/05/2022 01:32:08 - INFO - codeparrot_training - Skipping example with length 909 (seq_length=1024) +03/05/2022 01:32:11 - INFO - codeparrot_training - Step 30692: {'lr': 0.000455048763875584, 'samples': 15714816, 'steps': 30692, 'loss/train': 1.3455792665481567} +03/05/2022 01:32:14 - INFO - codeparrot_training - Step 30693: {'lr': 0.00045504572792600415, 'samples': 15715328, 'steps': 30693, 'loss/train': 1.4055207967758179} +03/05/2022 01:32:16 - INFO - codeparrot_training - Skipping example with length 774 (seq_length=1024) +03/05/2022 01:32:19 - INFO - codeparrot_training - Step 30694: {'lr': 0.00045504269188403386, 'samples': 15715840, 'steps': 30694, 'loss/train': 2.097240924835205} +03/05/2022 01:32:23 - INFO - codeparrot_training - Step 30695: {'lr': 0.00045503965574967447, 'samples': 15716352, 'steps': 30695, 'loss/train': 1.2251014709472656} +03/05/2022 01:32:24 - INFO - codeparrot_training - Skipping example with length 991 (seq_length=1024) +03/05/2022 01:32:28 - INFO - codeparrot_training - Step 30696: {'lr': 0.0004550366195229274, 'samples': 15716864, 'steps': 30696, 'loss/train': 1.4036637544631958} +03/05/2022 01:32:31 - INFO - codeparrot_training - Step 30697: {'lr': 0.00045503358320379405, 'samples': 15717376, 'steps': 30697, 'loss/train': 0.11962788552045822} +03/05/2022 01:32:33 - INFO - codeparrot_training - Skipping example with length 1020 (seq_length=1024) +03/05/2022 01:32:36 - INFO - codeparrot_training - Step 30698: {'lr': 0.00045503054679227567, 'samples': 15717888, 'steps': 30698, 'loss/train': 1.3659809827804565} +03/05/2022 01:32:39 - INFO - codeparrot_training - Step 30699: {'lr': 0.00045502751028837367, 'samples': 15718400, 'steps': 30699, 'loss/train': 1.77561616897583} +03/05/2022 01:32:41 - INFO - codeparrot_training - Skipping example with length 129 (seq_length=1024) +03/05/2022 01:32:44 - INFO - codeparrot_training - Step 30700: {'lr': 0.00045502447369208957, 'samples': 15718912, 'steps': 30700, 'loss/train': 1.814879298210144} +03/05/2022 01:32:48 - INFO - codeparrot_training - Step 30701: {'lr': 0.00045502143700342445, 'samples': 15719424, 'steps': 30701, 'loss/train': 1.8131507635116577} +03/05/2022 01:32:49 - INFO - codeparrot_training - Skipping example with length 949 (seq_length=1024) +03/05/2022 01:32:53 - INFO - codeparrot_training - Step 30702: {'lr': 0.0004550184002223799, 'samples': 15719936, 'steps': 30702, 'loss/train': 1.9509031772613525} +03/05/2022 01:32:56 - INFO - codeparrot_training - Step 30703: {'lr': 0.0004550153633489572, 'samples': 15720448, 'steps': 30703, 'loss/train': 1.8368234634399414} +03/05/2022 01:32:57 - INFO - codeparrot_training - Skipping example with length 46 (seq_length=1024) +03/05/2022 01:33:01 - INFO - codeparrot_training - Step 30704: {'lr': 0.0004550123263831578, 'samples': 15720960, 'steps': 30704, 'loss/train': 2.391666889190674} +03/05/2022 01:33:05 - INFO - codeparrot_training - Step 30705: {'lr': 0.0004550092893249829, 'samples': 15721472, 'steps': 30705, 'loss/train': 1.7643426656723022} +03/05/2022 01:33:05 - INFO - codeparrot_training - Skipping example with length 177 (seq_length=1024) +03/05/2022 01:33:10 - INFO - codeparrot_training - Step 30706: {'lr': 0.00045500625217443404, 'samples': 15721984, 'steps': 30706, 'loss/train': 1.8344625234603882} +03/05/2022 01:33:13 - INFO - codeparrot_training - Step 30707: {'lr': 0.0004550032149315125, 'samples': 15722496, 'steps': 30707, 'loss/train': 2.1288981437683105} +03/05/2022 01:33:13 - INFO - codeparrot_training - Skipping example with length 936 (seq_length=1024) +03/05/2022 01:33:18 - INFO - codeparrot_training - Step 30708: {'lr': 0.00045500017759621974, 'samples': 15723008, 'steps': 30708, 'loss/train': 1.791182041168213} +03/05/2022 01:33:21 - INFO - codeparrot_training - Step 30709: {'lr': 0.00045499714016855705, 'samples': 15723520, 'steps': 30709, 'loss/train': 1.3242042064666748} +03/05/2022 01:33:22 - INFO - codeparrot_training - Skipping example with length 162 (seq_length=1024) +03/05/2022 01:33:27 - INFO - codeparrot_training - Step 30710: {'lr': 0.0004549941026485258, 'samples': 15724032, 'steps': 30710, 'loss/train': 2.5675158500671387} +03/05/2022 01:33:30 - INFO - codeparrot_training - Step 30711: {'lr': 0.00045499106503612733, 'samples': 15724544, 'steps': 30711, 'loss/train': 1.8594111204147339} +03/05/2022 01:33:30 - INFO - codeparrot_training - Skipping example with length 14 (seq_length=1024) +03/05/2022 01:33:35 - INFO - codeparrot_training - Step 30712: {'lr': 0.00045498802733136306, 'samples': 15725056, 'steps': 30712, 'loss/train': 1.6014914512634277} +03/05/2022 01:33:38 - INFO - codeparrot_training - Step 30713: {'lr': 0.0004549849895342344, 'samples': 15725568, 'steps': 30713, 'loss/train': 1.6373192071914673} +03/05/2022 01:33:39 - INFO - codeparrot_training - Skipping example with length 70 (seq_length=1024) +03/05/2022 01:33:43 - INFO - codeparrot_training - Step 30714: {'lr': 0.00045498195164474264, 'samples': 15726080, 'steps': 30714, 'loss/train': 2.4185588359832764} +03/05/2022 01:33:47 - INFO - codeparrot_training - Step 30715: {'lr': 0.00045497891366288914, 'samples': 15726592, 'steps': 30715, 'loss/train': 2.04469895362854} +03/05/2022 01:33:47 - INFO - codeparrot_training - Skipping example with length 148 (seq_length=1024) +03/05/2022 01:33:52 - INFO - codeparrot_training - Step 30716: {'lr': 0.0004549758755886754, 'samples': 15727104, 'steps': 30716, 'loss/train': 2.1772382259368896} +03/05/2022 01:33:55 - INFO - codeparrot_training - Step 30717: {'lr': 0.00045497283742210263, 'samples': 15727616, 'steps': 30717, 'loss/train': 1.9544272422790527} +03/05/2022 01:33:55 - INFO - codeparrot_training - Skipping example with length 445 (seq_length=1024) +03/05/2022 01:34:00 - INFO - codeparrot_training - Step 30718: {'lr': 0.0004549697991631722, 'samples': 15728128, 'steps': 30718, 'loss/train': 1.6482875347137451} +03/05/2022 01:34:03 - INFO - codeparrot_training - Step 30719: {'lr': 0.0004549667608118856, 'samples': 15728640, 'steps': 30719, 'loss/train': 1.7668979167938232} +03/05/2022 01:34:04 - INFO - codeparrot_training - Skipping example with length 908 (seq_length=1024) +03/05/2022 01:34:09 - INFO - codeparrot_training - Step 30720: {'lr': 0.0004549637223682441, 'samples': 15729152, 'steps': 30720, 'loss/train': 1.7266249656677246} +03/05/2022 01:34:12 - INFO - codeparrot_training - Step 30721: {'lr': 0.0004549606838322492, 'samples': 15729664, 'steps': 30721, 'loss/train': 2.2422211170196533} +03/05/2022 01:34:12 - INFO - codeparrot_training - Skipping example with length 489 (seq_length=1024) +03/05/2022 01:34:17 - INFO - codeparrot_training - Step 30722: {'lr': 0.00045495764520390216, 'samples': 15730176, 'steps': 30722, 'loss/train': 1.8698594570159912} +03/05/2022 01:34:20 - INFO - codeparrot_training - Step 30723: {'lr': 0.0004549546064832043, 'samples': 15730688, 'steps': 30723, 'loss/train': 1.5902607440948486} +03/05/2022 01:34:20 - INFO - codeparrot_training - Skipping example with length 140 (seq_length=1024) +03/05/2022 01:34:25 - INFO - codeparrot_training - Step 30724: {'lr': 0.0004549515676701571, 'samples': 15731200, 'steps': 30724, 'loss/train': 1.7164030075073242} +03/05/2022 01:34:29 - INFO - codeparrot_training - Step 30725: {'lr': 0.0004549485287647619, 'samples': 15731712, 'steps': 30725, 'loss/train': 1.4147449731826782} +03/05/2022 01:34:29 - INFO - codeparrot_training - Skipping example with length 628 (seq_length=1024) +03/05/2022 01:34:34 - INFO - codeparrot_training - Step 30726: {'lr': 0.00045494548976702, 'samples': 15732224, 'steps': 30726, 'loss/train': 1.250527262687683} +03/05/2022 01:34:37 - INFO - codeparrot_training - Skipping example with length 369 (seq_length=1024) +03/05/2022 01:34:39 - INFO - codeparrot_training - Step 30727: {'lr': 0.0004549424506769329, 'samples': 15732736, 'steps': 30727, 'loss/train': 1.1734340190887451} +03/05/2022 01:34:42 - INFO - codeparrot_training - Step 30728: {'lr': 0.00045493941149450185, 'samples': 15733248, 'steps': 30728, 'loss/train': 1.4060382843017578} +03/05/2022 01:34:45 - INFO - codeparrot_training - Skipping example with length 777 (seq_length=1024) +03/05/2022 01:34:48 - INFO - codeparrot_training - Step 30729: {'lr': 0.00045493637221972826, 'samples': 15733760, 'steps': 30729, 'loss/train': 1.8554925918579102} +03/05/2022 01:34:51 - INFO - codeparrot_training - Step 30730: {'lr': 0.0004549333328526135, 'samples': 15734272, 'steps': 30730, 'loss/train': 2.0124828815460205} +03/05/2022 01:34:53 - INFO - codeparrot_training - Skipping example with length 852 (seq_length=1024) +03/05/2022 01:34:56 - INFO - codeparrot_training - Step 30731: {'lr': 0.0004549302933931589, 'samples': 15734784, 'steps': 30731, 'loss/train': 1.2990275621414185} +03/05/2022 01:34:59 - INFO - codeparrot_training - Step 30732: {'lr': 0.000454927253841366, 'samples': 15735296, 'steps': 30732, 'loss/train': 0.2546718716621399} +03/05/2022 01:35:01 - INFO - codeparrot_training - Skipping example with length 723 (seq_length=1024) +03/05/2022 01:35:05 - INFO - codeparrot_training - Step 30733: {'lr': 0.00045492421419723595, 'samples': 15735808, 'steps': 30733, 'loss/train': 2.787313222885132} +03/05/2022 01:35:08 - INFO - codeparrot_training - Step 30734: {'lr': 0.00045492117446077027, 'samples': 15736320, 'steps': 30734, 'loss/train': 1.8052736520767212} +03/05/2022 01:35:10 - INFO - codeparrot_training - Skipping example with length 719 (seq_length=1024) +03/05/2022 01:35:13 - INFO - codeparrot_training - Step 30735: {'lr': 0.0004549181346319702, 'samples': 15736832, 'steps': 30735, 'loss/train': 1.6567161083221436} +03/05/2022 01:35:16 - INFO - codeparrot_training - Step 30736: {'lr': 0.00045491509471083717, 'samples': 15737344, 'steps': 30736, 'loss/train': 1.5889817476272583} +03/05/2022 01:35:18 - INFO - codeparrot_training - Skipping example with length 419 (seq_length=1024) +03/05/2022 01:35:22 - INFO - codeparrot_training - Step 30737: {'lr': 0.00045491205469737263, 'samples': 15737856, 'steps': 30737, 'loss/train': 1.2483335733413696} +03/05/2022 01:35:25 - INFO - codeparrot_training - Step 30738: {'lr': 0.00045490901459157787, 'samples': 15738368, 'steps': 30738, 'loss/train': 1.6420953273773193} +03/05/2022 01:35:26 - INFO - codeparrot_training - Skipping example with length 63 (seq_length=1024) +03/05/2022 01:35:30 - INFO - codeparrot_training - Step 30739: {'lr': 0.0004549059743934543, 'samples': 15738880, 'steps': 30739, 'loss/train': 2.5171022415161133} +03/05/2022 01:35:33 - INFO - codeparrot_training - Step 30740: {'lr': 0.00045490293410300315, 'samples': 15739392, 'steps': 30740, 'loss/train': 1.0917596817016602} +03/05/2022 01:35:35 - INFO - codeparrot_training - Skipping example with length 799 (seq_length=1024) +03/05/2022 01:35:38 - INFO - codeparrot_training - Step 30741: {'lr': 0.000454899893720226, 'samples': 15739904, 'steps': 30741, 'loss/train': 1.8663716316223145} +03/05/2022 01:35:41 - INFO - codeparrot_training - Step 30742: {'lr': 0.000454896853245124, 'samples': 15740416, 'steps': 30742, 'loss/train': 1.6075266599655151} +03/05/2022 01:35:43 - INFO - codeparrot_training - Skipping example with length 268 (seq_length=1024) +03/05/2022 01:35:47 - INFO - codeparrot_training - Step 30743: {'lr': 0.00045489381267769873, 'samples': 15740928, 'steps': 30743, 'loss/train': 1.824425458908081} +03/05/2022 01:35:50 - INFO - codeparrot_training - Step 30744: {'lr': 0.00045489077201795147, 'samples': 15741440, 'steps': 30744, 'loss/train': 1.8720935583114624} +03/05/2022 01:35:51 - INFO - codeparrot_training - Skipping example with length 936 (seq_length=1024) +03/05/2022 01:35:55 - INFO - codeparrot_training - Step 30745: {'lr': 0.0004548877312658836, 'samples': 15741952, 'steps': 30745, 'loss/train': 1.1346352100372314} +03/05/2022 01:35:58 - INFO - codeparrot_training - Step 30746: {'lr': 0.0004548846904214964, 'samples': 15742464, 'steps': 30746, 'loss/train': 2.5220839977264404} +03/05/2022 01:36:00 - INFO - codeparrot_training - Skipping example with length 519 (seq_length=1024) +03/05/2022 01:36:04 - INFO - codeparrot_training - Step 30747: {'lr': 0.00045488164948479144, 'samples': 15742976, 'steps': 30747, 'loss/train': 2.026585102081299} +03/05/2022 01:36:07 - INFO - codeparrot_training - Step 30748: {'lr': 0.0004548786084557699, 'samples': 15743488, 'steps': 30748, 'loss/train': 1.0012116432189941} +03/05/2022 01:36:09 - INFO - codeparrot_training - Skipping example with length 298 (seq_length=1024) +03/05/2022 01:36:12 - INFO - codeparrot_training - Step 30749: {'lr': 0.00045487556733443327, 'samples': 15744000, 'steps': 30749, 'loss/train': 1.69420325756073} +03/05/2022 01:36:15 - INFO - codeparrot_training - Step 30750: {'lr': 0.0004548725261207828, 'samples': 15744512, 'steps': 30750, 'loss/train': 1.476548671722412} +03/05/2022 01:36:17 - INFO - codeparrot_training - Skipping example with length 816 (seq_length=1024) +03/05/2022 01:36:21 - INFO - codeparrot_training - Step 30751: {'lr': 0.0004548694848148199, 'samples': 15745024, 'steps': 30751, 'loss/train': 1.6244127750396729} +03/05/2022 01:36:24 - INFO - codeparrot_training - Step 30752: {'lr': 0.0004548664434165461, 'samples': 15745536, 'steps': 30752, 'loss/train': 2.8528285026550293} +03/05/2022 01:36:26 - INFO - codeparrot_training - Skipping example with length 807 (seq_length=1024) +03/05/2022 01:36:29 - INFO - codeparrot_training - Step 30753: {'lr': 0.0004548634019259625, 'samples': 15746048, 'steps': 30753, 'loss/train': 1.7841558456420898} +03/05/2022 01:36:32 - INFO - codeparrot_training - Step 30754: {'lr': 0.0004548603603430708, 'samples': 15746560, 'steps': 30754, 'loss/train': 4.050764083862305} +03/05/2022 01:36:34 - INFO - codeparrot_training - Skipping example with length 389 (seq_length=1024) +03/05/2022 01:36:38 - INFO - codeparrot_training - Step 30755: {'lr': 0.00045485731866787206, 'samples': 15747072, 'steps': 30755, 'loss/train': 1.7684123516082764} +03/05/2022 01:36:41 - INFO - codeparrot_training - Step 30756: {'lr': 0.00045485427690036774, 'samples': 15747584, 'steps': 30756, 'loss/train': 0.7266432642936707} +03/05/2022 01:36:43 - INFO - codeparrot_training - Skipping example with length 368 (seq_length=1024) +03/05/2022 01:36:46 - INFO - codeparrot_training - Step 30757: {'lr': 0.0004548512350405593, 'samples': 15748096, 'steps': 30757, 'loss/train': 2.1709625720977783} +03/05/2022 01:36:49 - INFO - codeparrot_training - Step 30758: {'lr': 0.00045484819308844806, 'samples': 15748608, 'steps': 30758, 'loss/train': 1.403503179550171} +03/05/2022 01:36:51 - INFO - codeparrot_training - Skipping example with length 589 (seq_length=1024) +03/05/2022 01:36:54 - INFO - codeparrot_training - Step 30759: {'lr': 0.00045484515104403535, 'samples': 15749120, 'steps': 30759, 'loss/train': 2.087512969970703} +03/05/2022 01:36:57 - INFO - codeparrot_training - Step 30760: {'lr': 0.00045484210890732257, 'samples': 15749632, 'steps': 30760, 'loss/train': 2.247074842453003} +03/05/2022 01:36:59 - INFO - codeparrot_training - Skipping example with length 469 (seq_length=1024) +03/05/2022 01:37:03 - INFO - codeparrot_training - Step 30761: {'lr': 0.0004548390666783111, 'samples': 15750144, 'steps': 30761, 'loss/train': 1.4539896249771118} +03/05/2022 01:37:06 - INFO - codeparrot_training - Step 30762: {'lr': 0.00045483602435700233, 'samples': 15750656, 'steps': 30762, 'loss/train': 1.6335994005203247} +03/05/2022 01:37:07 - INFO - codeparrot_training - Skipping example with length 840 (seq_length=1024) +03/05/2022 01:37:11 - INFO - codeparrot_training - Step 30763: {'lr': 0.0004548329819433976, 'samples': 15751168, 'steps': 30763, 'loss/train': 2.28214955329895} +03/05/2022 01:37:14 - INFO - codeparrot_training - Step 30764: {'lr': 0.00045482993943749835, 'samples': 15751680, 'steps': 30764, 'loss/train': 0.16114500164985657} +03/05/2022 01:37:16 - INFO - codeparrot_training - Skipping example with length 902 (seq_length=1024) +03/05/2022 01:37:20 - INFO - codeparrot_training - Step 30765: {'lr': 0.0004548268968393058, 'samples': 15752192, 'steps': 30765, 'loss/train': 1.8494385480880737} +03/05/2022 01:37:23 - INFO - codeparrot_training - Step 30766: {'lr': 0.0004548238541488214, 'samples': 15752704, 'steps': 30766, 'loss/train': 2.242034673690796} +03/05/2022 01:37:24 - INFO - codeparrot_training - Skipping example with length 813 (seq_length=1024) +03/05/2022 01:37:28 - INFO - codeparrot_training - Step 30767: {'lr': 0.00045482081136604665, 'samples': 15753216, 'steps': 30767, 'loss/train': 1.715653657913208} +03/05/2022 01:37:31 - INFO - codeparrot_training - Step 30768: {'lr': 0.0004548177684909827, 'samples': 15753728, 'steps': 30768, 'loss/train': 1.5245997905731201} +03/05/2022 01:37:33 - INFO - codeparrot_training - Skipping example with length 30 (seq_length=1024) +03/05/2022 01:37:37 - INFO - codeparrot_training - Step 30769: {'lr': 0.0004548147255236311, 'samples': 15754240, 'steps': 30769, 'loss/train': 1.3396127223968506} +03/05/2022 01:37:40 - INFO - codeparrot_training - Step 30770: {'lr': 0.0004548116824639931, 'samples': 15754752, 'steps': 30770, 'loss/train': 1.587066888809204} +03/05/2022 01:37:41 - INFO - codeparrot_training - Skipping example with length 166 (seq_length=1024) +03/05/2022 01:37:45 - INFO - codeparrot_training - Step 30771: {'lr': 0.00045480863931207004, 'samples': 15755264, 'steps': 30771, 'loss/train': 1.6513841152191162} +03/05/2022 01:37:48 - INFO - codeparrot_training - Step 30772: {'lr': 0.0004548055960678635, 'samples': 15755776, 'steps': 30772, 'loss/train': 2.532830238342285} +03/05/2022 01:37:49 - INFO - codeparrot_training - Skipping example with length 419 (seq_length=1024) +03/05/2022 01:37:54 - INFO - codeparrot_training - Step 30773: {'lr': 0.0004548025527313746, 'samples': 15756288, 'steps': 30773, 'loss/train': 1.7222899198532104} +03/05/2022 01:37:57 - INFO - codeparrot_training - Step 30774: {'lr': 0.00045479950930260495, 'samples': 15756800, 'steps': 30774, 'loss/train': 1.7327982187271118} +03/05/2022 01:38:00 - INFO - codeparrot_training - Skipping example with length 61 (seq_length=1024) +03/05/2022 01:38:03 - INFO - codeparrot_training - Step 30775: {'lr': 0.0004547964657815558, 'samples': 15757312, 'steps': 30775, 'loss/train': 1.6850329637527466} +03/05/2022 01:38:06 - INFO - codeparrot_training - Step 30776: {'lr': 0.0004547934221682284, 'samples': 15757824, 'steps': 30776, 'loss/train': 2.104546546936035} +03/05/2022 01:38:08 - INFO - codeparrot_training - Skipping example with length 54 (seq_length=1024) +03/05/2022 01:38:11 - INFO - codeparrot_training - Step 30777: {'lr': 0.00045479037846262436, 'samples': 15758336, 'steps': 30777, 'loss/train': 1.4078751802444458} +03/05/2022 01:38:14 - INFO - codeparrot_training - Step 30778: {'lr': 0.00045478733466474487, 'samples': 15758848, 'steps': 30778, 'loss/train': 1.4667441844940186} +03/05/2022 01:38:17 - INFO - codeparrot_training - Skipping example with length 760 (seq_length=1024) +03/05/2022 01:38:20 - INFO - codeparrot_training - Step 30779: {'lr': 0.0004547842907745914, 'samples': 15759360, 'steps': 30779, 'loss/train': 1.3903471231460571} +03/05/2022 01:38:23 - INFO - codeparrot_training - Step 30780: {'lr': 0.00045478124679216523, 'samples': 15759872, 'steps': 30780, 'loss/train': 2.5658891201019287} +03/05/2022 01:38:25 - INFO - codeparrot_training - Skipping example with length 967 (seq_length=1024) +03/05/2022 01:38:28 - INFO - codeparrot_training - Step 30781: {'lr': 0.00045477820271746784, 'samples': 15760384, 'steps': 30781, 'loss/train': 1.8569996356964111} +03/05/2022 01:38:31 - INFO - codeparrot_training - Step 30782: {'lr': 0.00045477515855050056, 'samples': 15760896, 'steps': 30782, 'loss/train': 1.5852731466293335} +03/05/2022 01:38:33 - INFO - codeparrot_training - Skipping example with length 127 (seq_length=1024) +03/05/2022 01:38:36 - INFO - codeparrot_training - Step 30783: {'lr': 0.0004547721142912647, 'samples': 15761408, 'steps': 30783, 'loss/train': 1.8996022939682007} +03/05/2022 01:38:39 - INFO - codeparrot_training - Step 30784: {'lr': 0.00045476906993976177, 'samples': 15761920, 'steps': 30784, 'loss/train': 2.065929651260376} +03/05/2022 01:38:41 - INFO - codeparrot_training - Skipping example with length 166 (seq_length=1024) +03/05/2022 01:38:45 - INFO - codeparrot_training - Step 30785: {'lr': 0.000454766025495993, 'samples': 15762432, 'steps': 30785, 'loss/train': 2.305896043777466} +03/05/2022 01:38:49 - INFO - codeparrot_training - Step 30786: {'lr': 0.00045476298095995985, 'samples': 15762944, 'steps': 30786, 'loss/train': 1.1659975051879883} +03/05/2022 01:38:52 - INFO - codeparrot_training - Step 30787: {'lr': 0.00045475993633166357, 'samples': 15763456, 'steps': 30787, 'loss/train': 1.3043948411941528} +03/05/2022 01:38:53 - INFO - codeparrot_training - Skipping example with length 479 (seq_length=1024) +03/05/2022 01:38:57 - INFO - codeparrot_training - Step 30788: {'lr': 0.00045475689161110565, 'samples': 15763968, 'steps': 30788, 'loss/train': 2.368839979171753} +03/05/2022 01:39:00 - INFO - codeparrot_training - Step 30789: {'lr': 0.0004547538467982876, 'samples': 15764480, 'steps': 30789, 'loss/train': 2.1915481090545654} +03/05/2022 01:39:01 - INFO - codeparrot_training - Skipping example with length 255 (seq_length=1024) +03/05/2022 01:39:05 - INFO - codeparrot_training - Step 30790: {'lr': 0.00045475080189321044, 'samples': 15764992, 'steps': 30790, 'loss/train': 1.7539169788360596} +03/05/2022 01:39:08 - INFO - codeparrot_training - Step 30791: {'lr': 0.00045474775689587576, 'samples': 15765504, 'steps': 30791, 'loss/train': 1.6622904539108276} +03/05/2022 01:39:10 - INFO - codeparrot_training - Skipping example with length 684 (seq_length=1024) +03/05/2022 01:39:14 - INFO - codeparrot_training - Step 30792: {'lr': 0.00045474471180628496, 'samples': 15766016, 'steps': 30792, 'loss/train': 1.3842405080795288} +03/05/2022 01:39:17 - INFO - codeparrot_training - Step 30793: {'lr': 0.0004547416666244393, 'samples': 15766528, 'steps': 30793, 'loss/train': 2.1315224170684814} +03/05/2022 01:39:18 - INFO - codeparrot_training - Skipping example with length 31 (seq_length=1024) +03/05/2022 01:39:22 - INFO - codeparrot_training - Step 30794: {'lr': 0.00045473862135034026, 'samples': 15767040, 'steps': 30794, 'loss/train': 1.0336943864822388} +03/05/2022 01:39:25 - INFO - codeparrot_training - Step 30795: {'lr': 0.0004547355759839891, 'samples': 15767552, 'steps': 30795, 'loss/train': 2.08406662940979} +03/05/2022 01:39:27 - INFO - codeparrot_training - Skipping example with length 601 (seq_length=1024) +03/05/2022 01:39:31 - INFO - codeparrot_training - Step 30796: {'lr': 0.00045473253052538725, 'samples': 15768064, 'steps': 30796, 'loss/train': 2.0980448722839355} +03/05/2022 01:39:34 - INFO - codeparrot_training - Step 30797: {'lr': 0.00045472948497453613, 'samples': 15768576, 'steps': 30797, 'loss/train': 1.688066005706787} +03/05/2022 01:39:35 - INFO - codeparrot_training - Skipping example with length 237 (seq_length=1024) +03/05/2022 01:39:39 - INFO - codeparrot_training - Step 30798: {'lr': 0.00045472643933143703, 'samples': 15769088, 'steps': 30798, 'loss/train': 1.7532328367233276} +03/05/2022 01:39:42 - INFO - codeparrot_training - Step 30799: {'lr': 0.0004547233935960914, 'samples': 15769600, 'steps': 30799, 'loss/train': 0.9880354404449463} +03/05/2022 01:39:43 - INFO - codeparrot_training - Skipping example with length 694 (seq_length=1024) +03/05/2022 01:39:48 - INFO - codeparrot_training - Step 30800: {'lr': 0.00045472034776850045, 'samples': 15770112, 'steps': 30800, 'loss/train': 1.9037271738052368} +03/05/2022 01:39:51 - INFO - codeparrot_training - Step 30801: {'lr': 0.0004547173018486658, 'samples': 15770624, 'steps': 30801, 'loss/train': 1.7513142824172974} +03/05/2022 01:39:52 - INFO - codeparrot_training - Skipping example with length 936 (seq_length=1024) +03/05/2022 01:39:56 - INFO - codeparrot_training - Step 30802: {'lr': 0.0004547142558365887, 'samples': 15771136, 'steps': 30802, 'loss/train': 1.4180409908294678} +03/05/2022 01:39:59 - INFO - codeparrot_training - Step 30803: {'lr': 0.0004547112097322704, 'samples': 15771648, 'steps': 30803, 'loss/train': 2.2047057151794434} +03/05/2022 01:40:00 - INFO - codeparrot_training - Skipping example with length 712 (seq_length=1024) +03/05/2022 01:40:04 - INFO - codeparrot_training - Step 30804: {'lr': 0.00045470816353571244, 'samples': 15772160, 'steps': 30804, 'loss/train': 2.505270004272461} +03/05/2022 01:40:07 - INFO - codeparrot_training - Step 30805: {'lr': 0.00045470511724691613, 'samples': 15772672, 'steps': 30805, 'loss/train': 2.587362289428711} +03/05/2022 01:40:08 - INFO - codeparrot_training - Skipping example with length 66 (seq_length=1024) +03/05/2022 01:40:13 - INFO - codeparrot_training - Step 30806: {'lr': 0.0004547020708658829, 'samples': 15773184, 'steps': 30806, 'loss/train': 1.6315616369247437} +03/05/2022 01:40:16 - INFO - codeparrot_training - Step 30807: {'lr': 0.000454699024392614, 'samples': 15773696, 'steps': 30807, 'loss/train': 0.7758349776268005} +03/05/2022 01:40:16 - INFO - codeparrot_training - Skipping example with length 518 (seq_length=1024) +03/05/2022 01:40:21 - INFO - codeparrot_training - Step 30808: {'lr': 0.0004546959778271109, 'samples': 15774208, 'steps': 30808, 'loss/train': 2.0164811611175537} +03/05/2022 01:40:24 - INFO - codeparrot_training - Step 30809: {'lr': 0.00045469293116937504, 'samples': 15774720, 'steps': 30809, 'loss/train': 0.0774369165301323} +03/05/2022 01:40:24 - INFO - codeparrot_training - Skipping example with length 932 (seq_length=1024) +03/05/2022 01:40:30 - INFO - codeparrot_training - Step 30810: {'lr': 0.0004546898844194076, 'samples': 15775232, 'steps': 30810, 'loss/train': 1.8789349794387817} +03/05/2022 01:40:33 - INFO - codeparrot_training - Step 30811: {'lr': 0.00045468683757721005, 'samples': 15775744, 'steps': 30811, 'loss/train': 1.7523642778396606} +03/05/2022 01:40:33 - INFO - codeparrot_training - Skipping example with length 897 (seq_length=1024) +03/05/2022 01:40:38 - INFO - codeparrot_training - Step 30812: {'lr': 0.0004546837906427839, 'samples': 15776256, 'steps': 30812, 'loss/train': 2.1858878135681152} +03/05/2022 01:40:41 - INFO - codeparrot_training - Step 30813: {'lr': 0.00045468074361613026, 'samples': 15776768, 'steps': 30813, 'loss/train': 2.0944786071777344} +03/05/2022 01:40:41 - INFO - codeparrot_training - Skipping example with length 874 (seq_length=1024) +03/05/2022 01:40:47 - INFO - codeparrot_training - Step 30814: {'lr': 0.0004546776964972507, 'samples': 15777280, 'steps': 30814, 'loss/train': 2.180429697036743} +03/05/2022 01:40:50 - INFO - codeparrot_training - Step 30815: {'lr': 0.00045467464928614657, 'samples': 15777792, 'steps': 30815, 'loss/train': 2.359980821609497} +03/05/2022 01:40:50 - INFO - codeparrot_training - Skipping example with length 111 (seq_length=1024) +03/05/2022 01:40:55 - INFO - codeparrot_training - Step 30816: {'lr': 0.0004546716019828191, 'samples': 15778304, 'steps': 30816, 'loss/train': 1.452144980430603} +03/05/2022 01:40:58 - INFO - codeparrot_training - Step 30817: {'lr': 0.00045466855458726975, 'samples': 15778816, 'steps': 30817, 'loss/train': 0.07422531396150589} +03/05/2022 01:40:58 - INFO - codeparrot_training - Skipping example with length 455 (seq_length=1024) +03/05/2022 01:41:04 - INFO - codeparrot_training - Step 30818: {'lr': 0.0004546655070995, 'samples': 15779328, 'steps': 30818, 'loss/train': 0.13780811429023743} +03/05/2022 01:41:07 - INFO - codeparrot_training - Step 30819: {'lr': 0.0004546624595195111, 'samples': 15779840, 'steps': 30819, 'loss/train': 1.803411602973938} +03/05/2022 01:41:07 - INFO - codeparrot_training - Skipping example with length 533 (seq_length=1024) +03/05/2022 01:41:12 - INFO - codeparrot_training - Step 30820: {'lr': 0.0004546594118473044, 'samples': 15780352, 'steps': 30820, 'loss/train': 2.544556140899658} +03/05/2022 01:41:15 - INFO - codeparrot_training - Step 30821: {'lr': 0.0004546563640828814, 'samples': 15780864, 'steps': 30821, 'loss/train': 2.0499353408813477} +03/05/2022 01:41:15 - INFO - codeparrot_training - Skipping example with length 610 (seq_length=1024) +03/05/2022 01:41:21 - INFO - codeparrot_training - Step 30822: {'lr': 0.0004546533162262434, 'samples': 15781376, 'steps': 30822, 'loss/train': 2.396827220916748} +03/05/2022 01:41:24 - INFO - codeparrot_training - Step 30823: {'lr': 0.00045465026827739175, 'samples': 15781888, 'steps': 30823, 'loss/train': 1.6210488080978394} +03/05/2022 01:41:24 - INFO - codeparrot_training - Skipping example with length 908 (seq_length=1024) +03/05/2022 01:41:29 - INFO - codeparrot_training - Step 30824: {'lr': 0.00045464722023632784, 'samples': 15782400, 'steps': 30824, 'loss/train': 1.2770367860794067} +03/05/2022 01:41:32 - INFO - codeparrot_training - Skipping example with length 38 (seq_length=1024) +03/05/2022 01:41:35 - INFO - codeparrot_training - Step 30825: {'lr': 0.00045464417210305303, 'samples': 15782912, 'steps': 30825, 'loss/train': 1.3899425268173218} +03/05/2022 01:41:38 - INFO - codeparrot_training - Step 30826: {'lr': 0.0004546411238775687, 'samples': 15783424, 'steps': 30826, 'loss/train': 2.4950389862060547} +03/05/2022 01:41:40 - INFO - codeparrot_training - Skipping example with length 728 (seq_length=1024) +03/05/2022 01:41:43 - INFO - codeparrot_training - Step 30827: {'lr': 0.00045463807555987633, 'samples': 15783936, 'steps': 30827, 'loss/train': 1.692447543144226} +03/05/2022 01:41:46 - INFO - codeparrot_training - Step 30828: {'lr': 0.0004546350271499772, 'samples': 15784448, 'steps': 30828, 'loss/train': 1.7099703550338745} +03/05/2022 01:41:49 - INFO - codeparrot_training - Skipping example with length 480 (seq_length=1024) +03/05/2022 01:41:52 - INFO - codeparrot_training - Step 30829: {'lr': 0.0004546319786478726, 'samples': 15784960, 'steps': 30829, 'loss/train': 0.6490452885627747} +03/05/2022 01:41:55 - INFO - codeparrot_training - Step 30830: {'lr': 0.000454628930053564, 'samples': 15785472, 'steps': 30830, 'loss/train': 0.9680806398391724} +03/05/2022 01:41:57 - INFO - codeparrot_training - Skipping example with length 704 (seq_length=1024) +03/05/2022 01:42:00 - INFO - codeparrot_training - Step 30831: {'lr': 0.0004546258813670528, 'samples': 15785984, 'steps': 30831, 'loss/train': 2.004863739013672} +03/05/2022 01:42:03 - INFO - codeparrot_training - Step 30832: {'lr': 0.0004546228325883403, 'samples': 15786496, 'steps': 30832, 'loss/train': 0.37108874320983887} +03/05/2022 01:42:06 - INFO - codeparrot_training - Skipping example with length 585 (seq_length=1024) +03/05/2022 01:42:08 - INFO - codeparrot_training - Step 30833: {'lr': 0.00045461978371742794, 'samples': 15787008, 'steps': 30833, 'loss/train': 1.5389811992645264} +03/05/2022 01:42:12 - INFO - codeparrot_training - Step 30834: {'lr': 0.00045461673475431704, 'samples': 15787520, 'steps': 30834, 'loss/train': 1.280617594718933} +03/05/2022 01:42:14 - INFO - codeparrot_training - Skipping example with length 717 (seq_length=1024) +03/05/2022 01:42:17 - INFO - codeparrot_training - Step 30835: {'lr': 0.000454613685699009, 'samples': 15788032, 'steps': 30835, 'loss/train': 2.5214040279388428} +03/05/2022 01:42:20 - INFO - codeparrot_training - Step 30836: {'lr': 0.0004546106365515052, 'samples': 15788544, 'steps': 30836, 'loss/train': 1.7270100116729736} +03/05/2022 01:42:22 - INFO - codeparrot_training - Skipping example with length 910 (seq_length=1024) +03/05/2022 01:42:25 - INFO - codeparrot_training - Step 30837: {'lr': 0.000454607587311807, 'samples': 15789056, 'steps': 30837, 'loss/train': 2.416752338409424} +03/05/2022 01:42:29 - INFO - codeparrot_training - Step 30838: {'lr': 0.00045460453797991577, 'samples': 15789568, 'steps': 30838, 'loss/train': 1.8838835954666138} +03/05/2022 01:42:31 - INFO - codeparrot_training - Skipping example with length 682 (seq_length=1024) +03/05/2022 01:42:34 - INFO - codeparrot_training - Step 30839: {'lr': 0.00045460148855583295, 'samples': 15790080, 'steps': 30839, 'loss/train': 1.6490662097930908} +03/05/2022 01:42:37 - INFO - codeparrot_training - Step 30840: {'lr': 0.00045459843903955977, 'samples': 15790592, 'steps': 30840, 'loss/train': 1.2708324193954468} +03/05/2022 01:42:39 - INFO - codeparrot_training - Skipping example with length 164 (seq_length=1024) +03/05/2022 01:42:42 - INFO - codeparrot_training - Step 30841: {'lr': 0.00045459538943109774, 'samples': 15791104, 'steps': 30841, 'loss/train': 2.188490152359009} +03/05/2022 01:42:45 - INFO - codeparrot_training - Step 30842: {'lr': 0.0004545923397304482, 'samples': 15791616, 'steps': 30842, 'loss/train': 2.501016139984131} +03/05/2022 01:42:47 - INFO - codeparrot_training - Skipping example with length 350 (seq_length=1024) +03/05/2022 01:42:51 - INFO - codeparrot_training - Step 30843: {'lr': 0.0004545892899376125, 'samples': 15792128, 'steps': 30843, 'loss/train': 1.1459052562713623} +03/05/2022 01:42:54 - INFO - codeparrot_training - Step 30844: {'lr': 0.000454586240052592, 'samples': 15792640, 'steps': 30844, 'loss/train': 1.919549584388733} +03/05/2022 01:42:56 - INFO - codeparrot_training - Skipping example with length 873 (seq_length=1024) +03/05/2022 01:42:59 - INFO - codeparrot_training - Step 30845: {'lr': 0.00045458319007538804, 'samples': 15793152, 'steps': 30845, 'loss/train': 1.5615907907485962} +03/05/2022 01:43:02 - INFO - codeparrot_training - Step 30846: {'lr': 0.00045458014000600213, 'samples': 15793664, 'steps': 30846, 'loss/train': 1.6484390497207642} +03/05/2022 01:43:05 - INFO - codeparrot_training - Skipping example with length 167 (seq_length=1024) +03/05/2022 01:43:08 - INFO - codeparrot_training - Step 30847: {'lr': 0.00045457708984443556, 'samples': 15794176, 'steps': 30847, 'loss/train': 1.230629801750183} +03/05/2022 01:43:11 - INFO - codeparrot_training - Step 30848: {'lr': 0.0004545740395906897, 'samples': 15794688, 'steps': 30848, 'loss/train': 2.2825987339019775} +03/05/2022 01:43:14 - INFO - codeparrot_training - Skipping example with length 709 (seq_length=1024) +03/05/2022 01:43:16 - INFO - codeparrot_training - Step 30849: {'lr': 0.0004545709892447659, 'samples': 15795200, 'steps': 30849, 'loss/train': 1.4703425168991089} +03/05/2022 01:43:19 - INFO - codeparrot_training - Step 30850: {'lr': 0.00045456793880666556, 'samples': 15795712, 'steps': 30850, 'loss/train': 2.123150110244751} +03/05/2022 01:43:22 - INFO - codeparrot_training - Skipping example with length 178 (seq_length=1024) +03/05/2022 01:43:25 - INFO - codeparrot_training - Step 30851: {'lr': 0.0004545648882763902, 'samples': 15796224, 'steps': 30851, 'loss/train': 1.6535041332244873} +03/05/2022 01:43:28 - INFO - codeparrot_training - Step 30852: {'lr': 0.0004545618376539409, 'samples': 15796736, 'steps': 30852, 'loss/train': 1.6485791206359863} +03/05/2022 01:43:30 - INFO - codeparrot_training - Skipping example with length 6 (seq_length=1024) +03/05/2022 01:43:33 - INFO - codeparrot_training - Step 30853: {'lr': 0.0004545587869393193, 'samples': 15797248, 'steps': 30853, 'loss/train': 1.8848695755004883} +03/05/2022 01:43:36 - INFO - codeparrot_training - Step 30854: {'lr': 0.00045455573613252667, 'samples': 15797760, 'steps': 30854, 'loss/train': 1.846081018447876} +03/05/2022 01:43:38 - INFO - codeparrot_training - Skipping example with length 186 (seq_length=1024) +03/05/2022 01:43:41 - INFO - codeparrot_training - Step 30855: {'lr': 0.0004545526852335643, 'samples': 15798272, 'steps': 30855, 'loss/train': 1.1993454694747925} +03/05/2022 01:43:45 - INFO - codeparrot_training - Step 30856: {'lr': 0.0004545496342424337, 'samples': 15798784, 'steps': 30856, 'loss/train': 0.997812032699585} +03/05/2022 01:43:46 - INFO - codeparrot_training - Skipping example with length 771 (seq_length=1024) +03/05/2022 01:43:50 - INFO - codeparrot_training - Step 30857: {'lr': 0.00045454658315913617, 'samples': 15799296, 'steps': 30857, 'loss/train': 1.7588779926300049} +03/05/2022 01:43:53 - INFO - codeparrot_training - Step 30858: {'lr': 0.0004545435319836731, 'samples': 15799808, 'steps': 30858, 'loss/train': 1.8263434171676636} +03/05/2022 01:43:55 - INFO - codeparrot_training - Skipping example with length 396 (seq_length=1024) +03/05/2022 01:43:58 - INFO - codeparrot_training - Step 30859: {'lr': 0.00045454048071604593, 'samples': 15800320, 'steps': 30859, 'loss/train': 2.0573976039886475} +03/05/2022 01:44:02 - INFO - codeparrot_training - Step 30860: {'lr': 0.0004545374293562559, 'samples': 15800832, 'steps': 30860, 'loss/train': 1.8035696744918823} +03/05/2022 01:44:03 - INFO - codeparrot_training - Skipping example with length 17 (seq_length=1024) +03/05/2022 01:44:07 - INFO - codeparrot_training - Step 30861: {'lr': 0.00045453437790430446, 'samples': 15801344, 'steps': 30861, 'loss/train': 2.455286741256714} +03/05/2022 01:44:10 - INFO - codeparrot_training - Step 30862: {'lr': 0.000454531326360193, 'samples': 15801856, 'steps': 30862, 'loss/train': 1.5836222171783447} +03/05/2022 01:44:12 - INFO - codeparrot_training - Skipping example with length 862 (seq_length=1024) +03/05/2022 01:44:15 - INFO - codeparrot_training - Step 30863: {'lr': 0.00045452827472392286, 'samples': 15802368, 'steps': 30863, 'loss/train': 1.4403066635131836} +03/05/2022 01:44:19 - INFO - codeparrot_training - Step 30864: {'lr': 0.0004545252229954955, 'samples': 15802880, 'steps': 30864, 'loss/train': 1.3540735244750977} +03/05/2022 01:44:20 - INFO - codeparrot_training - Skipping example with length 109 (seq_length=1024) +03/05/2022 01:44:24 - INFO - codeparrot_training - Step 30865: {'lr': 0.00045452217117491225, 'samples': 15803392, 'steps': 30865, 'loss/train': 2.195787191390991} +03/05/2022 01:44:27 - INFO - codeparrot_training - Step 30866: {'lr': 0.00045451911926217437, 'samples': 15803904, 'steps': 30866, 'loss/train': 0.8510196805000305} +03/05/2022 01:44:29 - INFO - codeparrot_training - Skipping example with length 116 (seq_length=1024) +03/05/2022 01:44:32 - INFO - codeparrot_training - Step 30867: {'lr': 0.00045451606725728337, 'samples': 15804416, 'steps': 30867, 'loss/train': 1.405698299407959} +03/05/2022 01:44:36 - INFO - codeparrot_training - Step 30868: {'lr': 0.0004545130151602406, 'samples': 15804928, 'steps': 30868, 'loss/train': 1.5107038021087646} +03/05/2022 01:44:37 - INFO - codeparrot_training - Skipping example with length 561 (seq_length=1024) +03/05/2022 01:44:41 - INFO - codeparrot_training - Step 30869: {'lr': 0.00045450996297104743, 'samples': 15805440, 'steps': 30869, 'loss/train': 1.181347370147705} +03/05/2022 01:44:44 - INFO - codeparrot_training - Step 30870: {'lr': 0.00045450691068970515, 'samples': 15805952, 'steps': 30870, 'loss/train': 2.0976436138153076} +03/05/2022 01:44:45 - INFO - codeparrot_training - Skipping example with length 796 (seq_length=1024) +03/05/2022 01:44:49 - INFO - codeparrot_training - Step 30871: {'lr': 0.00045450385831621534, 'samples': 15806464, 'steps': 30871, 'loss/train': 0.9618310928344727} +03/05/2022 01:44:52 - INFO - codeparrot_training - Step 30872: {'lr': 0.0004545008058505792, 'samples': 15806976, 'steps': 30872, 'loss/train': 1.975067377090454} +03/05/2022 01:44:53 - INFO - codeparrot_training - Skipping example with length 865 (seq_length=1024) +03/05/2022 01:44:57 - INFO - codeparrot_training - Step 30873: {'lr': 0.0004544977532927981, 'samples': 15807488, 'steps': 30873, 'loss/train': 2.111354112625122} +03/05/2022 01:45:01 - INFO - codeparrot_training - Step 30874: {'lr': 0.0004544947006428735, 'samples': 15808000, 'steps': 30874, 'loss/train': 2.0299127101898193} +03/05/2022 01:45:02 - INFO - codeparrot_training - Skipping example with length 402 (seq_length=1024) +03/05/2022 01:45:06 - INFO - codeparrot_training - Step 30875: {'lr': 0.00045449164790080675, 'samples': 15808512, 'steps': 30875, 'loss/train': 1.534213662147522} +03/05/2022 01:45:09 - INFO - codeparrot_training - Step 30876: {'lr': 0.00045448859506659926, 'samples': 15809024, 'steps': 30876, 'loss/train': 0.6772264242172241} +03/05/2022 01:45:10 - INFO - codeparrot_training - Skipping example with length 534 (seq_length=1024) +03/05/2022 01:45:14 - INFO - codeparrot_training - Step 30877: {'lr': 0.0004544855421402523, 'samples': 15809536, 'steps': 30877, 'loss/train': 1.5088136196136475} +03/05/2022 01:45:17 - INFO - codeparrot_training - Step 30878: {'lr': 0.00045448248912176726, 'samples': 15810048, 'steps': 30878, 'loss/train': 2.041574239730835} +03/05/2022 01:45:18 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 01:45:23 - INFO - codeparrot_training - Step 30879: {'lr': 0.00045447943601114563, 'samples': 15810560, 'steps': 30879, 'loss/train': 1.9911890029907227} +03/05/2022 01:45:26 - INFO - codeparrot_training - Step 30880: {'lr': 0.00045447638280838877, 'samples': 15811072, 'steps': 30880, 'loss/train': 1.328418254852295} +03/05/2022 01:45:26 - INFO - codeparrot_training - Skipping example with length 723 (seq_length=1024) +03/05/2022 01:45:31 - INFO - codeparrot_training - Step 30881: {'lr': 0.000454473329513498, 'samples': 15811584, 'steps': 30881, 'loss/train': 1.6789195537567139} +03/05/2022 01:45:34 - INFO - codeparrot_training - Step 30882: {'lr': 0.0004544702761264746, 'samples': 15812096, 'steps': 30882, 'loss/train': 1.9404628276824951} +03/05/2022 01:45:34 - INFO - codeparrot_training - Skipping example with length 893 (seq_length=1024) +03/05/2022 01:45:39 - INFO - codeparrot_training - Step 30883: {'lr': 0.0004544672226473201, 'samples': 15812608, 'steps': 30883, 'loss/train': 2.4385030269622803} +03/05/2022 01:45:43 - INFO - codeparrot_training - Step 30884: {'lr': 0.00045446416907603585, 'samples': 15813120, 'steps': 30884, 'loss/train': 1.62992525100708} +03/05/2022 01:45:43 - INFO - codeparrot_training - Skipping example with length 441 (seq_length=1024) +03/05/2022 01:45:48 - INFO - codeparrot_training - Step 30885: {'lr': 0.00045446111541262317, 'samples': 15813632, 'steps': 30885, 'loss/train': 0.2488349825143814} +03/05/2022 01:45:51 - INFO - codeparrot_training - Step 30886: {'lr': 0.0004544580616570835, 'samples': 15814144, 'steps': 30886, 'loss/train': 1.811905860900879} +03/05/2022 01:45:51 - INFO - codeparrot_training - Skipping example with length 61 (seq_length=1024) +03/05/2022 01:45:56 - INFO - codeparrot_training - Step 30887: {'lr': 0.0004544550078094182, 'samples': 15814656, 'steps': 30887, 'loss/train': 1.7952262163162231} +03/05/2022 01:46:00 - INFO - codeparrot_training - Step 30888: {'lr': 0.00045445195386962855, 'samples': 15815168, 'steps': 30888, 'loss/train': 1.796083927154541} +03/05/2022 01:46:00 - INFO - codeparrot_training - Skipping example with length 599 (seq_length=1024) +03/05/2022 01:46:05 - INFO - codeparrot_training - Step 30889: {'lr': 0.0004544488998377161, 'samples': 15815680, 'steps': 30889, 'loss/train': 2.588817596435547} +03/05/2022 01:46:08 - INFO - codeparrot_training - Step 30890: {'lr': 0.000454445845713682, 'samples': 15816192, 'steps': 30890, 'loss/train': 1.9734289646148682} +03/05/2022 01:46:08 - INFO - codeparrot_training - Skipping example with length 528 (seq_length=1024) +03/05/2022 01:46:13 - INFO - codeparrot_training - Step 30891: {'lr': 0.0004544427914975279, 'samples': 15816704, 'steps': 30891, 'loss/train': 2.2133333683013916} +03/05/2022 01:46:16 - INFO - codeparrot_training - Step 30892: {'lr': 0.0004544397371892549, 'samples': 15817216, 'steps': 30892, 'loss/train': 2.083092212677002} +03/05/2022 01:46:17 - INFO - codeparrot_training - Skipping example with length 883 (seq_length=1024) +03/05/2022 01:46:22 - INFO - codeparrot_training - Step 30893: {'lr': 0.00045443668278886463, 'samples': 15817728, 'steps': 30893, 'loss/train': 0.8700692653656006} +03/05/2022 01:46:25 - INFO - codeparrot_training - Step 30894: {'lr': 0.00045443362829635826, 'samples': 15818240, 'steps': 30894, 'loss/train': 1.9676061868667603} +03/05/2022 01:46:25 - INFO - codeparrot_training - Skipping example with length 48 (seq_length=1024) +03/05/2022 01:46:30 - INFO - codeparrot_training - Step 30895: {'lr': 0.00045443057371173727, 'samples': 15818752, 'steps': 30895, 'loss/train': 2.025254726409912} +03/05/2022 01:46:33 - INFO - codeparrot_training - Step 30896: {'lr': 0.00045442751903500305, 'samples': 15819264, 'steps': 30896, 'loss/train': 2.0144519805908203} +03/05/2022 01:46:33 - INFO - codeparrot_training - Skipping example with length 641 (seq_length=1024) +03/05/2022 01:46:39 - INFO - codeparrot_training - Step 30897: {'lr': 0.0004544244642661569, 'samples': 15819776, 'steps': 30897, 'loss/train': 1.6518577337265015} +03/05/2022 01:46:42 - INFO - codeparrot_training - Step 30898: {'lr': 0.00045442140940520027, 'samples': 15820288, 'steps': 30898, 'loss/train': 2.2372217178344727} +03/05/2022 01:46:43 - INFO - codeparrot_training - Skipping example with length 912 (seq_length=1024) +03/05/2022 01:46:47 - INFO - codeparrot_training - Step 30899: {'lr': 0.0004544183544521345, 'samples': 15820800, 'steps': 30899, 'loss/train': 1.3643090724945068} +03/05/2022 01:46:50 - INFO - codeparrot_training - Step 30900: {'lr': 0.00045441529940696104, 'samples': 15821312, 'steps': 30900, 'loss/train': 1.5926587581634521} +03/05/2022 01:46:51 - INFO - codeparrot_training - Skipping example with length 799 (seq_length=1024) +03/05/2022 01:46:55 - INFO - codeparrot_training - Step 30901: {'lr': 0.0004544122442696811, 'samples': 15821824, 'steps': 30901, 'loss/train': 2.7287845611572266} +03/05/2022 01:46:59 - INFO - codeparrot_training - Step 30902: {'lr': 0.0004544091890402962, 'samples': 15822336, 'steps': 30902, 'loss/train': 1.090118408203125} +03/05/2022 01:46:59 - INFO - codeparrot_training - Skipping example with length 765 (seq_length=1024) +03/05/2022 01:47:04 - INFO - codeparrot_training - Step 30903: {'lr': 0.0004544061337188077, 'samples': 15822848, 'steps': 30903, 'loss/train': 1.7343541383743286} +03/05/2022 01:47:07 - INFO - codeparrot_training - Step 30904: {'lr': 0.0004544030783052169, 'samples': 15823360, 'steps': 30904, 'loss/train': 1.6753623485565186} +03/05/2022 01:47:07 - INFO - codeparrot_training - Skipping example with length 534 (seq_length=1024) +03/05/2022 01:47:12 - INFO - codeparrot_training - Step 30905: {'lr': 0.0004544000227995253, 'samples': 15823872, 'steps': 30905, 'loss/train': 1.3007274866104126} +03/05/2022 01:47:15 - INFO - codeparrot_training - Skipping example with length 704 (seq_length=1024) +03/05/2022 01:47:17 - INFO - codeparrot_training - Step 30906: {'lr': 0.00045439696720173405, 'samples': 15824384, 'steps': 30906, 'loss/train': 1.2722312211990356} +03/05/2022 01:47:21 - INFO - codeparrot_training - Step 30907: {'lr': 0.00045439391151184483, 'samples': 15824896, 'steps': 30907, 'loss/train': 1.3966833353042603} +03/05/2022 01:47:23 - INFO - codeparrot_training - Skipping example with length 269 (seq_length=1024) +03/05/2022 01:47:26 - INFO - codeparrot_training - Step 30908: {'lr': 0.0004543908557298588, 'samples': 15825408, 'steps': 30908, 'loss/train': 1.4870173931121826} +03/05/2022 01:47:29 - INFO - codeparrot_training - Step 30909: {'lr': 0.0004543877998557775, 'samples': 15825920, 'steps': 30909, 'loss/train': 0.7243610620498657} +03/05/2022 01:47:32 - INFO - codeparrot_training - Skipping example with length 724 (seq_length=1024) +03/05/2022 01:47:34 - INFO - codeparrot_training - Step 30910: {'lr': 0.00045438474388960205, 'samples': 15826432, 'steps': 30910, 'loss/train': 2.09417986869812} +03/05/2022 01:47:37 - INFO - codeparrot_training - Step 30911: {'lr': 0.0004543816878313341, 'samples': 15826944, 'steps': 30911, 'loss/train': 2.2226531505584717} +03/05/2022 01:47:40 - INFO - codeparrot_training - Skipping example with length 945 (seq_length=1024) +03/05/2022 01:47:43 - INFO - codeparrot_training - Step 30912: {'lr': 0.0004543786316809749, 'samples': 15827456, 'steps': 30912, 'loss/train': 1.6105252504348755} +03/05/2022 01:47:46 - INFO - codeparrot_training - Step 30913: {'lr': 0.0004543755754385258, 'samples': 15827968, 'steps': 30913, 'loss/train': 1.6186732053756714} +03/05/2022 01:47:49 - INFO - codeparrot_training - Skipping example with length 495 (seq_length=1024) +03/05/2022 01:47:51 - INFO - codeparrot_training - Step 30914: {'lr': 0.00045437251910398824, 'samples': 15828480, 'steps': 30914, 'loss/train': 1.6683251857757568} +03/05/2022 01:47:54 - INFO - codeparrot_training - Step 30915: {'lr': 0.00045436946267736364, 'samples': 15828992, 'steps': 30915, 'loss/train': 2.114124298095703} +03/05/2022 01:47:57 - INFO - codeparrot_training - Skipping example with length 542 (seq_length=1024) +03/05/2022 01:48:00 - INFO - codeparrot_training - Step 30916: {'lr': 0.0004543664061586532, 'samples': 15829504, 'steps': 30916, 'loss/train': 1.229833960533142} +03/05/2022 01:48:03 - INFO - codeparrot_training - Step 30917: {'lr': 0.00045436334954785854, 'samples': 15830016, 'steps': 30917, 'loss/train': 1.546056866645813} +03/05/2022 01:48:05 - INFO - codeparrot_training - Skipping example with length 423 (seq_length=1024) +03/05/2022 01:48:08 - INFO - codeparrot_training - Step 30918: {'lr': 0.0004543602928449808, 'samples': 15830528, 'steps': 30918, 'loss/train': 1.2573237419128418} +03/05/2022 01:48:11 - INFO - codeparrot_training - Step 30919: {'lr': 0.00045435723605002156, 'samples': 15831040, 'steps': 30919, 'loss/train': 1.9178073406219482} +03/05/2022 01:48:14 - INFO - codeparrot_training - Skipping example with length 513 (seq_length=1024) +03/05/2022 01:48:16 - INFO - codeparrot_training - Step 30920: {'lr': 0.00045435417916298205, 'samples': 15831552, 'steps': 30920, 'loss/train': 1.5800565481185913} +03/05/2022 01:48:20 - INFO - codeparrot_training - Step 30921: {'lr': 0.00045435112218386364, 'samples': 15832064, 'steps': 30921, 'loss/train': 1.99652099609375} +03/05/2022 01:48:22 - INFO - codeparrot_training - Skipping example with length 765 (seq_length=1024) +03/05/2022 01:48:25 - INFO - codeparrot_training - Step 30922: {'lr': 0.00045434806511266784, 'samples': 15832576, 'steps': 30922, 'loss/train': 2.527116298675537} +03/05/2022 01:48:28 - INFO - codeparrot_training - Step 30923: {'lr': 0.0004543450079493959, 'samples': 15833088, 'steps': 30923, 'loss/train': 1.7062276601791382} +03/05/2022 01:48:30 - INFO - codeparrot_training - Skipping example with length 318 (seq_length=1024) +03/05/2022 01:48:33 - INFO - codeparrot_training - Step 30924: {'lr': 0.0004543419506940494, 'samples': 15833600, 'steps': 30924, 'loss/train': 2.6366090774536133} +03/05/2022 01:48:37 - INFO - codeparrot_training - Step 30925: {'lr': 0.0004543388933466294, 'samples': 15834112, 'steps': 30925, 'loss/train': 1.983325719833374} +03/05/2022 01:48:40 - INFO - codeparrot_training - Step 30926: {'lr': 0.00045433583590713756, 'samples': 15834624, 'steps': 30926, 'loss/train': 0.17568804323673248} +03/05/2022 01:48:40 - INFO - codeparrot_training - Skipping example with length 659 (seq_length=1024) +03/05/2022 01:48:45 - INFO - codeparrot_training - Step 30927: {'lr': 0.0004543327783755751, 'samples': 15835136, 'steps': 30927, 'loss/train': 1.6338725090026855} +03/05/2022 01:48:48 - INFO - codeparrot_training - Skipping example with length 254 (seq_length=1024) +03/05/2022 01:48:50 - INFO - codeparrot_training - Step 30928: {'lr': 0.0004543297207519434, 'samples': 15835648, 'steps': 30928, 'loss/train': 1.9122414588928223} +03/05/2022 01:48:54 - INFO - codeparrot_training - Step 30929: {'lr': 0.0004543266630362439, 'samples': 15836160, 'steps': 30929, 'loss/train': 2.424015998840332} +03/05/2022 01:48:56 - INFO - codeparrot_training - Skipping example with length 436 (seq_length=1024) +03/05/2022 01:48:59 - INFO - codeparrot_training - Step 30930: {'lr': 0.00045432360522847803, 'samples': 15836672, 'steps': 30930, 'loss/train': 2.0605716705322266} +03/05/2022 01:49:02 - INFO - codeparrot_training - Step 30931: {'lr': 0.000454320547328647, 'samples': 15837184, 'steps': 30931, 'loss/train': 1.8656967878341675} +03/05/2022 01:49:06 - INFO - codeparrot_training - Step 30932: {'lr': 0.00045431748933675236, 'samples': 15837696, 'steps': 30932, 'loss/train': 0.9715030193328857} +03/05/2022 01:49:06 - INFO - codeparrot_training - Skipping example with length 453 (seq_length=1024) +03/05/2022 01:49:11 - INFO - codeparrot_training - Step 30933: {'lr': 0.00045431443125279534, 'samples': 15838208, 'steps': 30933, 'loss/train': 1.5591328144073486} +03/05/2022 01:49:14 - INFO - codeparrot_training - Step 30934: {'lr': 0.00045431137307677753, 'samples': 15838720, 'steps': 30934, 'loss/train': 2.092139959335327} +03/05/2022 01:49:15 - INFO - codeparrot_training - Skipping example with length 613 (seq_length=1024) +03/05/2022 01:49:20 - INFO - codeparrot_training - Step 30935: {'lr': 0.00045430831480870005, 'samples': 15839232, 'steps': 30935, 'loss/train': 1.1295056343078613} +03/05/2022 01:49:23 - INFO - codeparrot_training - Step 30936: {'lr': 0.0004543052564485644, 'samples': 15839744, 'steps': 30936, 'loss/train': 2.2334303855895996} +03/05/2022 01:49:23 - INFO - codeparrot_training - Skipping example with length 617 (seq_length=1024) +03/05/2022 01:49:28 - INFO - codeparrot_training - Step 30937: {'lr': 0.00045430219799637197, 'samples': 15840256, 'steps': 30937, 'loss/train': 1.2963814735412598} +03/05/2022 01:49:31 - INFO - codeparrot_training - Step 30938: {'lr': 0.0004542991394521241, 'samples': 15840768, 'steps': 30938, 'loss/train': 1.444502830505371} +03/05/2022 01:49:31 - INFO - codeparrot_training - Skipping example with length 773 (seq_length=1024) +03/05/2022 01:49:37 - INFO - codeparrot_training - Step 30939: {'lr': 0.00045429608081582216, 'samples': 15841280, 'steps': 30939, 'loss/train': 1.8565610647201538} +03/05/2022 01:49:40 - INFO - codeparrot_training - Step 30940: {'lr': 0.0004542930220874677, 'samples': 15841792, 'steps': 30940, 'loss/train': 2.0522801876068115} +03/05/2022 01:49:40 - INFO - codeparrot_training - Skipping example with length 351 (seq_length=1024) +03/05/2022 01:49:45 - INFO - codeparrot_training - Step 30941: {'lr': 0.00045428996326706185, 'samples': 15842304, 'steps': 30941, 'loss/train': 2.016282320022583} +03/05/2022 01:49:48 - INFO - codeparrot_training - Step 30942: {'lr': 0.0004542869043546061, 'samples': 15842816, 'steps': 30942, 'loss/train': 1.8218531608581543} +03/05/2022 01:49:48 - INFO - codeparrot_training - Skipping example with length 353 (seq_length=1024) +03/05/2022 01:49:53 - INFO - codeparrot_training - Step 30943: {'lr': 0.0004542838453501018, 'samples': 15843328, 'steps': 30943, 'loss/train': 0.8377234935760498} +03/05/2022 01:49:57 - INFO - codeparrot_training - Step 30944: {'lr': 0.0004542807862535504, 'samples': 15843840, 'steps': 30944, 'loss/train': 1.2963526248931885} +03/05/2022 01:49:57 - INFO - codeparrot_training - Skipping example with length 76 (seq_length=1024) +03/05/2022 01:50:02 - INFO - codeparrot_training - Step 30945: {'lr': 0.0004542777270649533, 'samples': 15844352, 'steps': 30945, 'loss/train': 2.0030367374420166} +03/05/2022 01:50:05 - INFO - codeparrot_training - Step 30946: {'lr': 0.0004542746677843117, 'samples': 15844864, 'steps': 30946, 'loss/train': 0.07478119432926178} +03/05/2022 01:50:05 - INFO - codeparrot_training - Skipping example with length 118 (seq_length=1024) +03/05/2022 01:50:10 - INFO - codeparrot_training - Step 30947: {'lr': 0.0004542716084116271, 'samples': 15845376, 'steps': 30947, 'loss/train': 1.6268080472946167} +03/05/2022 01:50:13 - INFO - codeparrot_training - Skipping example with length 963 (seq_length=1024) +03/05/2022 01:50:16 - INFO - codeparrot_training - Step 30948: {'lr': 0.0004542685489469008, 'samples': 15845888, 'steps': 30948, 'loss/train': 1.643465518951416} +03/05/2022 01:50:19 - INFO - codeparrot_training - Step 30949: {'lr': 0.0004542654893901344, 'samples': 15846400, 'steps': 30949, 'loss/train': 1.7122445106506348} +03/05/2022 01:50:22 - INFO - codeparrot_training - Skipping example with length 967 (seq_length=1024) +03/05/2022 01:50:24 - INFO - codeparrot_training - Step 30950: {'lr': 0.00045426242974132904, 'samples': 15846912, 'steps': 30950, 'loss/train': 2.2826390266418457} +03/05/2022 01:50:27 - INFO - codeparrot_training - Step 30951: {'lr': 0.0004542593700004862, 'samples': 15847424, 'steps': 30951, 'loss/train': 1.8122682571411133} +03/05/2022 01:50:31 - INFO - codeparrot_training - Step 30952: {'lr': 0.0004542563101676072, 'samples': 15847936, 'steps': 30952, 'loss/train': 1.7694283723831177} +03/05/2022 01:50:31 - INFO - codeparrot_training - Skipping example with length 858 (seq_length=1024) +03/05/2022 01:50:36 - INFO - codeparrot_training - Step 30953: {'lr': 0.0004542532502426935, 'samples': 15848448, 'steps': 30953, 'loss/train': 0.6644503474235535} +03/05/2022 01:50:39 - INFO - codeparrot_training - Step 30954: {'lr': 0.0004542501902257464, 'samples': 15848960, 'steps': 30954, 'loss/train': 2.0675861835479736} +03/05/2022 01:50:39 - INFO - codeparrot_training - Skipping example with length 501 (seq_length=1024) +03/05/2022 01:50:44 - INFO - codeparrot_training - Step 30955: {'lr': 0.0004542471301167673, 'samples': 15849472, 'steps': 30955, 'loss/train': 2.1627542972564697} +03/05/2022 01:50:47 - INFO - codeparrot_training - Step 30956: {'lr': 0.0004542440699157577, 'samples': 15849984, 'steps': 30956, 'loss/train': 0.9101678133010864} +03/05/2022 01:50:48 - INFO - codeparrot_training - Skipping example with length 720 (seq_length=1024) +03/05/2022 01:50:53 - INFO - codeparrot_training - Step 30957: {'lr': 0.00045424100962271883, 'samples': 15850496, 'steps': 30957, 'loss/train': 0.7713713049888611} +03/05/2022 01:50:56 - INFO - codeparrot_training - Step 30958: {'lr': 0.00045423794923765204, 'samples': 15851008, 'steps': 30958, 'loss/train': 2.854386806488037} +03/05/2022 01:50:56 - INFO - codeparrot_training - Skipping example with length 537 (seq_length=1024) +03/05/2022 01:51:01 - INFO - codeparrot_training - Step 30959: {'lr': 0.00045423488876055883, 'samples': 15851520, 'steps': 30959, 'loss/train': 1.8214255571365356} +03/05/2022 01:51:04 - INFO - codeparrot_training - Skipping example with length 899 (seq_length=1024) +03/05/2022 01:51:06 - INFO - codeparrot_training - Step 30960: {'lr': 0.00045423182819144054, 'samples': 15852032, 'steps': 30960, 'loss/train': 0.833591639995575} +03/05/2022 01:51:10 - INFO - codeparrot_training - Step 30961: {'lr': 0.00045422876753029853, 'samples': 15852544, 'steps': 30961, 'loss/train': 1.5145734548568726} +03/05/2022 01:51:13 - INFO - codeparrot_training - Step 30962: {'lr': 0.0004542257067771342, 'samples': 15853056, 'steps': 30962, 'loss/train': 1.9908989667892456} +03/05/2022 01:51:13 - INFO - codeparrot_training - Skipping example with length 375 (seq_length=1024) +03/05/2022 01:51:18 - INFO - codeparrot_training - Step 30963: {'lr': 0.0004542226459319489, 'samples': 15853568, 'steps': 30963, 'loss/train': 2.1853761672973633} +03/05/2022 01:51:21 - INFO - codeparrot_training - Skipping example with length 614 (seq_length=1024) +03/05/2022 01:51:23 - INFO - codeparrot_training - Step 30964: {'lr': 0.000454219584994744, 'samples': 15854080, 'steps': 30964, 'loss/train': 1.9599518775939941} +03/05/2022 01:51:27 - INFO - codeparrot_training - Step 30965: {'lr': 0.00045421652396552094, 'samples': 15854592, 'steps': 30965, 'loss/train': 1.5561466217041016} +03/05/2022 01:51:30 - INFO - codeparrot_training - Step 30966: {'lr': 0.0004542134628442811, 'samples': 15855104, 'steps': 30966, 'loss/train': 1.2308969497680664} +03/05/2022 01:51:30 - INFO - codeparrot_training - Skipping example with length 608 (seq_length=1024) +03/05/2022 01:51:35 - INFO - codeparrot_training - Step 30967: {'lr': 0.0004542104016310258, 'samples': 15855616, 'steps': 30967, 'loss/train': 1.7305328845977783} +03/05/2022 01:51:38 - INFO - codeparrot_training - Step 30968: {'lr': 0.0004542073403257564, 'samples': 15856128, 'steps': 30968, 'loss/train': 1.3858481645584106} +03/05/2022 01:51:38 - INFO - codeparrot_training - Skipping example with length 444 (seq_length=1024) +03/05/2022 01:51:43 - INFO - codeparrot_training - Step 30969: {'lr': 0.0004542042789284744, 'samples': 15856640, 'steps': 30969, 'loss/train': 1.6783955097198486} +03/05/2022 01:51:46 - INFO - codeparrot_training - Step 30970: {'lr': 0.0004542012174391811, 'samples': 15857152, 'steps': 30970, 'loss/train': 1.8002711534500122} +03/05/2022 01:51:47 - INFO - codeparrot_training - Skipping example with length 720 (seq_length=1024) +03/05/2022 01:51:52 - INFO - codeparrot_training - Step 30971: {'lr': 0.0004541981558578778, 'samples': 15857664, 'steps': 30971, 'loss/train': 2.291543960571289} +03/05/2022 01:51:55 - INFO - codeparrot_training - Step 30972: {'lr': 0.00045419509418456603, 'samples': 15858176, 'steps': 30972, 'loss/train': 2.367621421813965} +03/05/2022 01:51:55 - INFO - codeparrot_training - Skipping example with length 729 (seq_length=1024) +03/05/2022 01:52:00 - INFO - codeparrot_training - Step 30973: {'lr': 0.00045419203241924705, 'samples': 15858688, 'steps': 30973, 'loss/train': 1.5764976739883423} +03/05/2022 01:52:03 - INFO - codeparrot_training - Step 30974: {'lr': 0.00045418897056192234, 'samples': 15859200, 'steps': 30974, 'loss/train': 1.3960379362106323} +03/05/2022 01:52:04 - INFO - codeparrot_training - Skipping example with length 709 (seq_length=1024) +03/05/2022 01:52:09 - INFO - codeparrot_training - Step 30975: {'lr': 0.00045418590861259317, 'samples': 15859712, 'steps': 30975, 'loss/train': 0.8297275304794312} +03/05/2022 01:52:12 - INFO - codeparrot_training - Step 30976: {'lr': 0.0004541828465712611, 'samples': 15860224, 'steps': 30976, 'loss/train': 0.06625861674547195} +03/05/2022 01:52:12 - INFO - codeparrot_training - Skipping example with length 184 (seq_length=1024) +03/05/2022 01:52:17 - INFO - codeparrot_training - Step 30977: {'lr': 0.0004541797844379273, 'samples': 15860736, 'steps': 30977, 'loss/train': 1.4072949886322021} +03/05/2022 01:52:20 - INFO - codeparrot_training - Step 30978: {'lr': 0.0004541767222125932, 'samples': 15861248, 'steps': 30978, 'loss/train': 1.5770609378814697} +03/05/2022 01:52:20 - INFO - codeparrot_training - Skipping example with length 715 (seq_length=1024) +03/05/2022 01:52:26 - INFO - codeparrot_training - Step 30979: {'lr': 0.0004541736598952603, 'samples': 15861760, 'steps': 30979, 'loss/train': 1.1852333545684814} +03/05/2022 01:52:29 - INFO - codeparrot_training - Step 30980: {'lr': 0.0004541705974859298, 'samples': 15862272, 'steps': 30980, 'loss/train': 1.466752290725708} +03/05/2022 01:52:29 - INFO - codeparrot_training - Skipping example with length 776 (seq_length=1024) +03/05/2022 01:52:34 - INFO - codeparrot_training - Step 30981: {'lr': 0.0004541675349846033, 'samples': 15862784, 'steps': 30981, 'loss/train': 1.243790626525879} +03/05/2022 01:52:37 - INFO - codeparrot_training - Step 30982: {'lr': 0.000454164472391282, 'samples': 15863296, 'steps': 30982, 'loss/train': 1.6239548921585083} +03/05/2022 01:52:37 - INFO - codeparrot_training - Skipping example with length 497 (seq_length=1024) +03/05/2022 01:52:43 - INFO - codeparrot_training - Step 30983: {'lr': 0.00045416140970596736, 'samples': 15863808, 'steps': 30983, 'loss/train': 1.53493070602417} +03/05/2022 01:52:46 - INFO - codeparrot_training - Step 30984: {'lr': 0.0004541583469286607, 'samples': 15864320, 'steps': 30984, 'loss/train': 1.5314464569091797} +03/05/2022 01:52:46 - INFO - codeparrot_training - Skipping example with length 143 (seq_length=1024) +03/05/2022 01:52:51 - INFO - codeparrot_training - Step 30985: {'lr': 0.00045415528405936347, 'samples': 15864832, 'steps': 30985, 'loss/train': 2.0324625968933105} +03/05/2022 01:52:54 - INFO - codeparrot_training - Step 30986: {'lr': 0.000454152221098077, 'samples': 15865344, 'steps': 30986, 'loss/train': 2.337380886077881} +03/05/2022 01:52:54 - INFO - codeparrot_training - Skipping example with length 195 (seq_length=1024) +03/05/2022 01:52:59 - INFO - codeparrot_training - Step 30987: {'lr': 0.0004541491580448027, 'samples': 15865856, 'steps': 30987, 'loss/train': 2.3334641456604004} +03/05/2022 01:53:02 - INFO - codeparrot_training - Skipping example with length 969 (seq_length=1024) +03/05/2022 01:53:05 - INFO - codeparrot_training - Step 30988: {'lr': 0.00045414609489954195, 'samples': 15866368, 'steps': 30988, 'loss/train': 1.7933517694473267} +03/05/2022 01:53:08 - INFO - codeparrot_training - Step 30989: {'lr': 0.00045414303166229616, 'samples': 15866880, 'steps': 30989, 'loss/train': 1.2874490022659302} +03/05/2022 01:53:10 - INFO - codeparrot_training - Skipping example with length 450 (seq_length=1024) +03/05/2022 01:53:13 - INFO - codeparrot_training - Step 30990: {'lr': 0.0004541399683330666, 'samples': 15867392, 'steps': 30990, 'loss/train': 0.8950868844985962} +03/05/2022 01:53:16 - INFO - codeparrot_training - Step 30991: {'lr': 0.00045413690491185476, 'samples': 15867904, 'steps': 30991, 'loss/train': 1.63676917552948} +03/05/2022 01:53:19 - INFO - codeparrot_training - Skipping example with length 361 (seq_length=1024) +03/05/2022 01:53:21 - INFO - codeparrot_training - Step 30992: {'lr': 0.00045413384139866196, 'samples': 15868416, 'steps': 30992, 'loss/train': 1.4612616300582886} +03/05/2022 01:53:25 - INFO - codeparrot_training - Step 30993: {'lr': 0.0004541307777934896, 'samples': 15868928, 'steps': 30993, 'loss/train': 2.029505968093872} +03/05/2022 01:53:27 - INFO - codeparrot_training - Skipping example with length 121 (seq_length=1024) +03/05/2022 01:53:30 - INFO - codeparrot_training - Step 30994: {'lr': 0.00045412771409633905, 'samples': 15869440, 'steps': 30994, 'loss/train': 1.956223487854004} +03/05/2022 01:53:33 - INFO - codeparrot_training - Step 30995: {'lr': 0.0004541246503072117, 'samples': 15869952, 'steps': 30995, 'loss/train': 2.00334095954895} +03/05/2022 01:53:35 - INFO - codeparrot_training - Skipping example with length 265 (seq_length=1024) +03/05/2022 01:53:38 - INFO - codeparrot_training - Step 30996: {'lr': 0.000454121586426109, 'samples': 15870464, 'steps': 30996, 'loss/train': 1.388145923614502} +03/05/2022 01:53:42 - INFO - codeparrot_training - Step 30997: {'lr': 0.0004541185224530322, 'samples': 15870976, 'steps': 30997, 'loss/train': 0.17015931010246277} +03/05/2022 01:53:44 - INFO - codeparrot_training - Skipping example with length 159 (seq_length=1024) +03/05/2022 01:53:47 - INFO - codeparrot_training - Step 30998: {'lr': 0.00045411545838798273, 'samples': 15871488, 'steps': 30998, 'loss/train': 1.5545047521591187} +03/05/2022 01:53:50 - INFO - codeparrot_training - Step 30999: {'lr': 0.00045411239423096206, 'samples': 15872000, 'steps': 30999, 'loss/train': 1.5775765180587769} +03/05/2022 01:53:52 - INFO - codeparrot_training - Skipping example with length 902 (seq_length=1024) +03/05/2022 01:53:55 - INFO - codeparrot_training - Step 31000: {'lr': 0.0004541093299819714, 'samples': 15872512, 'steps': 31000, 'loss/train': 1.723979115486145} +03/05/2022 01:53:59 - INFO - codeparrot_training - Step 31001: {'lr': 0.0004541062656410123, 'samples': 15873024, 'steps': 31001, 'loss/train': 1.4222108125686646} +03/05/2022 01:54:01 - INFO - codeparrot_training - Skipping example with length 227 (seq_length=1024) +03/05/2022 01:54:04 - INFO - codeparrot_training - Step 31002: {'lr': 0.000454103201208086, 'samples': 15873536, 'steps': 31002, 'loss/train': 1.3299506902694702} +03/05/2022 01:54:07 - INFO - codeparrot_training - Step 31003: {'lr': 0.00045410013668319404, 'samples': 15874048, 'steps': 31003, 'loss/train': 1.6875066757202148} +03/05/2022 01:54:09 - INFO - codeparrot_training - Skipping example with length 793 (seq_length=1024) +03/05/2022 01:54:12 - INFO - codeparrot_training - Step 31004: {'lr': 0.00045409707206633764, 'samples': 15874560, 'steps': 31004, 'loss/train': 1.080405354499817} +03/05/2022 01:54:15 - INFO - codeparrot_training - Step 31005: {'lr': 0.0004540940073575183, 'samples': 15875072, 'steps': 31005, 'loss/train': 1.7155218124389648} +03/05/2022 01:54:18 - INFO - codeparrot_training - Skipping example with length 679 (seq_length=1024) +03/05/2022 01:54:21 - INFO - codeparrot_training - Step 31006: {'lr': 0.00045409094255673734, 'samples': 15875584, 'steps': 31006, 'loss/train': 1.581612229347229} +03/05/2022 01:54:24 - INFO - codeparrot_training - Step 31007: {'lr': 0.00045408787766399605, 'samples': 15876096, 'steps': 31007, 'loss/train': 1.2886601686477661} +03/05/2022 01:54:26 - INFO - codeparrot_training - Skipping example with length 666 (seq_length=1024) +03/05/2022 01:54:29 - INFO - codeparrot_training - Step 31008: {'lr': 0.00045408481267929604, 'samples': 15876608, 'steps': 31008, 'loss/train': 1.9097386598587036} +03/05/2022 01:54:33 - INFO - codeparrot_training - Step 31009: {'lr': 0.0004540817476026385, 'samples': 15877120, 'steps': 31009, 'loss/train': 2.1265344619750977} +03/05/2022 01:54:35 - INFO - codeparrot_training - Skipping example with length 844 (seq_length=1024) +03/05/2022 01:54:38 - INFO - codeparrot_training - Step 31010: {'lr': 0.00045407868243402483, 'samples': 15877632, 'steps': 31010, 'loss/train': 1.6197446584701538} +03/05/2022 01:54:41 - INFO - codeparrot_training - Step 31011: {'lr': 0.0004540756171734565, 'samples': 15878144, 'steps': 31011, 'loss/train': 2.1251659393310547} +03/05/2022 01:54:43 - INFO - codeparrot_training - Skipping example with length 853 (seq_length=1024) +03/05/2022 01:54:46 - INFO - codeparrot_training - Step 31012: {'lr': 0.0004540725518209349, 'samples': 15878656, 'steps': 31012, 'loss/train': 1.3918331861495972} +03/05/2022 01:54:49 - INFO - codeparrot_training - Step 31013: {'lr': 0.0004540694863764613, 'samples': 15879168, 'steps': 31013, 'loss/train': 1.3065340518951416} +03/05/2022 01:54:51 - INFO - codeparrot_training - Skipping example with length 81 (seq_length=1024) +03/05/2022 01:54:55 - INFO - codeparrot_training - Step 31014: {'lr': 0.0004540664208400371, 'samples': 15879680, 'steps': 31014, 'loss/train': 1.8788014650344849} +03/05/2022 01:54:58 - INFO - codeparrot_training - Step 31015: {'lr': 0.0004540633552116638, 'samples': 15880192, 'steps': 31015, 'loss/train': 1.3577966690063477} +03/05/2022 01:55:00 - INFO - codeparrot_training - Skipping example with length 35 (seq_length=1024) +03/05/2022 01:55:03 - INFO - codeparrot_training - Step 31016: {'lr': 0.0004540602894913427, 'samples': 15880704, 'steps': 31016, 'loss/train': 1.5502246618270874} +03/05/2022 01:55:06 - INFO - codeparrot_training - Step 31017: {'lr': 0.0004540572236790751, 'samples': 15881216, 'steps': 31017, 'loss/train': 1.9129462242126465} +03/05/2022 01:55:08 - INFO - codeparrot_training - Skipping example with length 275 (seq_length=1024) +03/05/2022 01:55:12 - INFO - codeparrot_training - Step 31018: {'lr': 0.0004540541577748625, 'samples': 15881728, 'steps': 31018, 'loss/train': 0.9524648189544678} +03/05/2022 01:55:15 - INFO - codeparrot_training - Step 31019: {'lr': 0.0004540510917787063, 'samples': 15882240, 'steps': 31019, 'loss/train': 1.6206148862838745} +03/05/2022 01:55:18 - INFO - codeparrot_training - Skipping example with length 726 (seq_length=1024) +03/05/2022 01:55:20 - INFO - codeparrot_training - Step 31020: {'lr': 0.00045404802569060776, 'samples': 15882752, 'steps': 31020, 'loss/train': 0.23085585236549377} +03/05/2022 01:55:23 - INFO - codeparrot_training - Step 31021: {'lr': 0.00045404495951056835, 'samples': 15883264, 'steps': 31021, 'loss/train': 1.185053825378418} +03/05/2022 01:55:26 - INFO - codeparrot_training - Skipping example with length 301 (seq_length=1024) +03/05/2022 01:55:29 - INFO - codeparrot_training - Step 31022: {'lr': 0.00045404189323858946, 'samples': 15883776, 'steps': 31022, 'loss/train': 2.0368337631225586} +03/05/2022 01:55:32 - INFO - codeparrot_training - Step 31023: {'lr': 0.0004540388268746724, 'samples': 15884288, 'steps': 31023, 'loss/train': 0.5062656998634338} +03/05/2022 01:55:35 - INFO - codeparrot_training - Skipping example with length 272 (seq_length=1024) +03/05/2022 01:55:37 - INFO - codeparrot_training - Step 31024: {'lr': 0.0004540357604188186, 'samples': 15884800, 'steps': 31024, 'loss/train': 1.846888780593872} +03/05/2022 01:55:41 - INFO - codeparrot_training - Step 31025: {'lr': 0.0004540326938710295, 'samples': 15885312, 'steps': 31025, 'loss/train': 2.523287296295166} +03/05/2022 01:55:43 - INFO - codeparrot_training - Skipping example with length 75 (seq_length=1024) +03/05/2022 01:55:46 - INFO - codeparrot_training - Step 31026: {'lr': 0.0004540296272313064, 'samples': 15885824, 'steps': 31026, 'loss/train': 1.6225273609161377} +03/05/2022 01:55:49 - INFO - codeparrot_training - Step 31027: {'lr': 0.00045402656049965055, 'samples': 15886336, 'steps': 31027, 'loss/train': 1.668952226638794} +03/05/2022 01:55:51 - INFO - codeparrot_training - Skipping example with length 832 (seq_length=1024) +03/05/2022 01:55:54 - INFO - codeparrot_training - Step 31028: {'lr': 0.0004540234936760636, 'samples': 15886848, 'steps': 31028, 'loss/train': 1.7061861753463745} +03/05/2022 01:55:57 - INFO - codeparrot_training - Step 31029: {'lr': 0.00045402042676054684, 'samples': 15887360, 'steps': 31029, 'loss/train': 1.356921911239624} +03/05/2022 01:56:00 - INFO - codeparrot_training - Skipping example with length 845 (seq_length=1024) +03/05/2022 01:56:03 - INFO - codeparrot_training - Step 31030: {'lr': 0.0004540173597531015, 'samples': 15887872, 'steps': 31030, 'loss/train': 0.9442176818847656} +03/05/2022 01:56:06 - INFO - codeparrot_training - Step 31031: {'lr': 0.00045401429265372925, 'samples': 15888384, 'steps': 31031, 'loss/train': 0.9786296486854553} +03/05/2022 01:56:08 - INFO - codeparrot_training - Skipping example with length 639 (seq_length=1024) +03/05/2022 01:56:11 - INFO - codeparrot_training - Step 31032: {'lr': 0.0004540112254624312, 'samples': 15888896, 'steps': 31032, 'loss/train': 2.161379098892212} +03/05/2022 01:56:14 - INFO - codeparrot_training - Step 31033: {'lr': 0.0004540081581792089, 'samples': 15889408, 'steps': 31033, 'loss/train': 1.3048256635665894} +03/05/2022 01:56:17 - INFO - codeparrot_training - Skipping example with length 484 (seq_length=1024) +03/05/2022 01:56:20 - INFO - codeparrot_training - Step 31034: {'lr': 0.0004540050908040636, 'samples': 15889920, 'steps': 31034, 'loss/train': 1.5006375312805176} +03/05/2022 01:56:23 - INFO - codeparrot_training - Step 31035: {'lr': 0.0004540020233369968, 'samples': 15890432, 'steps': 31035, 'loss/train': 2.5797078609466553} +03/05/2022 01:56:25 - INFO - codeparrot_training - Skipping example with length 24 (seq_length=1024) +03/05/2022 01:56:28 - INFO - codeparrot_training - Step 31036: {'lr': 0.00045399895577800985, 'samples': 15890944, 'steps': 31036, 'loss/train': 1.9128408432006836} +03/05/2022 01:56:31 - INFO - codeparrot_training - Step 31037: {'lr': 0.00045399588812710415, 'samples': 15891456, 'steps': 31037, 'loss/train': 2.336669445037842} +03/05/2022 01:56:33 - INFO - codeparrot_training - Skipping example with length 123 (seq_length=1024) +03/05/2022 01:56:36 - INFO - codeparrot_training - Step 31038: {'lr': 0.0004539928203842809, 'samples': 15891968, 'steps': 31038, 'loss/train': 2.016925096511841} +03/05/2022 01:56:39 - INFO - codeparrot_training - Step 31039: {'lr': 0.0004539897525495418, 'samples': 15892480, 'steps': 31039, 'loss/train': 2.2826406955718994} +03/05/2022 01:56:42 - INFO - codeparrot_training - Skipping example with length 734 (seq_length=1024) +03/05/2022 01:56:45 - INFO - codeparrot_training - Step 31040: {'lr': 0.0004539866846228879, 'samples': 15892992, 'steps': 31040, 'loss/train': 1.7109838724136353} +03/05/2022 01:56:48 - INFO - codeparrot_training - Step 31041: {'lr': 0.0004539836166043209, 'samples': 15893504, 'steps': 31041, 'loss/train': 0.2107848972082138} +03/05/2022 01:56:50 - INFO - codeparrot_training - Skipping example with length 493 (seq_length=1024) +03/05/2022 01:56:53 - INFO - codeparrot_training - Step 31042: {'lr': 0.00045398054849384197, 'samples': 15894016, 'steps': 31042, 'loss/train': 2.0768253803253174} +03/05/2022 01:56:56 - INFO - codeparrot_training - Step 31043: {'lr': 0.0004539774802914526, 'samples': 15894528, 'steps': 31043, 'loss/train': 2.1518638134002686} +03/05/2022 01:56:58 - INFO - codeparrot_training - Skipping example with length 533 (seq_length=1024) +03/05/2022 01:57:02 - INFO - codeparrot_training - Step 31044: {'lr': 0.00045397441199715406, 'samples': 15895040, 'steps': 31044, 'loss/train': 2.0035881996154785} +03/05/2022 01:57:05 - INFO - codeparrot_training - Step 31045: {'lr': 0.0004539713436109478, 'samples': 15895552, 'steps': 31045, 'loss/train': 1.3785030841827393} +03/05/2022 01:57:07 - INFO - codeparrot_training - Skipping example with length 655 (seq_length=1024) +03/05/2022 01:57:10 - INFO - codeparrot_training - Step 31046: {'lr': 0.0004539682751328352, 'samples': 15896064, 'steps': 31046, 'loss/train': 1.39830482006073} +03/05/2022 01:57:13 - INFO - codeparrot_training - Step 31047: {'lr': 0.0004539652065628177, 'samples': 15896576, 'steps': 31047, 'loss/train': 2.4769535064697266} +03/05/2022 01:57:15 - INFO - codeparrot_training - Skipping example with length 492 (seq_length=1024) +03/05/2022 01:57:19 - INFO - codeparrot_training - Step 31048: {'lr': 0.00045396213790089657, 'samples': 15897088, 'steps': 31048, 'loss/train': 1.1181715726852417} +03/05/2022 01:57:22 - INFO - codeparrot_training - Step 31049: {'lr': 0.0004539590691470733, 'samples': 15897600, 'steps': 31049, 'loss/train': 2.0698914527893066} +03/05/2022 01:57:24 - INFO - codeparrot_training - Skipping example with length 54 (seq_length=1024) +03/05/2022 01:57:27 - INFO - codeparrot_training - Step 31050: {'lr': 0.0004539560003013492, 'samples': 15898112, 'steps': 31050, 'loss/train': 1.4740917682647705} +03/05/2022 01:57:30 - INFO - codeparrot_training - Step 31051: {'lr': 0.0004539529313637256, 'samples': 15898624, 'steps': 31051, 'loss/train': 0.8870312571525574} +03/05/2022 01:57:32 - INFO - codeparrot_training - Skipping example with length 613 (seq_length=1024) +03/05/2022 01:57:35 - INFO - codeparrot_training - Step 31052: {'lr': 0.0004539498623342041, 'samples': 15899136, 'steps': 31052, 'loss/train': 2.3583619594573975} +03/05/2022 01:57:39 - INFO - codeparrot_training - Step 31053: {'lr': 0.0004539467932127858, 'samples': 15899648, 'steps': 31053, 'loss/train': 1.639033317565918} +03/05/2022 01:57:40 - INFO - codeparrot_training - Skipping example with length 514 (seq_length=1024) +03/05/2022 01:57:44 - INFO - codeparrot_training - Step 31054: {'lr': 0.00045394372399947225, 'samples': 15900160, 'steps': 31054, 'loss/train': 1.6291180849075317} +03/05/2022 01:57:47 - INFO - codeparrot_training - Step 31055: {'lr': 0.0004539406546942649, 'samples': 15900672, 'steps': 31055, 'loss/train': 0.5368399024009705} +03/05/2022 01:57:49 - INFO - codeparrot_training - Skipping example with length 762 (seq_length=1024) +03/05/2022 01:57:52 - INFO - codeparrot_training - Step 31056: {'lr': 0.00045393758529716497, 'samples': 15901184, 'steps': 31056, 'loss/train': 0.30685704946517944} +03/05/2022 01:57:55 - INFO - codeparrot_training - Step 31057: {'lr': 0.0004539345158081739, 'samples': 15901696, 'steps': 31057, 'loss/train': 1.618955135345459} +03/05/2022 01:57:57 - INFO - codeparrot_training - Skipping example with length 344 (seq_length=1024) +03/05/2022 01:58:01 - INFO - codeparrot_training - Step 31058: {'lr': 0.0004539314462272931, 'samples': 15902208, 'steps': 31058, 'loss/train': 2.251624345779419} +03/05/2022 01:58:04 - INFO - codeparrot_training - Step 31059: {'lr': 0.0004539283765545239, 'samples': 15902720, 'steps': 31059, 'loss/train': 2.048711061477661} +03/05/2022 01:58:06 - INFO - codeparrot_training - Skipping example with length 217 (seq_length=1024) +03/05/2022 01:58:09 - INFO - codeparrot_training - Step 31060: {'lr': 0.00045392530678986775, 'samples': 15903232, 'steps': 31060, 'loss/train': 1.6102041006088257} +03/05/2022 01:58:12 - INFO - codeparrot_training - Step 31061: {'lr': 0.00045392223693332604, 'samples': 15903744, 'steps': 31061, 'loss/train': 2.021141767501831} +03/05/2022 01:58:14 - INFO - codeparrot_training - Skipping example with length 117 (seq_length=1024) +03/05/2022 01:58:17 - INFO - codeparrot_training - Step 31062: {'lr': 0.0004539191669849001, 'samples': 15904256, 'steps': 31062, 'loss/train': 2.0053646564483643} +03/05/2022 01:58:21 - INFO - codeparrot_training - Step 31063: {'lr': 0.0004539160969445913, 'samples': 15904768, 'steps': 31063, 'loss/train': 1.594766616821289} +03/05/2022 01:58:22 - INFO - codeparrot_training - Skipping example with length 603 (seq_length=1024) +03/05/2022 01:58:26 - INFO - codeparrot_training - Step 31064: {'lr': 0.0004539130268124011, 'samples': 15905280, 'steps': 31064, 'loss/train': 1.4969077110290527} +03/05/2022 01:58:29 - INFO - codeparrot_training - Step 31065: {'lr': 0.0004539099565883308, 'samples': 15905792, 'steps': 31065, 'loss/train': 2.3274800777435303} +03/05/2022 01:58:30 - INFO - codeparrot_training - Skipping example with length 759 (seq_length=1024) +03/05/2022 01:58:34 - INFO - codeparrot_training - Step 31066: {'lr': 0.0004539068862723818, 'samples': 15906304, 'steps': 31066, 'loss/train': 1.3392586708068848} +03/05/2022 01:58:37 - INFO - codeparrot_training - Step 31067: {'lr': 0.0004539038158645555, 'samples': 15906816, 'steps': 31067, 'loss/train': 1.635895013809204} +03/05/2022 01:58:38 - INFO - codeparrot_training - Skipping example with length 928 (seq_length=1024) +03/05/2022 01:58:43 - INFO - codeparrot_training - Step 31068: {'lr': 0.00045390074536485336, 'samples': 15907328, 'steps': 31068, 'loss/train': 1.365620493888855} +03/05/2022 01:58:46 - INFO - codeparrot_training - Step 31069: {'lr': 0.00045389767477327657, 'samples': 15907840, 'steps': 31069, 'loss/train': 0.15375058352947235} +03/05/2022 01:58:47 - INFO - codeparrot_training - Skipping example with length 30 (seq_length=1024) +03/05/2022 01:58:51 - INFO - codeparrot_training - Step 31070: {'lr': 0.00045389460408982676, 'samples': 15908352, 'steps': 31070, 'loss/train': 2.339210271835327} +03/05/2022 01:58:54 - INFO - codeparrot_training - Step 31071: {'lr': 0.0004538915333145052, 'samples': 15908864, 'steps': 31071, 'loss/train': 1.7322310209274292} +03/05/2022 01:58:55 - INFO - codeparrot_training - Skipping example with length 609 (seq_length=1024) +03/05/2022 01:58:59 - INFO - codeparrot_training - Step 31072: {'lr': 0.00045388846244731314, 'samples': 15909376, 'steps': 31072, 'loss/train': 1.9424974918365479} +03/05/2022 01:59:03 - INFO - codeparrot_training - Step 31073: {'lr': 0.00045388539148825214, 'samples': 15909888, 'steps': 31073, 'loss/train': 1.668043613433838} +03/05/2022 01:59:03 - INFO - codeparrot_training - Skipping example with length 866 (seq_length=1024) +03/05/2022 01:59:08 - INFO - codeparrot_training - Step 31074: {'lr': 0.0004538823204373235, 'samples': 15910400, 'steps': 31074, 'loss/train': 1.9071142673492432} +03/05/2022 01:59:11 - INFO - codeparrot_training - Step 31075: {'lr': 0.00045387924929452873, 'samples': 15910912, 'steps': 31075, 'loss/train': 2.2375648021698} +03/05/2022 01:59:12 - INFO - codeparrot_training - Skipping example with length 1018 (seq_length=1024) +03/05/2022 01:59:16 - INFO - codeparrot_training - Step 31076: {'lr': 0.000453876178059869, 'samples': 15911424, 'steps': 31076, 'loss/train': 1.8308181762695312} +03/05/2022 01:59:19 - INFO - codeparrot_training - Step 31077: {'lr': 0.0004538731067333459, 'samples': 15911936, 'steps': 31077, 'loss/train': 1.0102323293685913} +03/05/2022 01:59:25 - INFO - codeparrot_training - Step 31078: {'lr': 0.00045387003531496064, 'samples': 15912448, 'steps': 31078, 'loss/train': 1.622928500175476} +03/05/2022 01:59:28 - INFO - codeparrot_training - Step 31079: {'lr': 0.00045386696380471473, 'samples': 15912960, 'steps': 31079, 'loss/train': 2.0409433841705322} +03/05/2022 01:59:28 - INFO - codeparrot_training - Skipping example with length 459 (seq_length=1024) +03/05/2022 01:59:33 - INFO - codeparrot_training - Step 31080: {'lr': 0.0004538638922026095, 'samples': 15913472, 'steps': 31080, 'loss/train': 2.378960371017456} +03/05/2022 01:59:36 - INFO - codeparrot_training - Step 31081: {'lr': 0.0004538608205086464, 'samples': 15913984, 'steps': 31081, 'loss/train': 1.8667718172073364} +03/05/2022 01:59:37 - INFO - codeparrot_training - Skipping example with length 290 (seq_length=1024) +03/05/2022 01:59:42 - INFO - codeparrot_training - Step 31082: {'lr': 0.0004538577487228267, 'samples': 15914496, 'steps': 31082, 'loss/train': 2.2108724117279053} +03/05/2022 01:59:45 - INFO - codeparrot_training - Step 31083: {'lr': 0.00045385467684515193, 'samples': 15915008, 'steps': 31083, 'loss/train': 2.2047266960144043} +03/05/2022 01:59:45 - INFO - codeparrot_training - Skipping example with length 94 (seq_length=1024) +03/05/2022 01:59:50 - INFO - codeparrot_training - Step 31084: {'lr': 0.0004538516048756233, 'samples': 15915520, 'steps': 31084, 'loss/train': 2.0003206729888916} +03/05/2022 01:59:53 - INFO - codeparrot_training - Step 31085: {'lr': 0.00045384853281424235, 'samples': 15916032, 'steps': 31085, 'loss/train': 0.9549766182899475} +03/05/2022 01:59:53 - INFO - codeparrot_training - Skipping example with length 543 (seq_length=1024) +03/05/2022 01:59:59 - INFO - codeparrot_training - Step 31086: {'lr': 0.0004538454606610103, 'samples': 15916544, 'steps': 31086, 'loss/train': 1.8502594232559204} +03/05/2022 02:00:02 - INFO - codeparrot_training - Step 31087: {'lr': 0.0004538423884159287, 'samples': 15917056, 'steps': 31087, 'loss/train': 2.1873044967651367} +03/05/2022 02:00:02 - INFO - codeparrot_training - Skipping example with length 493 (seq_length=1024) +03/05/2022 02:00:07 - INFO - codeparrot_training - Step 31088: {'lr': 0.0004538393160789988, 'samples': 15917568, 'steps': 31088, 'loss/train': 1.227258324623108} +03/05/2022 02:00:10 - INFO - codeparrot_training - Step 31089: {'lr': 0.0004538362436502221, 'samples': 15918080, 'steps': 31089, 'loss/train': 1.5615841150283813} +03/05/2022 02:00:10 - INFO - codeparrot_training - Skipping example with length 513 (seq_length=1024) +03/05/2022 02:00:16 - INFO - codeparrot_training - Step 31090: {'lr': 0.00045383317112959997, 'samples': 15918592, 'steps': 31090, 'loss/train': 1.8077309131622314} +03/05/2022 02:00:19 - INFO - codeparrot_training - Step 31091: {'lr': 0.0004538300985171337, 'samples': 15919104, 'steps': 31091, 'loss/train': 0.5859639048576355} +03/05/2022 02:00:19 - INFO - codeparrot_training - Skipping example with length 242 (seq_length=1024) +03/05/2022 02:00:24 - INFO - codeparrot_training - Step 31092: {'lr': 0.00045382702581282477, 'samples': 15919616, 'steps': 31092, 'loss/train': 1.071000099182129} +03/05/2022 02:00:27 - INFO - codeparrot_training - Skipping example with length 1019 (seq_length=1024) +03/05/2022 02:00:29 - INFO - codeparrot_training - Step 31093: {'lr': 0.0004538239530166745, 'samples': 15920128, 'steps': 31093, 'loss/train': 1.5428143739700317} +03/05/2022 02:00:32 - INFO - codeparrot_training - Step 31094: {'lr': 0.0004538208801286843, 'samples': 15920640, 'steps': 31094, 'loss/train': 2.3137831687927246} +03/05/2022 02:00:35 - INFO - codeparrot_training - Skipping example with length 360 (seq_length=1024) +03/05/2022 02:00:38 - INFO - codeparrot_training - Step 31095: {'lr': 0.0004538178071488556, 'samples': 15921152, 'steps': 31095, 'loss/train': 1.9550915956497192} +03/05/2022 02:00:41 - INFO - codeparrot_training - Step 31096: {'lr': 0.00045381473407718963, 'samples': 15921664, 'steps': 31096, 'loss/train': 1.4543966054916382} +03/05/2022 02:00:44 - INFO - codeparrot_training - Step 31097: {'lr': 0.000453811660913688, 'samples': 15922176, 'steps': 31097, 'loss/train': 1.9568668603897095} +03/05/2022 02:00:44 - INFO - codeparrot_training - Skipping example with length 828 (seq_length=1024) +03/05/2022 02:00:49 - INFO - codeparrot_training - Step 31098: {'lr': 0.000453808587658352, 'samples': 15922688, 'steps': 31098, 'loss/train': 2.397277593612671} +03/05/2022 02:00:52 - INFO - codeparrot_training - Skipping example with length 622 (seq_length=1024) +03/05/2022 02:00:55 - INFO - codeparrot_training - Step 31099: {'lr': 0.0004538055143111829, 'samples': 15923200, 'steps': 31099, 'loss/train': 1.4020473957061768} +03/05/2022 02:00:58 - INFO - codeparrot_training - Step 31100: {'lr': 0.00045380244087218224, 'samples': 15923712, 'steps': 31100, 'loss/train': 1.963415265083313} +03/05/2022 02:01:01 - INFO - codeparrot_training - Skipping example with length 896 (seq_length=1024) +03/05/2022 02:01:03 - INFO - codeparrot_training - Step 31101: {'lr': 0.0004537993673413513, 'samples': 15924224, 'steps': 31101, 'loss/train': 2.28629994392395} +03/05/2022 02:01:06 - INFO - codeparrot_training - Step 31102: {'lr': 0.0004537962937186916, 'samples': 15924736, 'steps': 31102, 'loss/train': 1.4422993659973145} +03/05/2022 02:01:09 - INFO - codeparrot_training - Skipping example with length 209 (seq_length=1024) +03/05/2022 02:01:11 - INFO - codeparrot_training - Step 31103: {'lr': 0.00045379322000420433, 'samples': 15925248, 'steps': 31103, 'loss/train': 1.5797686576843262} +03/05/2022 02:01:15 - INFO - codeparrot_training - Step 31104: {'lr': 0.00045379014619789106, 'samples': 15925760, 'steps': 31104, 'loss/train': 1.93656587600708} +03/05/2022 02:01:17 - INFO - codeparrot_training - Skipping example with length 864 (seq_length=1024) +03/05/2022 02:01:20 - INFO - codeparrot_training - Step 31105: {'lr': 0.00045378707229975303, 'samples': 15926272, 'steps': 31105, 'loss/train': 0.9083523154258728} +03/05/2022 02:01:23 - INFO - codeparrot_training - Step 31106: {'lr': 0.0004537839983097917, 'samples': 15926784, 'steps': 31106, 'loss/train': 2.0974676609039307} +03/05/2022 02:01:25 - INFO - codeparrot_training - Skipping example with length 594 (seq_length=1024) +03/05/2022 02:01:28 - INFO - codeparrot_training - Step 31107: {'lr': 0.0004537809242280085, 'samples': 15927296, 'steps': 31107, 'loss/train': 1.553531527519226} +03/05/2022 02:01:31 - INFO - codeparrot_training - Step 31108: {'lr': 0.0004537778500544047, 'samples': 15927808, 'steps': 31108, 'loss/train': 2.1052277088165283} +03/05/2022 02:01:34 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 02:01:37 - INFO - codeparrot_training - Step 31109: {'lr': 0.0004537747757889817, 'samples': 15928320, 'steps': 31109, 'loss/train': 0.12641894817352295} +03/05/2022 02:01:40 - INFO - codeparrot_training - Step 31110: {'lr': 0.0004537717014317411, 'samples': 15928832, 'steps': 31110, 'loss/train': 1.6423856019973755} +03/05/2022 02:01:42 - INFO - codeparrot_training - Skipping example with length 627 (seq_length=1024) +03/05/2022 02:01:45 - INFO - codeparrot_training - Step 31111: {'lr': 0.00045376862698268393, 'samples': 15929344, 'steps': 31111, 'loss/train': 1.6166242361068726} +03/05/2022 02:01:48 - INFO - codeparrot_training - Step 31112: {'lr': 0.0004537655524418119, 'samples': 15929856, 'steps': 31112, 'loss/train': 0.6394819617271423} +03/05/2022 02:01:51 - INFO - codeparrot_training - Skipping example with length 799 (seq_length=1024) +03/05/2022 02:01:54 - INFO - codeparrot_training - Step 31113: {'lr': 0.00045376247780912616, 'samples': 15930368, 'steps': 31113, 'loss/train': 1.6246287822723389} +03/05/2022 02:01:57 - INFO - codeparrot_training - Step 31114: {'lr': 0.00045375940308462826, 'samples': 15930880, 'steps': 31114, 'loss/train': 2.0412142276763916} +03/05/2022 02:02:00 - INFO - codeparrot_training - Skipping example with length 55 (seq_length=1024) +03/05/2022 02:02:02 - INFO - codeparrot_training - Step 31115: {'lr': 0.00045375632826831947, 'samples': 15931392, 'steps': 31115, 'loss/train': 1.929744005203247} +03/05/2022 02:02:05 - INFO - codeparrot_training - Step 31116: {'lr': 0.00045375325336020124, 'samples': 15931904, 'steps': 31116, 'loss/train': 1.6718261241912842} +03/05/2022 02:02:08 - INFO - codeparrot_training - Skipping example with length 211 (seq_length=1024) +03/05/2022 02:02:10 - INFO - codeparrot_training - Step 31117: {'lr': 0.000453750178360275, 'samples': 15932416, 'steps': 31117, 'loss/train': 0.9813358783721924} +03/05/2022 02:02:14 - INFO - codeparrot_training - Step 31118: {'lr': 0.00045374710326854194, 'samples': 15932928, 'steps': 31118, 'loss/train': 2.6160011291503906} +03/05/2022 02:02:16 - INFO - codeparrot_training - Skipping example with length 307 (seq_length=1024) +03/05/2022 02:02:19 - INFO - codeparrot_training - Step 31119: {'lr': 0.0004537440280850037, 'samples': 15933440, 'steps': 31119, 'loss/train': 2.3415873050689697} +03/05/2022 02:02:22 - INFO - codeparrot_training - Step 31120: {'lr': 0.00045374095280966147, 'samples': 15933952, 'steps': 31120, 'loss/train': 1.3892284631729126} +03/05/2022 02:02:24 - INFO - codeparrot_training - Skipping example with length 825 (seq_length=1024) +03/05/2022 02:02:27 - INFO - codeparrot_training - Step 31121: {'lr': 0.00045373787744251677, 'samples': 15934464, 'steps': 31121, 'loss/train': 1.7189258337020874} +03/05/2022 02:02:30 - INFO - codeparrot_training - Step 31122: {'lr': 0.0004537348019835709, 'samples': 15934976, 'steps': 31122, 'loss/train': 2.0913403034210205} +03/05/2022 02:02:33 - INFO - codeparrot_training - Skipping example with length 970 (seq_length=1024) +03/05/2022 02:02:36 - INFO - codeparrot_training - Step 31123: {'lr': 0.0004537317264328252, 'samples': 15935488, 'steps': 31123, 'loss/train': 1.1791996955871582} +03/05/2022 02:02:39 - INFO - codeparrot_training - Step 31124: {'lr': 0.00045372865079028123, 'samples': 15936000, 'steps': 31124, 'loss/train': 1.0934760570526123} +03/05/2022 02:02:41 - INFO - codeparrot_training - Skipping example with length 840 (seq_length=1024) +03/05/2022 02:02:44 - INFO - codeparrot_training - Step 31125: {'lr': 0.00045372557505594024, 'samples': 15936512, 'steps': 31125, 'loss/train': 2.094167947769165} +03/05/2022 02:02:47 - INFO - codeparrot_training - Step 31126: {'lr': 0.0004537224992298037, 'samples': 15937024, 'steps': 31126, 'loss/train': 2.194850206375122} +03/05/2022 02:02:50 - INFO - codeparrot_training - Skipping example with length 539 (seq_length=1024) +03/05/2022 02:02:53 - INFO - codeparrot_training - Step 31127: {'lr': 0.00045371942331187286, 'samples': 15937536, 'steps': 31127, 'loss/train': 1.3411511182785034} +03/05/2022 02:02:56 - INFO - codeparrot_training - Step 31128: {'lr': 0.00045371634730214923, 'samples': 15938048, 'steps': 31128, 'loss/train': 1.4223006963729858} +03/05/2022 02:02:58 - INFO - codeparrot_training - Skipping example with length 683 (seq_length=1024) +03/05/2022 02:03:01 - INFO - codeparrot_training - Step 31129: {'lr': 0.00045371327120063417, 'samples': 15938560, 'steps': 31129, 'loss/train': 1.844749093055725} +03/05/2022 02:03:04 - INFO - codeparrot_training - Step 31130: {'lr': 0.00045371019500732904, 'samples': 15939072, 'steps': 31130, 'loss/train': 1.2477525472640991} +03/05/2022 02:03:06 - INFO - codeparrot_training - Skipping example with length 414 (seq_length=1024) +03/05/2022 02:03:09 - INFO - codeparrot_training - Step 31131: {'lr': 0.00045370711872223525, 'samples': 15939584, 'steps': 31131, 'loss/train': 1.799143671989441} +03/05/2022 02:03:13 - INFO - codeparrot_training - Step 31132: {'lr': 0.00045370404234535414, 'samples': 15940096, 'steps': 31132, 'loss/train': 1.3410942554473877} +03/05/2022 02:03:15 - INFO - codeparrot_training - Skipping example with length 643 (seq_length=1024) +03/05/2022 02:03:18 - INFO - codeparrot_training - Step 31133: {'lr': 0.00045370096587668714, 'samples': 15940608, 'steps': 31133, 'loss/train': 1.060439109802246} +03/05/2022 02:03:21 - INFO - codeparrot_training - Step 31134: {'lr': 0.0004536978893162357, 'samples': 15941120, 'steps': 31134, 'loss/train': 1.4308747053146362} +03/05/2022 02:03:23 - INFO - codeparrot_training - Skipping example with length 21 (seq_length=1024) +03/05/2022 02:03:26 - INFO - codeparrot_training - Step 31135: {'lr': 0.000453694812664001, 'samples': 15941632, 'steps': 31135, 'loss/train': 1.652655005455017} +03/05/2022 02:03:29 - INFO - codeparrot_training - Step 31136: {'lr': 0.00045369173591998466, 'samples': 15942144, 'steps': 31136, 'loss/train': 1.6214581727981567} +03/05/2022 02:03:31 - INFO - codeparrot_training - Skipping example with length 888 (seq_length=1024) +03/05/2022 02:03:35 - INFO - codeparrot_training - Step 31137: {'lr': 0.00045368865908418794, 'samples': 15942656, 'steps': 31137, 'loss/train': 2.6861472129821777} +03/05/2022 02:03:38 - INFO - codeparrot_training - Step 31138: {'lr': 0.00045368558215661225, 'samples': 15943168, 'steps': 31138, 'loss/train': 2.5820486545562744} +03/05/2022 02:03:39 - INFO - codeparrot_training - Skipping example with length 229 (seq_length=1024) +03/05/2022 02:03:43 - INFO - codeparrot_training - Step 31139: {'lr': 0.00045368250513725896, 'samples': 15943680, 'steps': 31139, 'loss/train': 1.6927965879440308} +03/05/2022 02:03:46 - INFO - codeparrot_training - Step 31140: {'lr': 0.00045367942802612953, 'samples': 15944192, 'steps': 31140, 'loss/train': 2.1222760677337646} +03/05/2022 02:03:48 - INFO - codeparrot_training - Skipping example with length 367 (seq_length=1024) +03/05/2022 02:03:52 - INFO - codeparrot_training - Step 31141: {'lr': 0.0004536763508232252, 'samples': 15944704, 'steps': 31141, 'loss/train': 2.0758845806121826} +03/05/2022 02:03:55 - INFO - codeparrot_training - Step 31142: {'lr': 0.0004536732735285476, 'samples': 15945216, 'steps': 31142, 'loss/train': 1.521748661994934} +03/05/2022 02:03:56 - INFO - codeparrot_training - Skipping example with length 945 (seq_length=1024) +03/05/2022 02:04:00 - INFO - codeparrot_training - Step 31143: {'lr': 0.00045367019614209783, 'samples': 15945728, 'steps': 31143, 'loss/train': 1.296442985534668} +03/05/2022 02:04:03 - INFO - codeparrot_training - Step 31144: {'lr': 0.0004536671186638775, 'samples': 15946240, 'steps': 31144, 'loss/train': 0.681323230266571} +03/05/2022 02:04:04 - INFO - codeparrot_training - Skipping example with length 333 (seq_length=1024) +03/05/2022 02:04:08 - INFO - codeparrot_training - Step 31145: {'lr': 0.0004536640410938879, 'samples': 15946752, 'steps': 31145, 'loss/train': 1.9207953214645386} +03/05/2022 02:04:12 - INFO - codeparrot_training - Step 31146: {'lr': 0.00045366096343213034, 'samples': 15947264, 'steps': 31146, 'loss/train': 1.1354986429214478} +03/05/2022 02:04:13 - INFO - codeparrot_training - Skipping example with length 179 (seq_length=1024) +03/05/2022 02:04:17 - INFO - codeparrot_training - Step 31147: {'lr': 0.0004536578856786064, 'samples': 15947776, 'steps': 31147, 'loss/train': 2.243995428085327} +03/05/2022 02:04:20 - INFO - codeparrot_training - Step 31148: {'lr': 0.0004536548078333172, 'samples': 15948288, 'steps': 31148, 'loss/train': 2.109376907348633} +03/05/2022 02:04:21 - INFO - codeparrot_training - Skipping example with length 203 (seq_length=1024) +03/05/2022 02:04:25 - INFO - codeparrot_training - Step 31149: {'lr': 0.0004536517298962645, 'samples': 15948800, 'steps': 31149, 'loss/train': 1.9802937507629395} +03/05/2022 02:04:28 - INFO - codeparrot_training - Step 31150: {'lr': 0.00045364865186744936, 'samples': 15949312, 'steps': 31150, 'loss/train': 1.0325675010681152} +03/05/2022 02:04:30 - INFO - codeparrot_training - Skipping example with length 950 (seq_length=1024) +03/05/2022 02:04:34 - INFO - codeparrot_training - Step 31151: {'lr': 0.0004536455737468733, 'samples': 15949824, 'steps': 31151, 'loss/train': 2.50885009765625} +03/05/2022 02:04:37 - INFO - codeparrot_training - Step 31152: {'lr': 0.00045364249553453764, 'samples': 15950336, 'steps': 31152, 'loss/train': 1.30526864528656} +03/05/2022 02:04:38 - INFO - codeparrot_training - Skipping example with length 478 (seq_length=1024) +03/05/2022 02:04:42 - INFO - codeparrot_training - Step 31153: {'lr': 0.00045363941723044386, 'samples': 15950848, 'steps': 31153, 'loss/train': 1.4854711294174194} +03/05/2022 02:04:45 - INFO - codeparrot_training - Step 31154: {'lr': 0.0004536363388345933, 'samples': 15951360, 'steps': 31154, 'loss/train': 2.256815195083618} +03/05/2022 02:04:46 - INFO - codeparrot_training - Skipping example with length 644 (seq_length=1024) +03/05/2022 02:04:51 - INFO - codeparrot_training - Step 31155: {'lr': 0.0004536332603469873, 'samples': 15951872, 'steps': 31155, 'loss/train': 1.4689518213272095} +03/05/2022 02:04:54 - INFO - codeparrot_training - Step 31156: {'lr': 0.0004536301817676274, 'samples': 15952384, 'steps': 31156, 'loss/train': 0.9998283982276917} +03/05/2022 02:04:54 - INFO - codeparrot_training - Skipping example with length 82 (seq_length=1024) +03/05/2022 02:04:59 - INFO - codeparrot_training - Step 31157: {'lr': 0.0004536271030965148, 'samples': 15952896, 'steps': 31157, 'loss/train': 1.9493473768234253} +03/05/2022 02:05:02 - INFO - codeparrot_training - Step 31158: {'lr': 0.00045362402433365094, 'samples': 15953408, 'steps': 31158, 'loss/train': 1.440495491027832} +03/05/2022 02:05:03 - INFO - codeparrot_training - Skipping example with length 726 (seq_length=1024) +03/05/2022 02:05:07 - INFO - codeparrot_training - Step 31159: {'lr': 0.0004536209454790373, 'samples': 15953920, 'steps': 31159, 'loss/train': 0.06311877816915512} +03/05/2022 02:05:11 - INFO - codeparrot_training - Step 31160: {'lr': 0.00045361786653267517, 'samples': 15954432, 'steps': 31160, 'loss/train': 1.8373218774795532} +03/05/2022 02:05:11 - INFO - codeparrot_training - Skipping example with length 220 (seq_length=1024) +03/05/2022 02:05:16 - INFO - codeparrot_training - Step 31161: {'lr': 0.00045361478749456595, 'samples': 15954944, 'steps': 31161, 'loss/train': 2.5531375408172607} +03/05/2022 02:05:19 - INFO - codeparrot_training - Step 31162: {'lr': 0.0004536117083647111, 'samples': 15955456, 'steps': 31162, 'loss/train': 1.3080500364303589} +03/05/2022 02:05:19 - INFO - codeparrot_training - Skipping example with length 973 (seq_length=1024) +03/05/2022 02:05:24 - INFO - codeparrot_training - Step 31163: {'lr': 0.00045360862914311194, 'samples': 15955968, 'steps': 31163, 'loss/train': 1.6087499856948853} +03/05/2022 02:05:27 - INFO - codeparrot_training - Step 31164: {'lr': 0.0004536055498297699, 'samples': 15956480, 'steps': 31164, 'loss/train': 1.876952886581421} +03/05/2022 02:05:28 - INFO - codeparrot_training - Skipping example with length 917 (seq_length=1024) +03/05/2022 02:05:33 - INFO - codeparrot_training - Step 31165: {'lr': 0.00045360247042468635, 'samples': 15956992, 'steps': 31165, 'loss/train': 1.6783844232559204} +03/05/2022 02:05:35 - INFO - codeparrot_training - Skipping example with length 185 (seq_length=1024) +03/05/2022 02:05:38 - INFO - codeparrot_training - Step 31166: {'lr': 0.0004535993909278626, 'samples': 15957504, 'steps': 31166, 'loss/train': 1.0046114921569824} +03/05/2022 02:05:41 - INFO - codeparrot_training - Step 31167: {'lr': 0.00045359631133930016, 'samples': 15958016, 'steps': 31167, 'loss/train': 1.724531888961792} +03/05/2022 02:05:44 - INFO - codeparrot_training - Skipping example with length 119 (seq_length=1024) +03/05/2022 02:05:46 - INFO - codeparrot_training - Step 31168: {'lr': 0.0004535932316590003, 'samples': 15958528, 'steps': 31168, 'loss/train': 1.582970380783081} +03/05/2022 02:05:49 - INFO - codeparrot_training - Step 31169: {'lr': 0.00045359015188696457, 'samples': 15959040, 'steps': 31169, 'loss/train': 1.6183720827102661} +03/05/2022 02:05:52 - INFO - codeparrot_training - Skipping example with length 97 (seq_length=1024) +03/05/2022 02:05:55 - INFO - codeparrot_training - Step 31170: {'lr': 0.00045358707202319414, 'samples': 15959552, 'steps': 31170, 'loss/train': 1.1541517972946167} +03/05/2022 02:05:58 - INFO - codeparrot_training - Step 31171: {'lr': 0.0004535839920676906, 'samples': 15960064, 'steps': 31171, 'loss/train': 1.2418867349624634} +03/05/2022 02:06:01 - INFO - codeparrot_training - Skipping example with length 683 (seq_length=1024) +03/05/2022 02:06:03 - INFO - codeparrot_training - Step 31172: {'lr': 0.0004535809120204553, 'samples': 15960576, 'steps': 31172, 'loss/train': 1.5746601819992065} +03/05/2022 02:06:06 - INFO - codeparrot_training - Step 31173: {'lr': 0.0004535778318814895, 'samples': 15961088, 'steps': 31173, 'loss/train': 2.203705072402954} +03/05/2022 02:06:09 - INFO - codeparrot_training - Skipping example with length 558 (seq_length=1024) +03/05/2022 02:06:12 - INFO - codeparrot_training - Step 31174: {'lr': 0.0004535747516507947, 'samples': 15961600, 'steps': 31174, 'loss/train': 1.0623031854629517} +03/05/2022 02:06:15 - INFO - codeparrot_training - Step 31175: {'lr': 0.00045357167132837223, 'samples': 15962112, 'steps': 31175, 'loss/train': 1.5531258583068848} +03/05/2022 02:06:17 - INFO - codeparrot_training - Skipping example with length 702 (seq_length=1024) +03/05/2022 02:06:20 - INFO - codeparrot_training - Step 31176: {'lr': 0.00045356859091422354, 'samples': 15962624, 'steps': 31176, 'loss/train': 1.5580382347106934} +03/05/2022 02:06:23 - INFO - codeparrot_training - Step 31177: {'lr': 0.00045356551040835, 'samples': 15963136, 'steps': 31177, 'loss/train': 2.2512400150299072} +03/05/2022 02:06:26 - INFO - codeparrot_training - Step 31178: {'lr': 0.0004535624298107529, 'samples': 15963648, 'steps': 31178, 'loss/train': 1.2703704833984375} +03/05/2022 02:06:27 - INFO - codeparrot_training - Skipping example with length 357 (seq_length=1024) +03/05/2022 02:06:32 - INFO - codeparrot_training - Step 31179: {'lr': 0.00045355934912143383, 'samples': 15964160, 'steps': 31179, 'loss/train': 1.8403284549713135} +03/05/2022 02:06:35 - INFO - codeparrot_training - Step 31180: {'lr': 0.00045355626834039394, 'samples': 15964672, 'steps': 31180, 'loss/train': 1.495927333831787} +03/05/2022 02:06:35 - INFO - codeparrot_training - Skipping example with length 449 (seq_length=1024) +03/05/2022 02:06:40 - INFO - codeparrot_training - Step 31181: {'lr': 0.00045355318746763477, 'samples': 15965184, 'steps': 31181, 'loss/train': 2.033578872680664} +03/05/2022 02:06:43 - INFO - codeparrot_training - Step 31182: {'lr': 0.0004535501065031577, 'samples': 15965696, 'steps': 31182, 'loss/train': 1.8074513673782349} +03/05/2022 02:06:44 - INFO - codeparrot_training - Skipping example with length 179 (seq_length=1024) +03/05/2022 02:06:49 - INFO - codeparrot_training - Step 31183: {'lr': 0.0004535470254469641, 'samples': 15966208, 'steps': 31183, 'loss/train': 1.4288966655731201} +03/05/2022 02:06:52 - INFO - codeparrot_training - Step 31184: {'lr': 0.00045354394429905534, 'samples': 15966720, 'steps': 31184, 'loss/train': 1.8764216899871826} +03/05/2022 02:06:52 - INFO - codeparrot_training - Skipping example with length 308 (seq_length=1024) +03/05/2022 02:06:57 - INFO - codeparrot_training - Step 31185: {'lr': 0.0004535408630594328, 'samples': 15967232, 'steps': 31185, 'loss/train': 3.076322555541992} +03/05/2022 02:07:00 - INFO - codeparrot_training - Step 31186: {'lr': 0.0004535377817280979, 'samples': 15967744, 'steps': 31186, 'loss/train': 2.0013303756713867} +03/05/2022 02:07:01 - INFO - codeparrot_training - Skipping example with length 516 (seq_length=1024) +03/05/2022 02:07:06 - INFO - codeparrot_training - Step 31187: {'lr': 0.0004535347003050521, 'samples': 15968256, 'steps': 31187, 'loss/train': 2.2167117595672607} +03/05/2022 02:07:09 - INFO - codeparrot_training - Step 31188: {'lr': 0.0004535316187902966, 'samples': 15968768, 'steps': 31188, 'loss/train': 1.4744330644607544} +03/05/2022 02:07:09 - INFO - codeparrot_training - Skipping example with length 92 (seq_length=1024) +03/05/2022 02:07:14 - INFO - codeparrot_training - Step 31189: {'lr': 0.00045352853718383287, 'samples': 15969280, 'steps': 31189, 'loss/train': 2.1889350414276123} +03/05/2022 02:07:17 - INFO - codeparrot_training - Step 31190: {'lr': 0.00045352545548566235, 'samples': 15969792, 'steps': 31190, 'loss/train': 1.952658772468567} +03/05/2022 02:07:17 - INFO - codeparrot_training - Skipping example with length 812 (seq_length=1024) +03/05/2022 02:07:22 - INFO - codeparrot_training - Step 31191: {'lr': 0.00045352237369578643, 'samples': 15970304, 'steps': 31191, 'loss/train': 2.1785707473754883} +03/05/2022 02:07:25 - INFO - codeparrot_training - Step 31192: {'lr': 0.00045351929181420647, 'samples': 15970816, 'steps': 31192, 'loss/train': 2.016024351119995} +03/05/2022 02:07:25 - INFO - codeparrot_training - Skipping example with length 212 (seq_length=1024) +03/05/2022 02:07:31 - INFO - codeparrot_training - Step 31193: {'lr': 0.0004535162098409238, 'samples': 15971328, 'steps': 31193, 'loss/train': 2.1145870685577393} +03/05/2022 02:07:34 - INFO - codeparrot_training - Step 31194: {'lr': 0.00045351312777593995, 'samples': 15971840, 'steps': 31194, 'loss/train': 1.5336185693740845} +03/05/2022 02:07:34 - INFO - codeparrot_training - Skipping example with length 641 (seq_length=1024) +03/05/2022 02:07:39 - INFO - codeparrot_training - Step 31195: {'lr': 0.0004535100456192562, 'samples': 15972352, 'steps': 31195, 'loss/train': 1.689664602279663} +03/05/2022 02:07:42 - INFO - codeparrot_training - Skipping example with length 98 (seq_length=1024) +03/05/2022 02:07:45 - INFO - codeparrot_training - Step 31196: {'lr': 0.00045350696337087396, 'samples': 15972864, 'steps': 31196, 'loss/train': 1.7903504371643066} +03/05/2022 02:07:48 - INFO - codeparrot_training - Step 31197: {'lr': 0.0004535038810307946, 'samples': 15973376, 'steps': 31197, 'loss/train': 1.7612403631210327} +03/05/2022 02:07:51 - INFO - codeparrot_training - Skipping example with length 207 (seq_length=1024) +03/05/2022 02:07:53 - INFO - codeparrot_training - Step 31198: {'lr': 0.00045350079859901956, 'samples': 15973888, 'steps': 31198, 'loss/train': 0.21661192178726196} +03/05/2022 02:07:56 - INFO - codeparrot_training - Step 31199: {'lr': 0.00045349771607555017, 'samples': 15974400, 'steps': 31199, 'loss/train': 1.3992919921875} +03/05/2022 02:08:00 - INFO - codeparrot_training - Step 31200: {'lr': 0.0004534946334603879, 'samples': 15974912, 'steps': 31200, 'loss/train': 1.5382903814315796} +03/05/2022 02:08:00 - INFO - codeparrot_training - Skipping example with length 578 (seq_length=1024) +03/05/2022 02:08:05 - INFO - codeparrot_training - Step 31201: {'lr': 0.000453491550753534, 'samples': 15975424, 'steps': 31201, 'loss/train': 1.9669768810272217} +03/05/2022 02:08:08 - INFO - codeparrot_training - Skipping example with length 252 (seq_length=1024) +03/05/2022 02:08:10 - INFO - codeparrot_training - Step 31202: {'lr': 0.00045348846795499, 'samples': 15975936, 'steps': 31202, 'loss/train': 1.3622984886169434} +03/05/2022 02:08:13 - INFO - codeparrot_training - Step 31203: {'lr': 0.0004534853850647572, 'samples': 15976448, 'steps': 31203, 'loss/train': 1.906019687652588} +03/05/2022 02:08:16 - INFO - codeparrot_training - Skipping example with length 416 (seq_length=1024) +03/05/2022 02:08:19 - INFO - codeparrot_training - Step 31204: {'lr': 0.00045348230208283716, 'samples': 15976960, 'steps': 31204, 'loss/train': 2.3006138801574707} +03/05/2022 02:08:22 - INFO - codeparrot_training - Step 31205: {'lr': 0.000453479219009231, 'samples': 15977472, 'steps': 31205, 'loss/train': 1.388038158416748} +03/05/2022 02:08:25 - INFO - codeparrot_training - Skipping example with length 383 (seq_length=1024) +03/05/2022 02:08:27 - INFO - codeparrot_training - Step 31206: {'lr': 0.00045347613584394034, 'samples': 15977984, 'steps': 31206, 'loss/train': 1.5862382650375366} +03/05/2022 02:08:30 - INFO - codeparrot_training - Step 31207: {'lr': 0.0004534730525869664, 'samples': 15978496, 'steps': 31207, 'loss/train': 2.2657642364501953} +03/05/2022 02:08:34 - INFO - codeparrot_training - Step 31208: {'lr': 0.0004534699692383106, 'samples': 15979008, 'steps': 31208, 'loss/train': 1.9134202003479004} +03/05/2022 02:08:34 - INFO - codeparrot_training - Skipping example with length 280 (seq_length=1024) +03/05/2022 02:08:39 - INFO - codeparrot_training - Step 31209: {'lr': 0.00045346688579797444, 'samples': 15979520, 'steps': 31209, 'loss/train': 2.785701274871826} +03/05/2022 02:08:42 - INFO - codeparrot_training - Step 31210: {'lr': 0.0004534638022659592, 'samples': 15980032, 'steps': 31210, 'loss/train': 2.153606414794922} +03/05/2022 02:08:42 - INFO - codeparrot_training - Skipping example with length 878 (seq_length=1024) +03/05/2022 02:08:47 - INFO - codeparrot_training - Step 31211: {'lr': 0.00045346071864226634, 'samples': 15980544, 'steps': 31211, 'loss/train': 1.8848086595535278} +03/05/2022 02:08:50 - INFO - codeparrot_training - Step 31212: {'lr': 0.0004534576349268973, 'samples': 15981056, 'steps': 31212, 'loss/train': 1.7241636514663696} +03/05/2022 02:08:51 - INFO - codeparrot_training - Skipping example with length 831 (seq_length=1024) +03/05/2022 02:08:56 - INFO - codeparrot_training - Step 31213: {'lr': 0.00045345455111985326, 'samples': 15981568, 'steps': 31213, 'loss/train': 1.588283896446228} +03/05/2022 02:08:59 - INFO - codeparrot_training - Step 31214: {'lr': 0.0004534514672211358, 'samples': 15982080, 'steps': 31214, 'loss/train': 0.2839645743370056} +03/05/2022 02:08:59 - INFO - codeparrot_training - Skipping example with length 349 (seq_length=1024) +03/05/2022 02:09:04 - INFO - codeparrot_training - Step 31215: {'lr': 0.0004534483832307462, 'samples': 15982592, 'steps': 31215, 'loss/train': 0.888735294342041} +03/05/2022 02:09:07 - INFO - codeparrot_training - Step 31216: {'lr': 0.00045344529914868593, 'samples': 15983104, 'steps': 31216, 'loss/train': 2.0720736980438232} +03/05/2022 02:09:09 - INFO - codeparrot_training - Skipping example with length 829 (seq_length=1024) +03/05/2022 02:09:13 - INFO - codeparrot_training - Step 31217: {'lr': 0.0004534422149749564, 'samples': 15983616, 'steps': 31217, 'loss/train': 1.3915958404541016} +03/05/2022 02:09:16 - INFO - codeparrot_training - Step 31218: {'lr': 0.0004534391307095589, 'samples': 15984128, 'steps': 31218, 'loss/train': 1.2616907358169556} +03/05/2022 02:09:17 - INFO - codeparrot_training - Skipping example with length 159 (seq_length=1024) +03/05/2022 02:09:21 - INFO - codeparrot_training - Step 31219: {'lr': 0.0004534360463524948, 'samples': 15984640, 'steps': 31219, 'loss/train': 1.9746536016464233} +03/05/2022 02:09:24 - INFO - codeparrot_training - Step 31220: {'lr': 0.00045343296190376566, 'samples': 15985152, 'steps': 31220, 'loss/train': 1.8314369916915894} +03/05/2022 02:09:26 - INFO - codeparrot_training - Skipping example with length 353 (seq_length=1024) +03/05/2022 02:09:30 - INFO - codeparrot_training - Step 31221: {'lr': 0.0004534298773633727, 'samples': 15985664, 'steps': 31221, 'loss/train': 1.94963800907135} +03/05/2022 02:09:33 - INFO - codeparrot_training - Step 31222: {'lr': 0.00045342679273131743, 'samples': 15986176, 'steps': 31222, 'loss/train': 1.6512612104415894} +03/05/2022 02:09:34 - INFO - codeparrot_training - Skipping example with length 750 (seq_length=1024) +03/05/2022 02:09:38 - INFO - codeparrot_training - Step 31223: {'lr': 0.0004534237080076011, 'samples': 15986688, 'steps': 31223, 'loss/train': 1.544721007347107} +03/05/2022 02:09:41 - INFO - codeparrot_training - Step 31224: {'lr': 0.0004534206231922253, 'samples': 15987200, 'steps': 31224, 'loss/train': 1.469767451286316} +03/05/2022 02:09:42 - INFO - codeparrot_training - Skipping example with length 575 (seq_length=1024) +03/05/2022 02:09:46 - INFO - codeparrot_training - Step 31225: {'lr': 0.0004534175382851913, 'samples': 15987712, 'steps': 31225, 'loss/train': 1.243323564529419} +03/05/2022 02:09:49 - INFO - codeparrot_training - Step 31226: {'lr': 0.0004534144532865004, 'samples': 15988224, 'steps': 31226, 'loss/train': 1.938773274421692} +03/05/2022 02:09:50 - INFO - codeparrot_training - Skipping example with length 393 (seq_length=1024) +03/05/2022 02:09:55 - INFO - codeparrot_training - Step 31227: {'lr': 0.00045341136819615415, 'samples': 15988736, 'steps': 31227, 'loss/train': 1.9212853908538818} +03/05/2022 02:09:58 - INFO - codeparrot_training - Step 31228: {'lr': 0.0004534082830141538, 'samples': 15989248, 'steps': 31228, 'loss/train': 1.1477086544036865} +03/05/2022 02:09:59 - INFO - codeparrot_training - Skipping example with length 86 (seq_length=1024) +03/05/2022 02:10:03 - INFO - codeparrot_training - Step 31229: {'lr': 0.00045340519774050093, 'samples': 15989760, 'steps': 31229, 'loss/train': 1.0667884349822998} +03/05/2022 02:10:06 - INFO - codeparrot_training - Step 31230: {'lr': 0.0004534021123751968, 'samples': 15990272, 'steps': 31230, 'loss/train': 1.9355428218841553} +03/05/2022 02:10:07 - INFO - codeparrot_training - Skipping example with length 184 (seq_length=1024) +03/05/2022 02:10:12 - INFO - codeparrot_training - Step 31231: {'lr': 0.00045339902691824275, 'samples': 15990784, 'steps': 31231, 'loss/train': 1.748635172843933} +03/05/2022 02:10:15 - INFO - codeparrot_training - Step 31232: {'lr': 0.0004533959413696402, 'samples': 15991296, 'steps': 31232, 'loss/train': 2.0622451305389404} +03/05/2022 02:10:15 - INFO - codeparrot_training - Skipping example with length 852 (seq_length=1024) +03/05/2022 02:10:20 - INFO - codeparrot_training - Step 31233: {'lr': 0.0004533928557293907, 'samples': 15991808, 'steps': 31233, 'loss/train': 1.6732925176620483} +03/05/2022 02:10:23 - INFO - codeparrot_training - Step 31234: {'lr': 0.00045338976999749546, 'samples': 15992320, 'steps': 31234, 'loss/train': 1.7939825057983398} +03/05/2022 02:10:24 - INFO - codeparrot_training - Skipping example with length 578 (seq_length=1024) +03/05/2022 02:10:29 - INFO - codeparrot_training - Step 31235: {'lr': 0.00045338668417395595, 'samples': 15992832, 'steps': 31235, 'loss/train': 1.3740499019622803} +03/05/2022 02:10:32 - INFO - codeparrot_training - Step 31236: {'lr': 0.0004533835982587735, 'samples': 15993344, 'steps': 31236, 'loss/train': 1.6959775686264038} +03/05/2022 02:10:32 - INFO - codeparrot_training - Skipping example with length 988 (seq_length=1024) +03/05/2022 02:10:37 - INFO - codeparrot_training - Step 31237: {'lr': 0.00045338051225194954, 'samples': 15993856, 'steps': 31237, 'loss/train': 1.2128299474716187} +03/05/2022 02:10:40 - INFO - codeparrot_training - Step 31238: {'lr': 0.0004533774261534855, 'samples': 15994368, 'steps': 31238, 'loss/train': 2.155068874359131} +03/05/2022 02:10:40 - INFO - codeparrot_training - Skipping example with length 131 (seq_length=1024) +03/05/2022 02:10:46 - INFO - codeparrot_training - Step 31239: {'lr': 0.00045337433996338274, 'samples': 15994880, 'steps': 31239, 'loss/train': 2.0498902797698975} +03/05/2022 02:10:49 - INFO - codeparrot_training - Step 31240: {'lr': 0.0004533712536816426, 'samples': 15995392, 'steps': 31240, 'loss/train': 1.4867193698883057} +03/05/2022 02:10:49 - INFO - codeparrot_training - Skipping example with length 991 (seq_length=1024) +03/05/2022 02:10:54 - INFO - codeparrot_training - Step 31241: {'lr': 0.0004533681673082665, 'samples': 15995904, 'steps': 31241, 'loss/train': 2.2967164516448975} +03/05/2022 02:10:57 - INFO - codeparrot_training - Step 31242: {'lr': 0.00045336508084325587, 'samples': 15996416, 'steps': 31242, 'loss/train': 1.5800848007202148} +03/05/2022 02:10:57 - INFO - codeparrot_training - Skipping example with length 359 (seq_length=1024) +03/05/2022 02:11:03 - INFO - codeparrot_training - Step 31243: {'lr': 0.0004533619942866121, 'samples': 15996928, 'steps': 31243, 'loss/train': 2.5654125213623047} +03/05/2022 02:11:06 - INFO - codeparrot_training - Step 31244: {'lr': 0.00045335890763833646, 'samples': 15997440, 'steps': 31244, 'loss/train': 2.2336838245391846} +03/05/2022 02:11:06 - INFO - codeparrot_training - Skipping example with length 795 (seq_length=1024) +03/05/2022 02:11:11 - INFO - codeparrot_training - Step 31245: {'lr': 0.0004533558208984305, 'samples': 15997952, 'steps': 31245, 'loss/train': 2.403945207595825} +03/05/2022 02:11:14 - INFO - codeparrot_training - Step 31246: {'lr': 0.0004533527340668956, 'samples': 15998464, 'steps': 31246, 'loss/train': 0.5994052886962891} +03/05/2022 02:11:14 - INFO - codeparrot_training - Skipping example with length 706 (seq_length=1024) +03/05/2022 02:11:19 - INFO - codeparrot_training - Step 31247: {'lr': 0.000453349647143733, 'samples': 15998976, 'steps': 31247, 'loss/train': 1.2113748788833618} +03/05/2022 02:11:23 - INFO - codeparrot_training - Step 31248: {'lr': 0.00045334656012894424, 'samples': 15999488, 'steps': 31248, 'loss/train': 1.7672685384750366} +03/05/2022 02:11:23 - INFO - codeparrot_training - Skipping example with length 879 (seq_length=1024) +03/05/2022 02:11:28 - INFO - codeparrot_training - Step 31249: {'lr': 0.00045334347302253064, 'samples': 16000000, 'steps': 31249, 'loss/train': 1.8587634563446045} +03/05/2022 02:11:31 - INFO - codeparrot_training - Skipping example with length 145 (seq_length=1024) +03/05/2022 02:11:33 - INFO - codeparrot_training - Step 31250: {'lr': 0.00045334038582449355, 'samples': 16000512, 'steps': 31250, 'loss/train': 1.4035993814468384} +03/05/2022 02:11:36 - INFO - codeparrot_training - Step 31251: {'lr': 0.0004533372985348345, 'samples': 16001024, 'steps': 31251, 'loss/train': 2.10274600982666} +03/05/2022 02:11:39 - INFO - codeparrot_training - Skipping example with length 893 (seq_length=1024) +03/05/2022 02:11:41 - INFO - codeparrot_training - Step 31252: {'lr': 0.00045333421115355477, 'samples': 16001536, 'steps': 31252, 'loss/train': 1.3081153631210327} +03/05/2022 02:11:45 - INFO - codeparrot_training - Step 31253: {'lr': 0.00045333112368065585, 'samples': 16002048, 'steps': 31253, 'loss/train': 1.151039719581604} +03/05/2022 02:11:47 - INFO - codeparrot_training - Skipping example with length 773 (seq_length=1024) +03/05/2022 02:11:50 - INFO - codeparrot_training - Step 31254: {'lr': 0.00045332803611613896, 'samples': 16002560, 'steps': 31254, 'loss/train': 1.4762095212936401} +03/05/2022 02:11:53 - INFO - codeparrot_training - Step 31255: {'lr': 0.00045332494846000564, 'samples': 16003072, 'steps': 31255, 'loss/train': 0.829897403717041} +03/05/2022 02:11:56 - INFO - codeparrot_training - Skipping example with length 1011 (seq_length=1024) +03/05/2022 02:11:58 - INFO - codeparrot_training - Step 31256: {'lr': 0.00045332186071225724, 'samples': 16003584, 'steps': 31256, 'loss/train': 1.4992725849151611} +03/05/2022 02:12:02 - INFO - codeparrot_training - Step 31257: {'lr': 0.00045331877287289516, 'samples': 16004096, 'steps': 31257, 'loss/train': 1.9860498905181885} +03/05/2022 02:12:04 - INFO - codeparrot_training - Skipping example with length 869 (seq_length=1024) +03/05/2022 02:12:07 - INFO - codeparrot_training - Step 31258: {'lr': 0.00045331568494192076, 'samples': 16004608, 'steps': 31258, 'loss/train': 1.2602415084838867} +03/05/2022 02:12:10 - INFO - codeparrot_training - Step 31259: {'lr': 0.00045331259691933545, 'samples': 16005120, 'steps': 31259, 'loss/train': 1.5225762128829956} +03/05/2022 02:12:12 - INFO - codeparrot_training - Skipping example with length 314 (seq_length=1024) +03/05/2022 02:12:15 - INFO - codeparrot_training - Step 31260: {'lr': 0.00045330950880514065, 'samples': 16005632, 'steps': 31260, 'loss/train': 1.94674551486969} +03/05/2022 02:12:18 - INFO - codeparrot_training - Step 31261: {'lr': 0.0004533064205993377, 'samples': 16006144, 'steps': 31261, 'loss/train': 2.097560167312622} +03/05/2022 02:12:20 - INFO - codeparrot_training - Skipping example with length 944 (seq_length=1024) +03/05/2022 02:12:24 - INFO - codeparrot_training - Step 31262: {'lr': 0.000453303332301928, 'samples': 16006656, 'steps': 31262, 'loss/train': 1.7939579486846924} +03/05/2022 02:12:27 - INFO - codeparrot_training - Step 31263: {'lr': 0.00045330024391291294, 'samples': 16007168, 'steps': 31263, 'loss/train': 1.6667006015777588} +03/05/2022 02:12:29 - INFO - codeparrot_training - Skipping example with length 603 (seq_length=1024) +03/05/2022 02:12:32 - INFO - codeparrot_training - Step 31264: {'lr': 0.00045329715543229396, 'samples': 16007680, 'steps': 31264, 'loss/train': 1.5476551055908203} +03/05/2022 02:12:35 - INFO - codeparrot_training - Step 31265: {'lr': 0.0004532940668600724, 'samples': 16008192, 'steps': 31265, 'loss/train': 2.3178257942199707} +03/05/2022 02:12:37 - INFO - codeparrot_training - Skipping example with length 877 (seq_length=1024) +03/05/2022 02:12:40 - INFO - codeparrot_training - Step 31266: {'lr': 0.00045329097819624966, 'samples': 16008704, 'steps': 31266, 'loss/train': 1.9833815097808838} +03/05/2022 02:12:44 - INFO - codeparrot_training - Step 31267: {'lr': 0.00045328788944082717, 'samples': 16009216, 'steps': 31267, 'loss/train': 1.0968315601348877} +03/05/2022 02:12:45 - INFO - codeparrot_training - Skipping example with length 363 (seq_length=1024) +03/05/2022 02:12:49 - INFO - codeparrot_training - Step 31268: {'lr': 0.0004532848005938063, 'samples': 16009728, 'steps': 31268, 'loss/train': 0.5411005616188049} +03/05/2022 02:12:52 - INFO - codeparrot_training - Step 31269: {'lr': 0.0004532817116551884, 'samples': 16010240, 'steps': 31269, 'loss/train': 0.9187597632408142} +03/05/2022 02:12:54 - INFO - codeparrot_training - Skipping example with length 841 (seq_length=1024) +03/05/2022 02:12:57 - INFO - codeparrot_training - Step 31270: {'lr': 0.00045327862262497495, 'samples': 16010752, 'steps': 31270, 'loss/train': 1.0253801345825195} +03/05/2022 02:13:01 - INFO - codeparrot_training - Step 31271: {'lr': 0.00045327553350316726, 'samples': 16011264, 'steps': 31271, 'loss/train': 0.2541907727718353} +03/05/2022 02:13:02 - INFO - codeparrot_training - Skipping example with length 79 (seq_length=1024) +03/05/2022 02:13:06 - INFO - codeparrot_training - Step 31272: {'lr': 0.00045327244428976677, 'samples': 16011776, 'steps': 31272, 'loss/train': 0.7192752361297607} +03/05/2022 02:13:09 - INFO - codeparrot_training - Step 31273: {'lr': 0.00045326935498477477, 'samples': 16012288, 'steps': 31273, 'loss/train': 1.8638173341751099} +03/05/2022 02:13:11 - INFO - codeparrot_training - Skipping example with length 500 (seq_length=1024) +03/05/2022 02:13:14 - INFO - codeparrot_training - Step 31274: {'lr': 0.00045326626558819284, 'samples': 16012800, 'steps': 31274, 'loss/train': 2.1817362308502197} +03/05/2022 02:13:18 - INFO - codeparrot_training - Step 31275: {'lr': 0.00045326317610002223, 'samples': 16013312, 'steps': 31275, 'loss/train': 1.6549276113510132} +03/05/2022 02:13:20 - INFO - codeparrot_training - Skipping example with length 230 (seq_length=1024) +03/05/2022 02:13:23 - INFO - codeparrot_training - Step 31276: {'lr': 0.00045326008652026435, 'samples': 16013824, 'steps': 31276, 'loss/train': 1.3947818279266357} +03/05/2022 02:13:26 - INFO - codeparrot_training - Step 31277: {'lr': 0.00045325699684892065, 'samples': 16014336, 'steps': 31277, 'loss/train': 2.360452651977539} +03/05/2022 02:13:28 - INFO - codeparrot_training - Skipping example with length 655 (seq_length=1024) +03/05/2022 02:13:31 - INFO - codeparrot_training - Step 31278: {'lr': 0.00045325390708599245, 'samples': 16014848, 'steps': 31278, 'loss/train': 1.9629563093185425} +03/05/2022 02:13:35 - INFO - codeparrot_training - Step 31279: {'lr': 0.0004532508172314812, 'samples': 16015360, 'steps': 31279, 'loss/train': 1.4060941934585571} +03/05/2022 02:13:37 - INFO - codeparrot_training - Skipping example with length 887 (seq_length=1024) +03/05/2022 02:13:40 - INFO - codeparrot_training - Step 31280: {'lr': 0.0004532477272853882, 'samples': 16015872, 'steps': 31280, 'loss/train': 1.2763826847076416} +03/05/2022 02:13:43 - INFO - codeparrot_training - Step 31281: {'lr': 0.000453244637247715, 'samples': 16016384, 'steps': 31281, 'loss/train': 1.9019306898117065} +03/05/2022 02:13:46 - INFO - codeparrot_training - Step 31282: {'lr': 0.0004532415471184629, 'samples': 16016896, 'steps': 31282, 'loss/train': 1.9329885244369507} +03/05/2022 02:13:46 - INFO - codeparrot_training - Skipping example with length 520 (seq_length=1024) +03/05/2022 02:13:52 - INFO - codeparrot_training - Step 31283: {'lr': 0.0004532384568976332, 'samples': 16017408, 'steps': 31283, 'loss/train': 1.425925850868225} +03/05/2022 02:13:54 - INFO - codeparrot_training - Skipping example with length 581 (seq_length=1024) +03/05/2022 02:13:57 - INFO - codeparrot_training - Step 31284: {'lr': 0.00045323536658522747, 'samples': 16017920, 'steps': 31284, 'loss/train': 1.7288312911987305} +03/05/2022 02:14:00 - INFO - codeparrot_training - Step 31285: {'lr': 0.00045323227618124695, 'samples': 16018432, 'steps': 31285, 'loss/train': 1.0297415256500244} +03/05/2022 02:14:03 - INFO - codeparrot_training - Skipping example with length 231 (seq_length=1024) +03/05/2022 02:14:05 - INFO - codeparrot_training - Step 31286: {'lr': 0.00045322918568569315, 'samples': 16018944, 'steps': 31286, 'loss/train': 1.5664710998535156} +03/05/2022 02:14:09 - INFO - codeparrot_training - Step 31287: {'lr': 0.0004532260950985675, 'samples': 16019456, 'steps': 31287, 'loss/train': 2.3907506465911865} +03/05/2022 02:14:12 - INFO - codeparrot_training - Step 31288: {'lr': 0.0004532230044198712, 'samples': 16019968, 'steps': 31288, 'loss/train': 2.0103282928466797} +03/05/2022 02:14:12 - INFO - codeparrot_training - Skipping example with length 873 (seq_length=1024) +03/05/2022 02:14:17 - INFO - codeparrot_training - Step 31289: {'lr': 0.00045321991364960577, 'samples': 16020480, 'steps': 31289, 'loss/train': 1.5371465682983398} +03/05/2022 02:14:20 - INFO - codeparrot_training - Skipping example with length 364 (seq_length=1024) +03/05/2022 02:14:23 - INFO - codeparrot_training - Step 31290: {'lr': 0.00045321682278777253, 'samples': 16020992, 'steps': 31290, 'loss/train': 2.0595197677612305} +03/05/2022 02:14:26 - INFO - codeparrot_training - Step 31291: {'lr': 0.00045321373183437305, 'samples': 16021504, 'steps': 31291, 'loss/train': 2.4261631965637207} +03/05/2022 02:14:29 - INFO - codeparrot_training - Step 31292: {'lr': 0.0004532106407894085, 'samples': 16022016, 'steps': 31292, 'loss/train': 2.2770328521728516} +03/05/2022 02:14:29 - INFO - codeparrot_training - Skipping example with length 900 (seq_length=1024) +03/05/2022 02:14:34 - INFO - codeparrot_training - Step 31293: {'lr': 0.0004532075496528804, 'samples': 16022528, 'steps': 31293, 'loss/train': 1.899196982383728} +03/05/2022 02:14:37 - INFO - codeparrot_training - Step 31294: {'lr': 0.0004532044584247901, 'samples': 16023040, 'steps': 31294, 'loss/train': 1.940315842628479} +03/05/2022 02:14:37 - INFO - codeparrot_training - Skipping example with length 952 (seq_length=1024) +03/05/2022 02:14:43 - INFO - codeparrot_training - Step 31295: {'lr': 0.00045320136710513907, 'samples': 16023552, 'steps': 31295, 'loss/train': 2.3629398345947266} +03/05/2022 02:14:46 - INFO - codeparrot_training - Step 31296: {'lr': 0.00045319827569392855, 'samples': 16024064, 'steps': 31296, 'loss/train': 2.0255892276763916} +03/05/2022 02:14:46 - INFO - codeparrot_training - Skipping example with length 722 (seq_length=1024) +03/05/2022 02:14:51 - INFO - codeparrot_training - Step 31297: {'lr': 0.00045319518419116014, 'samples': 16024576, 'steps': 31297, 'loss/train': 2.358577251434326} +03/05/2022 02:14:55 - INFO - codeparrot_training - Step 31298: {'lr': 0.00045319209259683503, 'samples': 16025088, 'steps': 31298, 'loss/train': 2.255451202392578} +03/05/2022 02:14:55 - INFO - codeparrot_training - Skipping example with length 713 (seq_length=1024) +03/05/2022 02:15:00 - INFO - codeparrot_training - Step 31299: {'lr': 0.0004531890009109547, 'samples': 16025600, 'steps': 31299, 'loss/train': 1.9258549213409424} +03/05/2022 02:15:03 - INFO - codeparrot_training - Step 31300: {'lr': 0.0004531859091335205, 'samples': 16026112, 'steps': 31300, 'loss/train': 1.7282050848007202} +03/05/2022 02:15:03 - INFO - codeparrot_training - Skipping example with length 742 (seq_length=1024) +03/05/2022 02:15:08 - INFO - codeparrot_training - Step 31301: {'lr': 0.00045318281726453393, 'samples': 16026624, 'steps': 31301, 'loss/train': 1.7986574172973633} +03/05/2022 02:15:11 - INFO - codeparrot_training - Step 31302: {'lr': 0.00045317972530399634, 'samples': 16027136, 'steps': 31302, 'loss/train': 3.4930503368377686} +03/05/2022 02:15:11 - INFO - codeparrot_training - Skipping example with length 816 (seq_length=1024) +03/05/2022 02:15:17 - INFO - codeparrot_training - Step 31303: {'lr': 0.00045317663325190904, 'samples': 16027648, 'steps': 31303, 'loss/train': 1.911583423614502} +03/05/2022 02:15:20 - INFO - codeparrot_training - Skipping example with length 934 (seq_length=1024) +03/05/2022 02:15:22 - INFO - codeparrot_training - Step 31304: {'lr': 0.00045317354110827344, 'samples': 16028160, 'steps': 31304, 'loss/train': 1.2248088121414185} +03/05/2022 02:15:25 - INFO - codeparrot_training - Step 31305: {'lr': 0.0004531704488730911, 'samples': 16028672, 'steps': 31305, 'loss/train': 0.12408903241157532} +03/05/2022 02:15:28 - INFO - codeparrot_training - Skipping example with length 14 (seq_length=1024) +03/05/2022 02:15:30 - INFO - codeparrot_training - Step 31306: {'lr': 0.0004531673565463632, 'samples': 16029184, 'steps': 31306, 'loss/train': 1.8158921003341675} +03/05/2022 02:15:34 - INFO - codeparrot_training - Step 31307: {'lr': 0.0004531642641280913, 'samples': 16029696, 'steps': 31307, 'loss/train': 0.13636095821857452} +03/05/2022 02:15:37 - INFO - codeparrot_training - Skipping example with length 299 (seq_length=1024) +03/05/2022 02:15:39 - INFO - codeparrot_training - Step 31308: {'lr': 0.0004531611716182767, 'samples': 16030208, 'steps': 31308, 'loss/train': 2.266716957092285} +03/05/2022 02:15:42 - INFO - codeparrot_training - Step 31309: {'lr': 0.0004531580790169207, 'samples': 16030720, 'steps': 31309, 'loss/train': 1.81352961063385} +03/05/2022 02:15:45 - INFO - codeparrot_training - Skipping example with length 302 (seq_length=1024) +03/05/2022 02:15:47 - INFO - codeparrot_training - Step 31310: {'lr': 0.00045315498632402494, 'samples': 16031232, 'steps': 31310, 'loss/train': 0.7700819373130798} +03/05/2022 02:15:51 - INFO - codeparrot_training - Step 31311: {'lr': 0.0004531518935395906, 'samples': 16031744, 'steps': 31311, 'loss/train': 1.8370335102081299} +03/05/2022 02:15:53 - INFO - codeparrot_training - Skipping example with length 864 (seq_length=1024) +03/05/2022 02:15:56 - INFO - codeparrot_training - Step 31312: {'lr': 0.00045314880066361923, 'samples': 16032256, 'steps': 31312, 'loss/train': 1.4086246490478516} +03/05/2022 02:15:59 - INFO - codeparrot_training - Step 31313: {'lr': 0.00045314570769611207, 'samples': 16032768, 'steps': 31313, 'loss/train': 1.8708747625350952} +03/05/2022 02:16:02 - INFO - codeparrot_training - Skipping example with length 324 (seq_length=1024) +03/05/2022 02:16:04 - INFO - codeparrot_training - Step 31314: {'lr': 0.00045314261463707064, 'samples': 16033280, 'steps': 31314, 'loss/train': 2.1223835945129395} +03/05/2022 02:16:07 - INFO - codeparrot_training - Step 31315: {'lr': 0.00045313952148649626, 'samples': 16033792, 'steps': 31315, 'loss/train': 1.892887830734253} +03/05/2022 02:16:10 - INFO - codeparrot_training - Skipping example with length 315 (seq_length=1024) +03/05/2022 02:16:13 - INFO - codeparrot_training - Step 31316: {'lr': 0.0004531364282443904, 'samples': 16034304, 'steps': 31316, 'loss/train': 1.6936484575271606} +03/05/2022 02:16:16 - INFO - codeparrot_training - Step 31317: {'lr': 0.00045313333491075433, 'samples': 16034816, 'steps': 31317, 'loss/train': 1.6351993083953857} +03/05/2022 02:16:18 - INFO - codeparrot_training - Skipping example with length 686 (seq_length=1024) +03/05/2022 02:16:21 - INFO - codeparrot_training - Step 31318: {'lr': 0.0004531302414855895, 'samples': 16035328, 'steps': 31318, 'loss/train': 0.8834212422370911} +03/05/2022 02:16:24 - INFO - codeparrot_training - Step 31319: {'lr': 0.0004531271479688974, 'samples': 16035840, 'steps': 31319, 'loss/train': 1.852533221244812} +03/05/2022 02:16:27 - INFO - codeparrot_training - Skipping example with length 871 (seq_length=1024) +03/05/2022 02:16:29 - INFO - codeparrot_training - Step 31320: {'lr': 0.00045312405436067927, 'samples': 16036352, 'steps': 31320, 'loss/train': 1.9280599355697632} +03/05/2022 02:16:33 - INFO - codeparrot_training - Step 31321: {'lr': 0.00045312096066093654, 'samples': 16036864, 'steps': 31321, 'loss/train': 1.5642390251159668} +03/05/2022 02:16:35 - INFO - codeparrot_training - Skipping example with length 733 (seq_length=1024) +03/05/2022 02:16:38 - INFO - codeparrot_training - Step 31322: {'lr': 0.0004531178668696707, 'samples': 16037376, 'steps': 31322, 'loss/train': 2.000910758972168} +03/05/2022 02:16:41 - INFO - codeparrot_training - Step 31323: {'lr': 0.00045311477298688306, 'samples': 16037888, 'steps': 31323, 'loss/train': 0.7024642825126648} +03/05/2022 02:16:43 - INFO - codeparrot_training - Skipping example with length 383 (seq_length=1024) +03/05/2022 02:16:46 - INFO - codeparrot_training - Step 31324: {'lr': 0.0004531116790125751, 'samples': 16038400, 'steps': 31324, 'loss/train': 1.7582299709320068} +03/05/2022 02:16:50 - INFO - codeparrot_training - Step 31325: {'lr': 0.00045310858494674813, 'samples': 16038912, 'steps': 31325, 'loss/train': 0.2537677586078644} +03/05/2022 02:16:51 - INFO - codeparrot_training - Skipping example with length 9 (seq_length=1024) +03/05/2022 02:16:55 - INFO - codeparrot_training - Step 31326: {'lr': 0.00045310549078940356, 'samples': 16039424, 'steps': 31326, 'loss/train': 1.4679514169692993} +03/05/2022 02:16:58 - INFO - codeparrot_training - Step 31327: {'lr': 0.00045310239654054274, 'samples': 16039936, 'steps': 31327, 'loss/train': 2.0579328536987305} +03/05/2022 02:17:00 - INFO - codeparrot_training - Skipping example with length 874 (seq_length=1024) +03/05/2022 02:17:03 - INFO - codeparrot_training - Step 31328: {'lr': 0.0004530993022001672, 'samples': 16040448, 'steps': 31328, 'loss/train': 2.586130380630493} +03/05/2022 02:17:06 - INFO - codeparrot_training - Step 31329: {'lr': 0.00045309620776827817, 'samples': 16040960, 'steps': 31329, 'loss/train': 1.7450212240219116} +03/05/2022 02:17:08 - INFO - codeparrot_training - Skipping example with length 425 (seq_length=1024) +03/05/2022 02:17:12 - INFO - codeparrot_training - Step 31330: {'lr': 0.00045309311324487713, 'samples': 16041472, 'steps': 31330, 'loss/train': 2.352889060974121} +03/05/2022 02:17:15 - INFO - codeparrot_training - Step 31331: {'lr': 0.0004530900186299655, 'samples': 16041984, 'steps': 31331, 'loss/train': 2.0452089309692383} +03/05/2022 02:17:17 - INFO - codeparrot_training - Skipping example with length 672 (seq_length=1024) +03/05/2022 02:17:20 - INFO - codeparrot_training - Step 31332: {'lr': 0.0004530869239235446, 'samples': 16042496, 'steps': 31332, 'loss/train': 1.4178394079208374} +03/05/2022 02:17:23 - INFO - codeparrot_training - Step 31333: {'lr': 0.0004530838291256159, 'samples': 16043008, 'steps': 31333, 'loss/train': 1.6011756658554077} +03/05/2022 02:17:25 - INFO - codeparrot_training - Skipping example with length 113 (seq_length=1024) +03/05/2022 02:17:28 - INFO - codeparrot_training - Step 31334: {'lr': 0.0004530807342361807, 'samples': 16043520, 'steps': 31334, 'loss/train': 1.2463372945785522} +03/05/2022 02:17:32 - INFO - codeparrot_training - Step 31335: {'lr': 0.0004530776392552406, 'samples': 16044032, 'steps': 31335, 'loss/train': 0.9086995720863342} +03/05/2022 02:17:33 - INFO - codeparrot_training - Skipping example with length 382 (seq_length=1024) +03/05/2022 02:17:37 - INFO - codeparrot_training - Step 31336: {'lr': 0.0004530745441827967, 'samples': 16044544, 'steps': 31336, 'loss/train': 1.0100091695785522} +03/05/2022 02:17:40 - INFO - codeparrot_training - Step 31337: {'lr': 0.0004530714490188506, 'samples': 16045056, 'steps': 31337, 'loss/train': 1.6336041688919067} +03/05/2022 02:17:42 - INFO - codeparrot_training - Skipping example with length 295 (seq_length=1024) +03/05/2022 02:17:45 - INFO - codeparrot_training - Step 31338: {'lr': 0.00045306835376340366, 'samples': 16045568, 'steps': 31338, 'loss/train': 2.1312601566314697} +03/05/2022 02:17:48 - INFO - codeparrot_training - Step 31339: {'lr': 0.00045306525841645723, 'samples': 16046080, 'steps': 31339, 'loss/train': 1.2842655181884766} +03/05/2022 02:17:50 - INFO - codeparrot_training - Skipping example with length 986 (seq_length=1024) +03/05/2022 02:17:54 - INFO - codeparrot_training - Step 31340: {'lr': 0.0004530621629780127, 'samples': 16046592, 'steps': 31340, 'loss/train': 1.949377417564392} +03/05/2022 02:17:57 - INFO - codeparrot_training - Step 31341: {'lr': 0.00045305906744807156, 'samples': 16047104, 'steps': 31341, 'loss/train': 1.6233694553375244} +03/05/2022 02:17:59 - INFO - codeparrot_training - Skipping example with length 540 (seq_length=1024) +03/05/2022 02:18:02 - INFO - codeparrot_training - Step 31342: {'lr': 0.0004530559718266351, 'samples': 16047616, 'steps': 31342, 'loss/train': 1.977818489074707} +03/05/2022 02:18:06 - INFO - codeparrot_training - Step 31343: {'lr': 0.0004530528761137047, 'samples': 16048128, 'steps': 31343, 'loss/train': 1.9165534973144531} +03/05/2022 02:18:08 - INFO - codeparrot_training - Skipping example with length 909 (seq_length=1024) +03/05/2022 02:18:11 - INFO - codeparrot_training - Step 31344: {'lr': 0.0004530497803092819, 'samples': 16048640, 'steps': 31344, 'loss/train': 0.1004122644662857} +03/05/2022 02:18:14 - INFO - codeparrot_training - Step 31345: {'lr': 0.000453046684413368, 'samples': 16049152, 'steps': 31345, 'loss/train': 1.3429678678512573} +03/05/2022 02:18:16 - INFO - codeparrot_training - Skipping example with length 349 (seq_length=1024) +03/05/2022 02:18:19 - INFO - codeparrot_training - Step 31346: {'lr': 0.0004530435884259644, 'samples': 16049664, 'steps': 31346, 'loss/train': 1.2767664194107056} +03/05/2022 02:18:22 - INFO - codeparrot_training - Step 31347: {'lr': 0.0004530404923470724, 'samples': 16050176, 'steps': 31347, 'loss/train': 1.4328128099441528} +03/05/2022 02:18:24 - INFO - codeparrot_training - Skipping example with length 144 (seq_length=1024) +03/05/2022 02:18:28 - INFO - codeparrot_training - Step 31348: {'lr': 0.0004530373961766935, 'samples': 16050688, 'steps': 31348, 'loss/train': 2.261796236038208} +03/05/2022 02:18:31 - INFO - codeparrot_training - Step 31349: {'lr': 0.00045303429991482914, 'samples': 16051200, 'steps': 31349, 'loss/train': 1.5826224088668823} +03/05/2022 02:18:33 - INFO - codeparrot_training - Skipping example with length 922 (seq_length=1024) +03/05/2022 02:18:36 - INFO - codeparrot_training - Step 31350: {'lr': 0.00045303120356148067, 'samples': 16051712, 'steps': 31350, 'loss/train': 1.5257384777069092} +03/05/2022 02:18:39 - INFO - codeparrot_training - Step 31351: {'lr': 0.00045302810711664944, 'samples': 16052224, 'steps': 31351, 'loss/train': 2.089235544204712} +03/05/2022 02:18:41 - INFO - codeparrot_training - Skipping example with length 739 (seq_length=1024) +03/05/2022 02:18:44 - INFO - codeparrot_training - Step 31352: {'lr': 0.00045302501058033687, 'samples': 16052736, 'steps': 31352, 'loss/train': 1.0850471258163452} +03/05/2022 02:18:48 - INFO - codeparrot_training - Step 31353: {'lr': 0.0004530219139525444, 'samples': 16053248, 'steps': 31353, 'loss/train': 1.3114135265350342} +03/05/2022 02:18:49 - INFO - codeparrot_training - Skipping example with length 291 (seq_length=1024) +03/05/2022 02:18:53 - INFO - codeparrot_training - Step 31354: {'lr': 0.0004530188172332733, 'samples': 16053760, 'steps': 31354, 'loss/train': 1.7622098922729492} +03/05/2022 02:18:56 - INFO - codeparrot_training - Step 31355: {'lr': 0.00045301572042252516, 'samples': 16054272, 'steps': 31355, 'loss/train': 1.7171176671981812} +03/05/2022 02:18:58 - INFO - codeparrot_training - Skipping example with length 991 (seq_length=1024) +03/05/2022 02:19:01 - INFO - codeparrot_training - Step 31356: {'lr': 0.00045301262352030123, 'samples': 16054784, 'steps': 31356, 'loss/train': 1.5141102075576782} +03/05/2022 02:19:05 - INFO - codeparrot_training - Step 31357: {'lr': 0.00045300952652660296, 'samples': 16055296, 'steps': 31357, 'loss/train': 2.0707833766937256} +03/05/2022 02:19:06 - INFO - codeparrot_training - Skipping example with length 804 (seq_length=1024) +03/05/2022 02:19:10 - INFO - codeparrot_training - Step 31358: {'lr': 0.0004530064294414317, 'samples': 16055808, 'steps': 31358, 'loss/train': 0.7106841802597046} +03/05/2022 02:19:13 - INFO - codeparrot_training - Step 31359: {'lr': 0.00045300333226478887, 'samples': 16056320, 'steps': 31359, 'loss/train': 1.8802953958511353} +03/05/2022 02:19:16 - INFO - codeparrot_training - Skipping example with length 890 (seq_length=1024) +03/05/2022 02:19:18 - INFO - codeparrot_training - Step 31360: {'lr': 0.0004530002349966759, 'samples': 16056832, 'steps': 31360, 'loss/train': 1.8785624504089355} +03/05/2022 02:19:22 - INFO - codeparrot_training - Step 31361: {'lr': 0.0004529971376370941, 'samples': 16057344, 'steps': 31361, 'loss/train': 1.9405207633972168} +03/05/2022 02:19:25 - INFO - codeparrot_training - Step 31362: {'lr': 0.00045299404018604494, 'samples': 16057856, 'steps': 31362, 'loss/train': 2.0269734859466553} +03/05/2022 02:19:25 - INFO - codeparrot_training - Skipping example with length 207 (seq_length=1024) +03/05/2022 02:19:30 - INFO - codeparrot_training - Step 31363: {'lr': 0.00045299094264352987, 'samples': 16058368, 'steps': 31363, 'loss/train': 1.0510669946670532} +03/05/2022 02:19:33 - INFO - codeparrot_training - Skipping example with length 981 (seq_length=1024) +03/05/2022 02:19:35 - INFO - codeparrot_training - Step 31364: {'lr': 0.00045298784500955014, 'samples': 16058880, 'steps': 31364, 'loss/train': 1.7317931652069092} +03/05/2022 02:19:39 - INFO - codeparrot_training - Step 31365: {'lr': 0.0004529847472841073, 'samples': 16059392, 'steps': 31365, 'loss/train': 1.490064024925232} +03/05/2022 02:19:41 - INFO - codeparrot_training - Skipping example with length 799 (seq_length=1024) +03/05/2022 02:19:44 - INFO - codeparrot_training - Step 31366: {'lr': 0.00045298164946720254, 'samples': 16059904, 'steps': 31366, 'loss/train': 1.401496410369873} +03/05/2022 02:19:47 - INFO - codeparrot_training - Step 31367: {'lr': 0.0004529785515588375, 'samples': 16060416, 'steps': 31367, 'loss/train': 0.9100533723831177} +03/05/2022 02:19:50 - INFO - codeparrot_training - Skipping example with length 801 (seq_length=1024) +03/05/2022 02:19:52 - INFO - codeparrot_training - Step 31368: {'lr': 0.00045297545355901336, 'samples': 16060928, 'steps': 31368, 'loss/train': 1.887742280960083} +03/05/2022 02:19:56 - INFO - codeparrot_training - Step 31369: {'lr': 0.00045297235546773175, 'samples': 16061440, 'steps': 31369, 'loss/train': 1.6553266048431396} +03/05/2022 02:19:58 - INFO - codeparrot_training - Skipping example with length 405 (seq_length=1024) +03/05/2022 02:20:01 - INFO - codeparrot_training - Step 31370: {'lr': 0.0004529692572849938, 'samples': 16061952, 'steps': 31370, 'loss/train': 2.5361480712890625} +03/05/2022 02:20:04 - INFO - codeparrot_training - Step 31371: {'lr': 0.00045296615901080107, 'samples': 16062464, 'steps': 31371, 'loss/train': 1.845834493637085} +03/05/2022 02:20:07 - INFO - codeparrot_training - Step 31372: {'lr': 0.00045296306064515493, 'samples': 16062976, 'steps': 31372, 'loss/train': 1.5230488777160645} +03/05/2022 02:20:07 - INFO - codeparrot_training - Skipping example with length 335 (seq_length=1024) +03/05/2022 02:20:13 - INFO - codeparrot_training - Step 31373: {'lr': 0.0004529599621880567, 'samples': 16063488, 'steps': 31373, 'loss/train': 1.9418060779571533} +03/05/2022 02:20:15 - INFO - codeparrot_training - Skipping example with length 108 (seq_length=1024) +03/05/2022 02:20:18 - INFO - codeparrot_training - Step 31374: {'lr': 0.00045295686363950796, 'samples': 16064000, 'steps': 31374, 'loss/train': 1.7991875410079956} +03/05/2022 02:20:21 - INFO - codeparrot_training - Step 31375: {'lr': 0.0004529537649995099, 'samples': 16064512, 'steps': 31375, 'loss/train': 1.326756477355957} +03/05/2022 02:20:24 - INFO - codeparrot_training - Skipping example with length 136 (seq_length=1024) +03/05/2022 02:20:26 - INFO - codeparrot_training - Step 31376: {'lr': 0.0004529506662680641, 'samples': 16065024, 'steps': 31376, 'loss/train': 2.5800676345825195} +03/05/2022 02:20:29 - INFO - codeparrot_training - Step 31377: {'lr': 0.00045294756744517173, 'samples': 16065536, 'steps': 31377, 'loss/train': 2.0321543216705322} +03/05/2022 02:20:32 - INFO - codeparrot_training - Skipping example with length 215 (seq_length=1024) +03/05/2022 02:20:35 - INFO - codeparrot_training - Step 31378: {'lr': 0.00045294446853083446, 'samples': 16066048, 'steps': 31378, 'loss/train': 1.50870680809021} +03/05/2022 02:20:38 - INFO - codeparrot_training - Step 31379: {'lr': 0.00045294136952505346, 'samples': 16066560, 'steps': 31379, 'loss/train': 0.0714663416147232} +03/05/2022 02:20:41 - INFO - codeparrot_training - Skipping example with length 74 (seq_length=1024) +03/05/2022 02:20:43 - INFO - codeparrot_training - Step 31380: {'lr': 0.0004529382704278302, 'samples': 16067072, 'steps': 31380, 'loss/train': 1.7470999956130981} +03/05/2022 02:20:46 - INFO - codeparrot_training - Step 31381: {'lr': 0.0004529351712391661, 'samples': 16067584, 'steps': 31381, 'loss/train': 1.7038586139678955} +03/05/2022 02:20:49 - INFO - codeparrot_training - Skipping example with length 561 (seq_length=1024) +03/05/2022 02:20:52 - INFO - codeparrot_training - Step 31382: {'lr': 0.0004529320719590626, 'samples': 16068096, 'steps': 31382, 'loss/train': 1.7704042196273804} +03/05/2022 02:20:55 - INFO - codeparrot_training - Step 31383: {'lr': 0.00045292897258752095, 'samples': 16068608, 'steps': 31383, 'loss/train': 1.6985880136489868} +03/05/2022 02:20:58 - INFO - codeparrot_training - Skipping example with length 931 (seq_length=1024) +03/05/2022 02:21:00 - INFO - codeparrot_training - Step 31384: {'lr': 0.0004529258731245427, 'samples': 16069120, 'steps': 31384, 'loss/train': 1.2498353719711304} +03/05/2022 02:21:03 - INFO - codeparrot_training - Step 31385: {'lr': 0.0004529227735701291, 'samples': 16069632, 'steps': 31385, 'loss/train': 1.8348861932754517} +03/05/2022 02:21:06 - INFO - codeparrot_training - Skipping example with length 687 (seq_length=1024) +03/05/2022 02:21:08 - INFO - codeparrot_training - Step 31386: {'lr': 0.00045291967392428175, 'samples': 16070144, 'steps': 31386, 'loss/train': 1.1844439506530762} +03/05/2022 02:21:12 - INFO - codeparrot_training - Step 31387: {'lr': 0.0004529165741870018, 'samples': 16070656, 'steps': 31387, 'loss/train': 0.6403480768203735} +03/05/2022 02:21:14 - INFO - codeparrot_training - Skipping example with length 421 (seq_length=1024) +03/05/2022 02:21:17 - INFO - codeparrot_training - Step 31388: {'lr': 0.00045291347435829087, 'samples': 16071168, 'steps': 31388, 'loss/train': 1.7669285535812378} +03/05/2022 02:21:20 - INFO - codeparrot_training - Step 31389: {'lr': 0.0004529103744381503, 'samples': 16071680, 'steps': 31389, 'loss/train': 1.2361047267913818} +03/05/2022 02:21:22 - INFO - codeparrot_training - Skipping example with length 710 (seq_length=1024) +03/05/2022 02:21:25 - INFO - codeparrot_training - Step 31390: {'lr': 0.0004529072744265813, 'samples': 16072192, 'steps': 31390, 'loss/train': 2.1734917163848877} +03/05/2022 02:21:28 - INFO - codeparrot_training - Step 31391: {'lr': 0.00045290417432358553, 'samples': 16072704, 'steps': 31391, 'loss/train': 1.6103997230529785} +03/05/2022 02:21:31 - INFO - codeparrot_training - Skipping example with length 645 (seq_length=1024) +03/05/2022 02:21:34 - INFO - codeparrot_training - Step 31392: {'lr': 0.00045290107412916425, 'samples': 16073216, 'steps': 31392, 'loss/train': 1.0613278150558472} +03/05/2022 02:21:37 - INFO - codeparrot_training - Step 31393: {'lr': 0.0004528979738433189, 'samples': 16073728, 'steps': 31393, 'loss/train': 1.2625161409378052} +03/05/2022 02:21:39 - INFO - codeparrot_training - Skipping example with length 773 (seq_length=1024) +03/05/2022 02:21:42 - INFO - codeparrot_training - Step 31394: {'lr': 0.00045289487346605075, 'samples': 16074240, 'steps': 31394, 'loss/train': 1.0009559392929077} +03/05/2022 02:21:45 - INFO - codeparrot_training - Step 31395: {'lr': 0.0004528917729973614, 'samples': 16074752, 'steps': 31395, 'loss/train': 1.4855663776397705} +03/05/2022 02:21:48 - INFO - codeparrot_training - Skipping example with length 813 (seq_length=1024) +03/05/2022 02:21:51 - INFO - codeparrot_training - Step 31396: {'lr': 0.00045288867243725207, 'samples': 16075264, 'steps': 31396, 'loss/train': 0.6834126710891724} +03/05/2022 02:21:54 - INFO - codeparrot_training - Step 31397: {'lr': 0.00045288557178572433, 'samples': 16075776, 'steps': 31397, 'loss/train': 0.7422385811805725} +03/05/2022 02:21:56 - INFO - codeparrot_training - Skipping example with length 155 (seq_length=1024) +03/05/2022 02:21:59 - INFO - codeparrot_training - Step 31398: {'lr': 0.00045288247104277937, 'samples': 16076288, 'steps': 31398, 'loss/train': 1.700618863105774} +03/05/2022 02:22:02 - INFO - codeparrot_training - Step 31399: {'lr': 0.0004528793702084187, 'samples': 16076800, 'steps': 31399, 'loss/train': 2.016258716583252} +03/05/2022 02:22:04 - INFO - codeparrot_training - Skipping example with length 228 (seq_length=1024) +03/05/2022 02:22:07 - INFO - codeparrot_training - Step 31400: {'lr': 0.0004528762692826439, 'samples': 16077312, 'steps': 31400, 'loss/train': 1.2520030736923218} +03/05/2022 02:22:11 - INFO - codeparrot_training - Step 31401: {'lr': 0.000452873168265456, 'samples': 16077824, 'steps': 31401, 'loss/train': 0.11095746606588364} +03/05/2022 02:22:13 - INFO - codeparrot_training - Skipping example with length 332 (seq_length=1024) +03/05/2022 02:22:16 - INFO - codeparrot_training - Step 31402: {'lr': 0.00045287006715685665, 'samples': 16078336, 'steps': 31402, 'loss/train': 1.6106799840927124} +03/05/2022 02:22:19 - INFO - codeparrot_training - Step 31403: {'lr': 0.0004528669659568472, 'samples': 16078848, 'steps': 31403, 'loss/train': 1.9911088943481445} +03/05/2022 02:22:21 - INFO - codeparrot_training - Skipping example with length 771 (seq_length=1024) +03/05/2022 02:22:24 - INFO - codeparrot_training - Step 31404: {'lr': 0.00045286386466542896, 'samples': 16079360, 'steps': 31404, 'loss/train': 1.654862880706787} +03/05/2022 02:22:28 - INFO - codeparrot_training - Step 31405: {'lr': 0.0004528607632826034, 'samples': 16079872, 'steps': 31405, 'loss/train': 1.80656898021698} +03/05/2022 02:22:30 - INFO - codeparrot_training - Skipping example with length 198 (seq_length=1024) +03/05/2022 02:22:33 - INFO - codeparrot_training - Step 31406: {'lr': 0.00045285766180837197, 'samples': 16080384, 'steps': 31406, 'loss/train': 2.141064167022705} +03/05/2022 02:22:36 - INFO - codeparrot_training - Step 31407: {'lr': 0.000452854560242736, 'samples': 16080896, 'steps': 31407, 'loss/train': 2.1619699001312256} +03/05/2022 02:22:39 - INFO - codeparrot_training - Step 31408: {'lr': 0.0004528514585856968, 'samples': 16081408, 'steps': 31408, 'loss/train': 0.9550679326057434} +03/05/2022 02:22:40 - INFO - codeparrot_training - Skipping example with length 336 (seq_length=1024) +03/05/2022 02:22:45 - INFO - codeparrot_training - Step 31409: {'lr': 0.0004528483568372559, 'samples': 16081920, 'steps': 31409, 'loss/train': 1.1090449094772339} +03/05/2022 02:22:48 - INFO - codeparrot_training - Step 31410: {'lr': 0.00045284525499741474, 'samples': 16082432, 'steps': 31410, 'loss/train': 2.4411656856536865} +03/05/2022 02:22:49 - INFO - codeparrot_training - Skipping example with length 967 (seq_length=1024) +03/05/2022 02:22:53 - INFO - codeparrot_training - Step 31411: {'lr': 0.0004528421530661746, 'samples': 16082944, 'steps': 31411, 'loss/train': 1.6110491752624512} +03/05/2022 02:22:56 - INFO - codeparrot_training - Step 31412: {'lr': 0.0004528390510435368, 'samples': 16083456, 'steps': 31412, 'loss/train': 2.5272371768951416} +03/05/2022 02:22:57 - INFO - codeparrot_training - Skipping example with length 768 (seq_length=1024) +03/05/2022 02:23:02 - INFO - codeparrot_training - Step 31413: {'lr': 0.0004528359489295031, 'samples': 16083968, 'steps': 31413, 'loss/train': 2.122628688812256} +03/05/2022 02:23:05 - INFO - codeparrot_training - Step 31414: {'lr': 0.00045283284672407444, 'samples': 16084480, 'steps': 31414, 'loss/train': 1.2907477617263794} +03/05/2022 02:23:05 - INFO - codeparrot_training - Skipping example with length 747 (seq_length=1024) +03/05/2022 02:23:10 - INFO - codeparrot_training - Step 31415: {'lr': 0.0004528297444272525, 'samples': 16084992, 'steps': 31415, 'loss/train': 2.3552942276000977} +03/05/2022 02:23:13 - INFO - codeparrot_training - Step 31416: {'lr': 0.0004528266420390386, 'samples': 16085504, 'steps': 31416, 'loss/train': 1.0455079078674316} +03/05/2022 02:23:14 - INFO - codeparrot_training - Skipping example with length 34 (seq_length=1024) +03/05/2022 02:23:18 - INFO - codeparrot_training - Step 31417: {'lr': 0.00045282353955943417, 'samples': 16086016, 'steps': 31417, 'loss/train': 1.358640432357788} +03/05/2022 02:23:22 - INFO - codeparrot_training - Step 31418: {'lr': 0.00045282043698844054, 'samples': 16086528, 'steps': 31418, 'loss/train': 1.064713716506958} +03/05/2022 02:23:22 - INFO - codeparrot_training - Skipping example with length 61 (seq_length=1024) +03/05/2022 02:23:27 - INFO - codeparrot_training - Step 31419: {'lr': 0.0004528173343260592, 'samples': 16087040, 'steps': 31419, 'loss/train': 1.6776224374771118} +03/05/2022 02:23:30 - INFO - codeparrot_training - Step 31420: {'lr': 0.0004528142315722915, 'samples': 16087552, 'steps': 31420, 'loss/train': 1.3401951789855957} +03/05/2022 02:23:30 - INFO - codeparrot_training - Skipping example with length 641 (seq_length=1024) +03/05/2022 02:23:35 - INFO - codeparrot_training - Step 31421: {'lr': 0.0004528111287271388, 'samples': 16088064, 'steps': 31421, 'loss/train': 3.579611301422119} +03/05/2022 02:23:39 - INFO - codeparrot_training - Step 31422: {'lr': 0.00045280802579060253, 'samples': 16088576, 'steps': 31422, 'loss/train': 1.321414589881897} +03/05/2022 02:23:39 - INFO - codeparrot_training - Skipping example with length 412 (seq_length=1024) +03/05/2022 02:23:44 - INFO - codeparrot_training - Step 31423: {'lr': 0.00045280492276268414, 'samples': 16089088, 'steps': 31423, 'loss/train': 1.0094287395477295} +03/05/2022 02:23:47 - INFO - codeparrot_training - Skipping example with length 845 (seq_length=1024) +03/05/2022 02:23:49 - INFO - codeparrot_training - Step 31424: {'lr': 0.0004528018196433849, 'samples': 16089600, 'steps': 31424, 'loss/train': 1.6512426137924194} +03/05/2022 02:23:52 - INFO - codeparrot_training - Step 31425: {'lr': 0.0004527987164327063, 'samples': 16090112, 'steps': 31425, 'loss/train': 0.055026277899742126} +03/05/2022 02:23:55 - INFO - codeparrot_training - Skipping example with length 456 (seq_length=1024) +03/05/2022 02:23:57 - INFO - codeparrot_training - Step 31426: {'lr': 0.0004527956131306498, 'samples': 16090624, 'steps': 31426, 'loss/train': 2.124762773513794} +03/05/2022 02:24:01 - INFO - codeparrot_training - Step 31427: {'lr': 0.0004527925097372168, 'samples': 16091136, 'steps': 31427, 'loss/train': 2.246474027633667} +03/05/2022 02:24:03 - INFO - codeparrot_training - Skipping example with length 846 (seq_length=1024) +03/05/2022 02:24:06 - INFO - codeparrot_training - Step 31428: {'lr': 0.0004527894062524084, 'samples': 16091648, 'steps': 31428, 'loss/train': 2.1902942657470703} +03/05/2022 02:24:09 - INFO - codeparrot_training - Step 31429: {'lr': 0.00045278630267622637, 'samples': 16092160, 'steps': 31429, 'loss/train': 2.8574414253234863} +03/05/2022 02:24:12 - INFO - codeparrot_training - Skipping example with length 765 (seq_length=1024) +03/05/2022 02:24:15 - INFO - codeparrot_training - Step 31430: {'lr': 0.0004527831990086719, 'samples': 16092672, 'steps': 31430, 'loss/train': 1.695055365562439} +03/05/2022 02:24:18 - INFO - codeparrot_training - Step 31431: {'lr': 0.0004527800952497465, 'samples': 16093184, 'steps': 31431, 'loss/train': 5.8778486251831055} +03/05/2022 02:24:21 - INFO - codeparrot_training - Step 31432: {'lr': 0.0004527769913994515, 'samples': 16093696, 'steps': 31432, 'loss/train': 1.026113748550415} +03/05/2022 02:24:22 - INFO - codeparrot_training - Skipping example with length 660 (seq_length=1024) +03/05/2022 02:24:26 - INFO - codeparrot_training - Step 31433: {'lr': 0.00045277388745778836, 'samples': 16094208, 'steps': 31433, 'loss/train': 2.012977123260498} +03/05/2022 02:24:29 - INFO - codeparrot_training - Step 31434: {'lr': 0.00045277078342475835, 'samples': 16094720, 'steps': 31434, 'loss/train': 1.8157670497894287} +03/05/2022 02:24:31 - INFO - codeparrot_training - Skipping example with length 397 (seq_length=1024) +03/05/2022 02:24:35 - INFO - codeparrot_training - Step 31435: {'lr': 0.000452767679300363, 'samples': 16095232, 'steps': 31435, 'loss/train': 1.6247193813323975} +03/05/2022 02:24:38 - INFO - codeparrot_training - Step 31436: {'lr': 0.00045276457508460367, 'samples': 16095744, 'steps': 31436, 'loss/train': 1.0068397521972656} +03/05/2022 02:24:39 - INFO - codeparrot_training - Skipping example with length 519 (seq_length=1024) +03/05/2022 02:24:43 - INFO - codeparrot_training - Step 31437: {'lr': 0.00045276147077748176, 'samples': 16096256, 'steps': 31437, 'loss/train': 2.2893378734588623} +03/05/2022 02:24:46 - INFO - codeparrot_training - Step 31438: {'lr': 0.0004527583663789986, 'samples': 16096768, 'steps': 31438, 'loss/train': 1.5257594585418701} +03/05/2022 02:24:47 - INFO - codeparrot_training - Skipping example with length 293 (seq_length=1024) +03/05/2022 02:24:51 - INFO - codeparrot_training - Step 31439: {'lr': 0.0004527552618891557, 'samples': 16097280, 'steps': 31439, 'loss/train': 1.161664605140686} +03/05/2022 02:24:55 - INFO - codeparrot_training - Step 31440: {'lr': 0.0004527521573079544, 'samples': 16097792, 'steps': 31440, 'loss/train': 1.1855353116989136} +03/05/2022 02:24:55 - INFO - codeparrot_training - Skipping example with length 216 (seq_length=1024) +03/05/2022 02:25:00 - INFO - codeparrot_training - Step 31441: {'lr': 0.0004527490526353961, 'samples': 16098304, 'steps': 31441, 'loss/train': 1.4499212503433228} +03/05/2022 02:25:03 - INFO - codeparrot_training - Step 31442: {'lr': 0.0004527459478714822, 'samples': 16098816, 'steps': 31442, 'loss/train': 2.2350080013275146} +03/05/2022 02:25:04 - INFO - codeparrot_training - Skipping example with length 197 (seq_length=1024) +03/05/2022 02:25:08 - INFO - codeparrot_training - Step 31443: {'lr': 0.00045274284301621414, 'samples': 16099328, 'steps': 31443, 'loss/train': 1.9113391637802124} +03/05/2022 02:25:11 - INFO - codeparrot_training - Step 31444: {'lr': 0.00045273973806959325, 'samples': 16099840, 'steps': 31444, 'loss/train': 1.4769452810287476} +03/05/2022 02:25:12 - INFO - codeparrot_training - Skipping example with length 689 (seq_length=1024) +03/05/2022 02:25:17 - INFO - codeparrot_training - Step 31445: {'lr': 0.00045273663303162096, 'samples': 16100352, 'steps': 31445, 'loss/train': 1.4200798273086548} +03/05/2022 02:25:20 - INFO - codeparrot_training - Step 31446: {'lr': 0.00045273352790229873, 'samples': 16100864, 'steps': 31446, 'loss/train': 2.1596243381500244} +03/05/2022 02:25:21 - INFO - codeparrot_training - Skipping example with length 464 (seq_length=1024) +03/05/2022 02:25:25 - INFO - codeparrot_training - Step 31447: {'lr': 0.0004527304226816278, 'samples': 16101376, 'steps': 31447, 'loss/train': 1.6071414947509766} +03/05/2022 02:25:28 - INFO - codeparrot_training - Step 31448: {'lr': 0.0004527273173696097, 'samples': 16101888, 'steps': 31448, 'loss/train': 1.4654426574707031} +03/05/2022 02:25:29 - INFO - codeparrot_training - Skipping example with length 583 (seq_length=1024) +03/05/2022 02:25:34 - INFO - codeparrot_training - Step 31449: {'lr': 0.0004527242119662458, 'samples': 16102400, 'steps': 31449, 'loss/train': 2.3628480434417725} +03/05/2022 02:25:37 - INFO - codeparrot_training - Step 31450: {'lr': 0.00045272110647153754, 'samples': 16102912, 'steps': 31450, 'loss/train': 7.240050315856934} +03/05/2022 02:25:38 - INFO - codeparrot_training - Skipping example with length 448 (seq_length=1024) +03/05/2022 02:25:42 - INFO - codeparrot_training - Step 31451: {'lr': 0.00045271800088548625, 'samples': 16103424, 'steps': 31451, 'loss/train': 2.433006525039673} +03/05/2022 02:25:45 - INFO - codeparrot_training - Step 31452: {'lr': 0.00045271489520809337, 'samples': 16103936, 'steps': 31452, 'loss/train': 2.3132221698760986} +03/05/2022 02:25:47 - INFO - codeparrot_training - Skipping example with length 686 (seq_length=1024) +03/05/2022 02:25:50 - INFO - codeparrot_training - Step 31453: {'lr': 0.0004527117894393603, 'samples': 16104448, 'steps': 31453, 'loss/train': 1.756961703300476} +03/05/2022 02:25:54 - INFO - codeparrot_training - Step 31454: {'lr': 0.0004527086835792884, 'samples': 16104960, 'steps': 31454, 'loss/train': 1.503247618675232} +03/05/2022 02:25:55 - INFO - codeparrot_training - Skipping example with length 44 (seq_length=1024) +03/05/2022 02:25:59 - INFO - codeparrot_training - Step 31455: {'lr': 0.0004527055776278791, 'samples': 16105472, 'steps': 31455, 'loss/train': 2.0916385650634766} +03/05/2022 02:26:02 - INFO - codeparrot_training - Step 31456: {'lr': 0.00045270247158513377, 'samples': 16105984, 'steps': 31456, 'loss/train': 1.5416643619537354} +03/05/2022 02:26:03 - INFO - codeparrot_training - Skipping example with length 348 (seq_length=1024) +03/05/2022 02:26:07 - INFO - codeparrot_training - Step 31457: {'lr': 0.00045269936545105384, 'samples': 16106496, 'steps': 31457, 'loss/train': 1.729301929473877} +03/05/2022 02:26:11 - INFO - codeparrot_training - Step 31458: {'lr': 0.0004526962592256407, 'samples': 16107008, 'steps': 31458, 'loss/train': 5.931805610656738} +03/05/2022 02:26:12 - INFO - codeparrot_training - Skipping example with length 257 (seq_length=1024) +03/05/2022 02:26:16 - INFO - codeparrot_training - Step 31459: {'lr': 0.00045269315290889583, 'samples': 16107520, 'steps': 31459, 'loss/train': 1.5502777099609375} +03/05/2022 02:26:19 - INFO - codeparrot_training - Step 31460: {'lr': 0.00045269004650082045, 'samples': 16108032, 'steps': 31460, 'loss/train': 2.217634916305542} +03/05/2022 02:26:21 - INFO - codeparrot_training - Skipping example with length 199 (seq_length=1024) +03/05/2022 02:26:24 - INFO - codeparrot_training - Step 31461: {'lr': 0.0004526869400014162, 'samples': 16108544, 'steps': 31461, 'loss/train': 0.8402490019798279} +03/05/2022 02:26:27 - INFO - codeparrot_training - Step 31462: {'lr': 0.0004526838334106842, 'samples': 16109056, 'steps': 31462, 'loss/train': 1.3982808589935303} +03/05/2022 02:26:29 - INFO - codeparrot_training - Skipping example with length 15 (seq_length=1024) +03/05/2022 02:26:33 - INFO - codeparrot_training - Step 31463: {'lr': 0.000452680726728626, 'samples': 16109568, 'steps': 31463, 'loss/train': 1.1845130920410156} +03/05/2022 02:26:36 - INFO - codeparrot_training - Step 31464: {'lr': 0.00045267761995524314, 'samples': 16110080, 'steps': 31464, 'loss/train': 1.7911897897720337} +03/05/2022 02:26:37 - INFO - codeparrot_training - Skipping example with length 34 (seq_length=1024) +03/05/2022 02:26:41 - INFO - codeparrot_training - Step 31465: {'lr': 0.00045267451309053677, 'samples': 16110592, 'steps': 31465, 'loss/train': 1.4127013683319092} +03/05/2022 02:26:44 - INFO - codeparrot_training - Step 31466: {'lr': 0.0004526714061345084, 'samples': 16111104, 'steps': 31466, 'loss/train': 1.9185951948165894} +03/05/2022 02:26:45 - INFO - codeparrot_training - Skipping example with length 755 (seq_length=1024) +03/05/2022 02:26:49 - INFO - codeparrot_training - Step 31467: {'lr': 0.0004526682990871593, 'samples': 16111616, 'steps': 31467, 'loss/train': 1.6776704788208008} +03/05/2022 02:26:52 - INFO - codeparrot_training - Step 31468: {'lr': 0.0004526651919484912, 'samples': 16112128, 'steps': 31468, 'loss/train': 1.3298616409301758} +03/05/2022 02:26:54 - INFO - codeparrot_training - Skipping example with length 415 (seq_length=1024) +03/05/2022 02:26:58 - INFO - codeparrot_training - Step 31469: {'lr': 0.00045266208471850516, 'samples': 16112640, 'steps': 31469, 'loss/train': 1.3723582029342651} +03/05/2022 02:27:01 - INFO - codeparrot_training - Step 31470: {'lr': 0.00045265897739720277, 'samples': 16113152, 'steps': 31470, 'loss/train': 0.07018920034170151} +03/05/2022 02:27:03 - INFO - codeparrot_training - Skipping example with length 128 (seq_length=1024) +03/05/2022 02:27:06 - INFO - codeparrot_training - Step 31471: {'lr': 0.00045265586998458534, 'samples': 16113664, 'steps': 31471, 'loss/train': 1.3505792617797852} +03/05/2022 02:27:09 - INFO - codeparrot_training - Step 31472: {'lr': 0.00045265276248065436, 'samples': 16114176, 'steps': 31472, 'loss/train': 1.9902453422546387} +03/05/2022 02:27:11 - INFO - codeparrot_training - Skipping example with length 772 (seq_length=1024) +03/05/2022 02:27:15 - INFO - codeparrot_training - Step 31473: {'lr': 0.0004526496548854111, 'samples': 16114688, 'steps': 31473, 'loss/train': 1.7543225288391113} +03/05/2022 02:27:18 - INFO - codeparrot_training - Step 31474: {'lr': 0.000452646547198857, 'samples': 16115200, 'steps': 31474, 'loss/train': 1.383806586265564} +03/05/2022 02:27:19 - INFO - codeparrot_training - Skipping example with length 599 (seq_length=1024) +03/05/2022 02:27:23 - INFO - codeparrot_training - Step 31475: {'lr': 0.0004526434394209936, 'samples': 16115712, 'steps': 31475, 'loss/train': 1.9744014739990234} +03/05/2022 02:27:26 - INFO - codeparrot_training - Step 31476: {'lr': 0.00045264033155182216, 'samples': 16116224, 'steps': 31476, 'loss/train': 1.5867058038711548} +03/05/2022 02:27:27 - INFO - codeparrot_training - Skipping example with length 814 (seq_length=1024) +03/05/2022 02:27:31 - INFO - codeparrot_training - Step 31477: {'lr': 0.0004526372235913441, 'samples': 16116736, 'steps': 31477, 'loss/train': 1.89089035987854} +03/05/2022 02:27:35 - INFO - codeparrot_training - Step 31478: {'lr': 0.0004526341155395608, 'samples': 16117248, 'steps': 31478, 'loss/train': 2.182331085205078} +03/05/2022 02:27:35 - INFO - codeparrot_training - Skipping example with length 825 (seq_length=1024) +03/05/2022 02:27:40 - INFO - codeparrot_training - Step 31479: {'lr': 0.00045263100739647373, 'samples': 16117760, 'steps': 31479, 'loss/train': 1.7235870361328125} +03/05/2022 02:27:43 - INFO - codeparrot_training - Step 31480: {'lr': 0.00045262789916208424, 'samples': 16118272, 'steps': 31480, 'loss/train': 1.7351253032684326} +03/05/2022 02:27:43 - INFO - codeparrot_training - Skipping example with length 414 (seq_length=1024) +03/05/2022 02:27:48 - INFO - codeparrot_training - Step 31481: {'lr': 0.00045262479083639376, 'samples': 16118784, 'steps': 31481, 'loss/train': 1.9240679740905762} +03/05/2022 02:27:51 - INFO - codeparrot_training - Step 31482: {'lr': 0.0004526216824194037, 'samples': 16119296, 'steps': 31482, 'loss/train': 1.544216275215149} +03/05/2022 02:27:52 - INFO - codeparrot_training - Skipping example with length 181 (seq_length=1024) +03/05/2022 02:27:57 - INFO - codeparrot_training - Step 31483: {'lr': 0.00045261857391111536, 'samples': 16119808, 'steps': 31483, 'loss/train': 1.9310578107833862} +03/05/2022 02:28:00 - INFO - codeparrot_training - Step 31484: {'lr': 0.0004526154653115303, 'samples': 16120320, 'steps': 31484, 'loss/train': 1.6664706468582153} +03/05/2022 02:28:00 - INFO - codeparrot_training - Skipping example with length 665 (seq_length=1024) +03/05/2022 02:28:05 - INFO - codeparrot_training - Step 31485: {'lr': 0.0004526123566206498, 'samples': 16120832, 'steps': 31485, 'loss/train': 2.1433777809143066} +03/05/2022 02:28:08 - INFO - codeparrot_training - Step 31486: {'lr': 0.0004526092478384753, 'samples': 16121344, 'steps': 31486, 'loss/train': 1.5464683771133423} +03/05/2022 02:28:09 - INFO - codeparrot_training - Skipping example with length 347 (seq_length=1024) +03/05/2022 02:28:14 - INFO - codeparrot_training - Step 31487: {'lr': 0.00045260613896500827, 'samples': 16121856, 'steps': 31487, 'loss/train': 0.8201708793640137} +03/05/2022 02:28:17 - INFO - codeparrot_training - Step 31488: {'lr': 0.00045260303000024994, 'samples': 16122368, 'steps': 31488, 'loss/train': 1.764509916305542} +03/05/2022 02:28:17 - INFO - codeparrot_training - Skipping example with length 136 (seq_length=1024) +03/05/2022 02:28:22 - INFO - codeparrot_training - Step 31489: {'lr': 0.0004525999209442018, 'samples': 16122880, 'steps': 31489, 'loss/train': 1.4597769975662231} +03/05/2022 02:28:25 - INFO - codeparrot_training - Step 31490: {'lr': 0.0004525968117968653, 'samples': 16123392, 'steps': 31490, 'loss/train': 1.5814138650894165} +03/05/2022 02:28:26 - INFO - codeparrot_training - Skipping example with length 900 (seq_length=1024) +03/05/2022 02:28:31 - INFO - codeparrot_training - Step 31491: {'lr': 0.00045259370255824183, 'samples': 16123904, 'steps': 31491, 'loss/train': 1.0628573894500732} +03/05/2022 02:28:34 - INFO - codeparrot_training - Step 31492: {'lr': 0.0004525905932283327, 'samples': 16124416, 'steps': 31492, 'loss/train': 1.9792927503585815} +03/05/2022 02:28:34 - INFO - codeparrot_training - Skipping example with length 963 (seq_length=1024) +03/05/2022 02:28:39 - INFO - codeparrot_training - Step 31493: {'lr': 0.00045258748380713943, 'samples': 16124928, 'steps': 31493, 'loss/train': 0.2514106035232544} +03/05/2022 02:28:42 - INFO - codeparrot_training - Step 31494: {'lr': 0.00045258437429466337, 'samples': 16125440, 'steps': 31494, 'loss/train': 2.0028598308563232} +03/05/2022 02:28:43 - INFO - codeparrot_training - Skipping example with length 610 (seq_length=1024) +03/05/2022 02:28:48 - INFO - codeparrot_training - Step 31495: {'lr': 0.0004525812646909059, 'samples': 16125952, 'steps': 31495, 'loss/train': 1.779821515083313} +03/05/2022 02:28:51 - INFO - codeparrot_training - Step 31496: {'lr': 0.0004525781549958684, 'samples': 16126464, 'steps': 31496, 'loss/train': 1.7870286703109741} +03/05/2022 02:28:51 - INFO - codeparrot_training - Skipping example with length 314 (seq_length=1024) +03/05/2022 02:28:56 - INFO - codeparrot_training - Step 31497: {'lr': 0.0004525750452095524, 'samples': 16126976, 'steps': 31497, 'loss/train': 0.7611998915672302} +03/05/2022 02:28:59 - INFO - codeparrot_training - Step 31498: {'lr': 0.00045257193533195916, 'samples': 16127488, 'steps': 31498, 'loss/train': 1.86409592628479} +03/05/2022 02:29:00 - INFO - codeparrot_training - Skipping example with length 77 (seq_length=1024) +03/05/2022 02:29:04 - INFO - codeparrot_training - Step 31499: {'lr': 0.0004525688253630901, 'samples': 16128000, 'steps': 31499, 'loss/train': 1.889346718788147} +03/05/2022 02:29:08 - INFO - codeparrot_training - Step 31500: {'lr': 0.00045256571530294664, 'samples': 16128512, 'steps': 31500, 'loss/train': 1.037628412246704} +03/05/2022 02:29:08 - INFO - codeparrot_training - Skipping example with length 851 (seq_length=1024) +03/05/2022 02:29:13 - INFO - codeparrot_training - Step 31501: {'lr': 0.0004525626051515302, 'samples': 16129024, 'steps': 31501, 'loss/train': 1.702979564666748} +03/05/2022 02:29:16 - INFO - codeparrot_training - Step 31502: {'lr': 0.0004525594949088423, 'samples': 16129536, 'steps': 31502, 'loss/train': 2.212418794631958} +03/05/2022 02:29:16 - INFO - codeparrot_training - Skipping example with length 430 (seq_length=1024) +03/05/2022 02:29:21 - INFO - codeparrot_training - Step 31503: {'lr': 0.00045255638457488415, 'samples': 16130048, 'steps': 31503, 'loss/train': 1.2664870023727417} +03/05/2022 02:29:24 - INFO - codeparrot_training - Step 31504: {'lr': 0.0004525532741496572, 'samples': 16130560, 'steps': 31504, 'loss/train': 1.8271229267120361} +03/05/2022 02:29:25 - INFO - codeparrot_training - Skipping example with length 404 (seq_length=1024) +03/05/2022 02:29:30 - INFO - codeparrot_training - Step 31505: {'lr': 0.0004525501636331628, 'samples': 16131072, 'steps': 31505, 'loss/train': 1.6227223873138428} +03/05/2022 02:29:33 - INFO - codeparrot_training - Step 31506: {'lr': 0.00045254705302540257, 'samples': 16131584, 'steps': 31506, 'loss/train': 1.7760080099105835} +03/05/2022 02:29:33 - INFO - codeparrot_training - Skipping example with length 243 (seq_length=1024) +03/05/2022 02:29:38 - INFO - codeparrot_training - Step 31507: {'lr': 0.00045254394232637765, 'samples': 16132096, 'steps': 31507, 'loss/train': 2.1856863498687744} +03/05/2022 02:29:41 - INFO - codeparrot_training - Step 31508: {'lr': 0.0004525408315360896, 'samples': 16132608, 'steps': 31508, 'loss/train': 1.5976295471191406} +03/05/2022 02:29:41 - INFO - codeparrot_training - Skipping example with length 359 (seq_length=1024) +03/05/2022 02:29:47 - INFO - codeparrot_training - Step 31509: {'lr': 0.00045253772065453977, 'samples': 16133120, 'steps': 31509, 'loss/train': 1.5793099403381348} +03/05/2022 02:29:50 - INFO - codeparrot_training - Step 31510: {'lr': 0.00045253460968172957, 'samples': 16133632, 'steps': 31510, 'loss/train': 2.1575217247009277} +03/05/2022 02:29:51 - INFO - codeparrot_training - Skipping example with length 429 (seq_length=1024) +03/05/2022 02:29:55 - INFO - codeparrot_training - Step 31511: {'lr': 0.0004525314986176604, 'samples': 16134144, 'steps': 31511, 'loss/train': 2.10465931892395} +03/05/2022 02:29:58 - INFO - codeparrot_training - Step 31512: {'lr': 0.0004525283874623336, 'samples': 16134656, 'steps': 31512, 'loss/train': 0.7757741808891296} +03/05/2022 02:29:59 - INFO - codeparrot_training - Skipping example with length 131 (seq_length=1024) +03/05/2022 02:30:04 - INFO - codeparrot_training - Step 31513: {'lr': 0.00045252527621575075, 'samples': 16135168, 'steps': 31513, 'loss/train': 1.1073167324066162} +03/05/2022 02:30:07 - INFO - codeparrot_training - Step 31514: {'lr': 0.0004525221648779131, 'samples': 16135680, 'steps': 31514, 'loss/train': 1.7409639358520508} +03/05/2022 02:30:08 - INFO - codeparrot_training - Skipping example with length 199 (seq_length=1024) +03/05/2022 02:30:12 - INFO - codeparrot_training - Step 31515: {'lr': 0.00045251905344882205, 'samples': 16136192, 'steps': 31515, 'loss/train': 1.4306128025054932} +03/05/2022 02:30:15 - INFO - codeparrot_training - Step 31516: {'lr': 0.000452515941928479, 'samples': 16136704, 'steps': 31516, 'loss/train': 0.8161985874176025} +03/05/2022 02:30:16 - INFO - codeparrot_training - Skipping example with length 86 (seq_length=1024) +03/05/2022 02:30:21 - INFO - codeparrot_training - Step 31517: {'lr': 0.0004525128303168855, 'samples': 16137216, 'steps': 31517, 'loss/train': 1.7841342687606812} +03/05/2022 02:30:24 - INFO - codeparrot_training - Step 31518: {'lr': 0.00045250971861404276, 'samples': 16137728, 'steps': 31518, 'loss/train': 1.29667067527771} +03/05/2022 02:30:25 - INFO - codeparrot_training - Skipping example with length 664 (seq_length=1024) +03/05/2022 02:30:29 - INFO - codeparrot_training - Step 31519: {'lr': 0.0004525066068199523, 'samples': 16138240, 'steps': 31519, 'loss/train': 2.8187217712402344} +03/05/2022 02:30:32 - INFO - codeparrot_training - Step 31520: {'lr': 0.0004525034949346155, 'samples': 16138752, 'steps': 31520, 'loss/train': 0.9589388966560364} +03/05/2022 02:30:34 - INFO - codeparrot_training - Skipping example with length 29 (seq_length=1024) +03/05/2022 02:30:38 - INFO - codeparrot_training - Step 31521: {'lr': 0.0004525003829580337, 'samples': 16139264, 'steps': 31521, 'loss/train': 0.21540480852127075} +03/05/2022 02:30:41 - INFO - codeparrot_training - Step 31522: {'lr': 0.0004524972708902084, 'samples': 16139776, 'steps': 31522, 'loss/train': 2.310816764831543} +03/05/2022 02:30:42 - INFO - codeparrot_training - Skipping example with length 501 (seq_length=1024) +03/05/2022 02:30:46 - INFO - codeparrot_training - Step 31523: {'lr': 0.0004524941587311409, 'samples': 16140288, 'steps': 31523, 'loss/train': 1.138566493988037} +03/05/2022 02:30:49 - INFO - codeparrot_training - Step 31524: {'lr': 0.0004524910464808327, 'samples': 16140800, 'steps': 31524, 'loss/train': 1.5954649448394775} +03/05/2022 02:30:50 - INFO - codeparrot_training - Skipping example with length 365 (seq_length=1024) +03/05/2022 02:30:55 - INFO - codeparrot_training - Step 31525: {'lr': 0.00045248793413928514, 'samples': 16141312, 'steps': 31525, 'loss/train': 1.9546318054199219} +03/05/2022 02:30:58 - INFO - codeparrot_training - Step 31526: {'lr': 0.0004524848217064997, 'samples': 16141824, 'steps': 31526, 'loss/train': 1.6697877645492554} +03/05/2022 02:30:58 - INFO - codeparrot_training - Skipping example with length 653 (seq_length=1024) +03/05/2022 02:31:03 - INFO - codeparrot_training - Step 31527: {'lr': 0.0004524817091824777, 'samples': 16142336, 'steps': 31527, 'loss/train': 1.5212364196777344} +03/05/2022 02:31:06 - INFO - codeparrot_training - Step 31528: {'lr': 0.00045247859656722056, 'samples': 16142848, 'steps': 31528, 'loss/train': 1.5788440704345703} +03/05/2022 02:31:07 - INFO - codeparrot_training - Skipping example with length 742 (seq_length=1024) +03/05/2022 02:31:11 - INFO - codeparrot_training - Step 31529: {'lr': 0.0004524754838607297, 'samples': 16143360, 'steps': 31529, 'loss/train': 1.4034253358840942} +03/05/2022 02:31:14 - INFO - codeparrot_training - Step 31530: {'lr': 0.0004524723710630064, 'samples': 16143872, 'steps': 31530, 'loss/train': 0.907260000705719} +03/05/2022 02:31:15 - INFO - codeparrot_training - Skipping example with length 627 (seq_length=1024) +03/05/2022 02:31:20 - INFO - codeparrot_training - Step 31531: {'lr': 0.0004524692581740523, 'samples': 16144384, 'steps': 31531, 'loss/train': 1.6518443822860718} +03/05/2022 02:31:23 - INFO - codeparrot_training - Step 31532: {'lr': 0.00045246614519386865, 'samples': 16144896, 'steps': 31532, 'loss/train': 1.483202576637268} +03/05/2022 02:31:23 - INFO - codeparrot_training - Skipping example with length 729 (seq_length=1024) +03/05/2022 02:31:28 - INFO - codeparrot_training - Step 31533: {'lr': 0.0004524630321224569, 'samples': 16145408, 'steps': 31533, 'loss/train': 2.475306510925293} +03/05/2022 02:31:31 - INFO - codeparrot_training - Step 31534: {'lr': 0.0004524599189598183, 'samples': 16145920, 'steps': 31534, 'loss/train': 1.823412537574768} +03/05/2022 02:31:31 - INFO - codeparrot_training - Skipping example with length 888 (seq_length=1024) +03/05/2022 02:31:37 - INFO - codeparrot_training - Step 31535: {'lr': 0.0004524568057059545, 'samples': 16146432, 'steps': 31535, 'loss/train': 1.9083024263381958} +03/05/2022 02:31:40 - INFO - codeparrot_training - Skipping example with length 530 (seq_length=1024) +03/05/2022 02:31:42 - INFO - codeparrot_training - Step 31536: {'lr': 0.00045245369236086673, 'samples': 16146944, 'steps': 31536, 'loss/train': 1.4512388706207275} +03/05/2022 02:31:45 - INFO - codeparrot_training - Step 31537: {'lr': 0.00045245057892455653, 'samples': 16147456, 'steps': 31537, 'loss/train': 1.086375117301941} +03/05/2022 02:31:48 - INFO - codeparrot_training - Skipping example with length 711 (seq_length=1024) +03/05/2022 02:31:51 - INFO - codeparrot_training - Step 31538: {'lr': 0.0004524474653970252, 'samples': 16147968, 'steps': 31538, 'loss/train': 1.460856556892395} +03/05/2022 02:31:54 - INFO - codeparrot_training - Step 31539: {'lr': 0.00045244435177827413, 'samples': 16148480, 'steps': 31539, 'loss/train': 0.9275199174880981} +03/05/2022 02:31:56 - INFO - codeparrot_training - Skipping example with length 562 (seq_length=1024) +03/05/2022 02:31:59 - INFO - codeparrot_training - Step 31540: {'lr': 0.00045244123806830486, 'samples': 16148992, 'steps': 31540, 'loss/train': 1.2342435121536255} +03/05/2022 02:32:02 - INFO - codeparrot_training - Step 31541: {'lr': 0.00045243812426711856, 'samples': 16149504, 'steps': 31541, 'loss/train': 1.7118326425552368} +03/05/2022 02:32:06 - INFO - codeparrot_training - Step 31542: {'lr': 0.0004524350103747168, 'samples': 16150016, 'steps': 31542, 'loss/train': 1.819670557975769} +03/05/2022 02:32:07 - INFO - codeparrot_training - Skipping example with length 459 (seq_length=1024) +03/05/2022 02:32:11 - INFO - codeparrot_training - Step 31543: {'lr': 0.00045243189639110093, 'samples': 16150528, 'steps': 31543, 'loss/train': 2.029788017272949} +03/05/2022 02:32:14 - INFO - codeparrot_training - Step 31544: {'lr': 0.00045242878231627247, 'samples': 16151040, 'steps': 31544, 'loss/train': 1.5326788425445557} +03/05/2022 02:32:15 - INFO - codeparrot_training - Skipping example with length 408 (seq_length=1024) +03/05/2022 02:32:19 - INFO - codeparrot_training - Step 31545: {'lr': 0.0004524256681502327, 'samples': 16151552, 'steps': 31545, 'loss/train': 2.779707908630371} +03/05/2022 02:32:22 - INFO - codeparrot_training - Step 31546: {'lr': 0.0004524225538929829, 'samples': 16152064, 'steps': 31546, 'loss/train': 2.1954147815704346} +03/05/2022 02:32:23 - INFO - codeparrot_training - Skipping example with length 809 (seq_length=1024) +03/05/2022 02:32:28 - INFO - codeparrot_training - Step 31547: {'lr': 0.0004524194395445248, 'samples': 16152576, 'steps': 31547, 'loss/train': 1.8565536737442017} +03/05/2022 02:32:31 - INFO - codeparrot_training - Step 31548: {'lr': 0.0004524163251048595, 'samples': 16153088, 'steps': 31548, 'loss/train': 1.7719902992248535} +03/05/2022 02:32:31 - INFO - codeparrot_training - Skipping example with length 797 (seq_length=1024) +03/05/2022 02:32:36 - INFO - codeparrot_training - Step 31549: {'lr': 0.0004524132105739886, 'samples': 16153600, 'steps': 31549, 'loss/train': 2.031679153442383} +03/05/2022 02:32:39 - INFO - codeparrot_training - Step 31550: {'lr': 0.0004524100959519134, 'samples': 16154112, 'steps': 31550, 'loss/train': 2.2447915077209473} +03/05/2022 02:32:40 - INFO - codeparrot_training - Skipping example with length 690 (seq_length=1024) +03/05/2022 02:32:45 - INFO - codeparrot_training - Step 31551: {'lr': 0.00045240698123863535, 'samples': 16154624, 'steps': 31551, 'loss/train': 1.6978462934494019} +03/05/2022 02:32:48 - INFO - codeparrot_training - Step 31552: {'lr': 0.0004524038664341558, 'samples': 16155136, 'steps': 31552, 'loss/train': 2.2094690799713135} +03/05/2022 02:32:48 - INFO - codeparrot_training - Skipping example with length 725 (seq_length=1024) +03/05/2022 02:32:53 - INFO - codeparrot_training - Step 31553: {'lr': 0.00045240075153847625, 'samples': 16155648, 'steps': 31553, 'loss/train': 1.6636077165603638} +03/05/2022 02:32:56 - INFO - codeparrot_training - Step 31554: {'lr': 0.00045239763655159805, 'samples': 16156160, 'steps': 31554, 'loss/train': 2.162144660949707} +03/05/2022 02:32:56 - INFO - codeparrot_training - Skipping example with length 193 (seq_length=1024) +03/05/2022 02:33:01 - INFO - codeparrot_training - Step 31555: {'lr': 0.00045239452147352257, 'samples': 16156672, 'steps': 31555, 'loss/train': 2.5454466342926025} +03/05/2022 02:33:05 - INFO - codeparrot_training - Step 31556: {'lr': 0.0004523914063042512, 'samples': 16157184, 'steps': 31556, 'loss/train': 1.7178024053573608} +03/05/2022 02:33:05 - INFO - codeparrot_training - Skipping example with length 527 (seq_length=1024) +03/05/2022 02:33:10 - INFO - codeparrot_training - Step 31557: {'lr': 0.00045238829104378545, 'samples': 16157696, 'steps': 31557, 'loss/train': 1.5884954929351807} +03/05/2022 02:33:13 - INFO - codeparrot_training - Step 31558: {'lr': 0.0004523851756921266, 'samples': 16158208, 'steps': 31558, 'loss/train': 1.2498162984848022} +03/05/2022 02:33:13 - INFO - codeparrot_training - Skipping example with length 708 (seq_length=1024) +03/05/2022 02:33:18 - INFO - codeparrot_training - Step 31559: {'lr': 0.00045238206024927614, 'samples': 16158720, 'steps': 31559, 'loss/train': 1.784096360206604} +03/05/2022 02:33:21 - INFO - codeparrot_training - Step 31560: {'lr': 0.00045237894471523543, 'samples': 16159232, 'steps': 31560, 'loss/train': 2.0154409408569336} +03/05/2022 02:33:22 - INFO - codeparrot_training - Skipping example with length 725 (seq_length=1024) +03/05/2022 02:33:27 - INFO - codeparrot_training - Step 31561: {'lr': 0.00045237582909000594, 'samples': 16159744, 'steps': 31561, 'loss/train': 1.7307534217834473} +03/05/2022 02:33:30 - INFO - codeparrot_training - Step 31562: {'lr': 0.00045237271337358897, 'samples': 16160256, 'steps': 31562, 'loss/train': 0.08814364671707153} +03/05/2022 02:33:30 - INFO - codeparrot_training - Skipping example with length 540 (seq_length=1024) +03/05/2022 02:33:35 - INFO - codeparrot_training - Step 31563: {'lr': 0.00045236959756598605, 'samples': 16160768, 'steps': 31563, 'loss/train': 1.4843617677688599} +03/05/2022 02:33:38 - INFO - codeparrot_training - Step 31564: {'lr': 0.0004523664816671985, 'samples': 16161280, 'steps': 31564, 'loss/train': 2.5114407539367676} +03/05/2022 02:33:38 - INFO - codeparrot_training - Skipping example with length 412 (seq_length=1024) +03/05/2022 02:33:44 - INFO - codeparrot_training - Step 31565: {'lr': 0.0004523633656772277, 'samples': 16161792, 'steps': 31565, 'loss/train': 2.127631902694702} +03/05/2022 02:33:47 - INFO - codeparrot_training - Step 31566: {'lr': 0.00045236024959607505, 'samples': 16162304, 'steps': 31566, 'loss/train': 0.7544247508049011} +03/05/2022 02:33:52 - INFO - codeparrot_training - Step 31567: {'lr': 0.00045235713342374207, 'samples': 16162816, 'steps': 31567, 'loss/train': 1.0428247451782227} +03/05/2022 02:33:55 - INFO - codeparrot_training - Step 31568: {'lr': 0.00045235401716023, 'samples': 16163328, 'steps': 31568, 'loss/train': 1.611209511756897} +03/05/2022 02:33:55 - INFO - codeparrot_training - Skipping example with length 346 (seq_length=1024) +03/05/2022 02:34:01 - INFO - codeparrot_training - Step 31569: {'lr': 0.0004523509008055404, 'samples': 16163840, 'steps': 31569, 'loss/train': 1.7495619058609009} +03/05/2022 02:34:03 - INFO - codeparrot_training - Skipping example with length 907 (seq_length=1024) +03/05/2022 02:34:06 - INFO - codeparrot_training - Step 31570: {'lr': 0.0004523477843596746, 'samples': 16164352, 'steps': 31570, 'loss/train': 1.6653902530670166} +03/05/2022 02:34:09 - INFO - codeparrot_training - Step 31571: {'lr': 0.00045234466782263403, 'samples': 16164864, 'steps': 31571, 'loss/train': 2.2409536838531494} +03/05/2022 02:34:12 - INFO - codeparrot_training - Skipping example with length 315 (seq_length=1024) +03/05/2022 02:34:14 - INFO - codeparrot_training - Step 31572: {'lr': 0.00045234155119442, 'samples': 16165376, 'steps': 31572, 'loss/train': 1.4114336967468262} +03/05/2022 02:34:17 - INFO - codeparrot_training - Step 31573: {'lr': 0.00045233843447503407, 'samples': 16165888, 'steps': 31573, 'loss/train': 1.610561490058899} +03/05/2022 02:34:20 - INFO - codeparrot_training - Skipping example with length 979 (seq_length=1024) +03/05/2022 02:34:23 - INFO - codeparrot_training - Step 31574: {'lr': 0.00045233531766447757, 'samples': 16166400, 'steps': 31574, 'loss/train': 1.8955681324005127} +03/05/2022 02:34:26 - INFO - codeparrot_training - Step 31575: {'lr': 0.00045233220076275186, 'samples': 16166912, 'steps': 31575, 'loss/train': 1.3955235481262207} +03/05/2022 02:34:29 - INFO - codeparrot_training - Skipping example with length 458 (seq_length=1024) +03/05/2022 02:34:31 - INFO - codeparrot_training - Step 31576: {'lr': 0.0004523290837698583, 'samples': 16167424, 'steps': 31576, 'loss/train': 1.9330998659133911} +03/05/2022 02:34:34 - INFO - codeparrot_training - Step 31577: {'lr': 0.0004523259666857985, 'samples': 16167936, 'steps': 31577, 'loss/train': 1.482001543045044} +03/05/2022 02:34:37 - INFO - codeparrot_training - Skipping example with length 1021 (seq_length=1024) +03/05/2022 02:34:40 - INFO - codeparrot_training - Step 31578: {'lr': 0.00045232284951057366, 'samples': 16168448, 'steps': 31578, 'loss/train': 1.8246978521347046} +03/05/2022 02:34:43 - INFO - codeparrot_training - Step 31579: {'lr': 0.00045231973224418533, 'samples': 16168960, 'steps': 31579, 'loss/train': 1.6417876482009888} +03/05/2022 02:34:45 - INFO - codeparrot_training - Skipping example with length 581 (seq_length=1024) +03/05/2022 02:34:48 - INFO - codeparrot_training - Step 31580: {'lr': 0.00045231661488663485, 'samples': 16169472, 'steps': 31580, 'loss/train': 2.2487080097198486} +03/05/2022 02:34:51 - INFO - codeparrot_training - Step 31581: {'lr': 0.0004523134974379236, 'samples': 16169984, 'steps': 31581, 'loss/train': 1.3140310049057007} +03/05/2022 02:34:54 - INFO - codeparrot_training - Skipping example with length 605 (seq_length=1024) +03/05/2022 02:34:57 - INFO - codeparrot_training - Step 31582: {'lr': 0.000452310379898053, 'samples': 16170496, 'steps': 31582, 'loss/train': 1.2727608680725098} +03/05/2022 02:35:00 - INFO - codeparrot_training - Step 31583: {'lr': 0.00045230726226702444, 'samples': 16171008, 'steps': 31583, 'loss/train': 1.4434789419174194} +03/05/2022 02:35:02 - INFO - codeparrot_training - Skipping example with length 257 (seq_length=1024) +03/05/2022 02:35:05 - INFO - codeparrot_training - Step 31584: {'lr': 0.0004523041445448394, 'samples': 16171520, 'steps': 31584, 'loss/train': 1.6618921756744385} +03/05/2022 02:35:08 - INFO - codeparrot_training - Step 31585: {'lr': 0.00045230102673149923, 'samples': 16172032, 'steps': 31585, 'loss/train': 0.2651282548904419} +03/05/2022 02:35:10 - INFO - codeparrot_training - Skipping example with length 842 (seq_length=1024) +03/05/2022 02:35:13 - INFO - codeparrot_training - Step 31586: {'lr': 0.00045229790882700535, 'samples': 16172544, 'steps': 31586, 'loss/train': 2.008523464202881} +03/05/2022 02:35:17 - INFO - codeparrot_training - Step 31587: {'lr': 0.00045229479083135917, 'samples': 16173056, 'steps': 31587, 'loss/train': 1.728901982307434} +03/05/2022 02:35:18 - INFO - codeparrot_training - Skipping example with length 843 (seq_length=1024) +03/05/2022 02:35:22 - INFO - codeparrot_training - Step 31588: {'lr': 0.000452291672744562, 'samples': 16173568, 'steps': 31588, 'loss/train': 1.3938950300216675} +03/05/2022 02:35:25 - INFO - codeparrot_training - Step 31589: {'lr': 0.0004522885545666153, 'samples': 16174080, 'steps': 31589, 'loss/train': 1.6727291345596313} +03/05/2022 02:35:27 - INFO - codeparrot_training - Skipping example with length 623 (seq_length=1024) +03/05/2022 02:35:30 - INFO - codeparrot_training - Step 31590: {'lr': 0.0004522854362975206, 'samples': 16174592, 'steps': 31590, 'loss/train': 1.5963608026504517} +03/05/2022 02:35:33 - INFO - codeparrot_training - Step 31591: {'lr': 0.00045228231793727924, 'samples': 16175104, 'steps': 31591, 'loss/train': 1.9077171087265015} +03/05/2022 02:35:35 - INFO - codeparrot_training - Skipping example with length 754 (seq_length=1024) +03/05/2022 02:35:39 - INFO - codeparrot_training - Step 31592: {'lr': 0.00045227919948589247, 'samples': 16175616, 'steps': 31592, 'loss/train': 1.5408475399017334} +03/05/2022 02:35:42 - INFO - codeparrot_training - Step 31593: {'lr': 0.0004522760809433619, 'samples': 16176128, 'steps': 31593, 'loss/train': 0.8038286566734314} +03/05/2022 02:35:43 - INFO - codeparrot_training - Skipping example with length 126 (seq_length=1024) +03/05/2022 02:35:47 - INFO - codeparrot_training - Step 31594: {'lr': 0.0004522729623096888, 'samples': 16176640, 'steps': 31594, 'loss/train': 2.239734649658203} +03/05/2022 02:35:50 - INFO - codeparrot_training - Step 31595: {'lr': 0.0004522698435848747, 'samples': 16177152, 'steps': 31595, 'loss/train': 1.4663687944412231} +03/05/2022 02:35:52 - INFO - codeparrot_training - Skipping example with length 688 (seq_length=1024) +03/05/2022 02:35:56 - INFO - codeparrot_training - Step 31596: {'lr': 0.0004522667247689208, 'samples': 16177664, 'steps': 31596, 'loss/train': 0.953043520450592} +03/05/2022 02:35:59 - INFO - codeparrot_training - Step 31597: {'lr': 0.0004522636058618287, 'samples': 16178176, 'steps': 31597, 'loss/train': 3.4511659145355225} +03/05/2022 02:36:00 - INFO - codeparrot_training - Skipping example with length 731 (seq_length=1024) +03/05/2022 02:36:04 - INFO - codeparrot_training - Step 31598: {'lr': 0.0004522604868635998, 'samples': 16178688, 'steps': 31598, 'loss/train': 1.5698630809783936} +03/05/2022 02:36:07 - INFO - codeparrot_training - Step 31599: {'lr': 0.0004522573677742353, 'samples': 16179200, 'steps': 31599, 'loss/train': 2.0832760334014893} +03/05/2022 02:36:08 - INFO - codeparrot_training - Skipping example with length 501 (seq_length=1024) +03/05/2022 02:36:13 - INFO - codeparrot_training - Step 31600: {'lr': 0.0004522542485937369, 'samples': 16179712, 'steps': 31600, 'loss/train': 3.816641092300415} +03/05/2022 02:36:16 - INFO - codeparrot_training - Step 31601: {'lr': 0.0004522511293221058, 'samples': 16180224, 'steps': 31601, 'loss/train': 1.0312228202819824} +03/05/2022 02:36:17 - INFO - codeparrot_training - Skipping example with length 16 (seq_length=1024) +03/05/2022 02:36:21 - INFO - codeparrot_training - Step 31602: {'lr': 0.00045224800995934345, 'samples': 16180736, 'steps': 31602, 'loss/train': 1.321639060974121} +03/05/2022 02:36:24 - INFO - codeparrot_training - Step 31603: {'lr': 0.00045224489050545125, 'samples': 16181248, 'steps': 31603, 'loss/train': 1.55818510055542} +03/05/2022 02:36:25 - INFO - codeparrot_training - Skipping example with length 661 (seq_length=1024) +03/05/2022 02:36:29 - INFO - codeparrot_training - Step 31604: {'lr': 0.0004522417709604306, 'samples': 16181760, 'steps': 31604, 'loss/train': 2.2859675884246826} +03/05/2022 02:36:32 - INFO - codeparrot_training - Step 31605: {'lr': 0.000452238651324283, 'samples': 16182272, 'steps': 31605, 'loss/train': 1.0731604099273682} +03/05/2022 02:36:33 - INFO - codeparrot_training - Skipping example with length 715 (seq_length=1024) +03/05/2022 02:36:38 - INFO - codeparrot_training - Step 31606: {'lr': 0.0004522355315970098, 'samples': 16182784, 'steps': 31606, 'loss/train': 1.0644035339355469} +03/05/2022 02:36:41 - INFO - codeparrot_training - Step 31607: {'lr': 0.0004522324117786123, 'samples': 16183296, 'steps': 31607, 'loss/train': 1.5141433477401733} +03/05/2022 02:36:42 - INFO - codeparrot_training - Skipping example with length 456 (seq_length=1024) +03/05/2022 02:36:46 - INFO - codeparrot_training - Step 31608: {'lr': 0.0004522292918690921, 'samples': 16183808, 'steps': 31608, 'loss/train': 1.7121999263763428} +03/05/2022 02:36:49 - INFO - codeparrot_training - Step 31609: {'lr': 0.0004522261718684504, 'samples': 16184320, 'steps': 31609, 'loss/train': 1.3490097522735596} +03/05/2022 02:36:50 - INFO - codeparrot_training - Skipping example with length 612 (seq_length=1024) +03/05/2022 02:36:55 - INFO - codeparrot_training - Step 31610: {'lr': 0.00045222305177668875, 'samples': 16184832, 'steps': 31610, 'loss/train': 1.2012062072753906} +03/05/2022 02:36:58 - INFO - codeparrot_training - Step 31611: {'lr': 0.00045221993159380857, 'samples': 16185344, 'steps': 31611, 'loss/train': 0.3338894844055176} +03/05/2022 02:36:58 - INFO - codeparrot_training - Skipping example with length 286 (seq_length=1024) +03/05/2022 02:37:03 - INFO - codeparrot_training - Step 31612: {'lr': 0.00045221681131981116, 'samples': 16185856, 'steps': 31612, 'loss/train': 2.153427839279175} +03/05/2022 02:37:06 - INFO - codeparrot_training - Step 31613: {'lr': 0.00045221369095469795, 'samples': 16186368, 'steps': 31613, 'loss/train': 1.3791075944900513} +03/05/2022 02:37:07 - INFO - codeparrot_training - Skipping example with length 628 (seq_length=1024) +03/05/2022 02:37:11 - INFO - codeparrot_training - Step 31614: {'lr': 0.00045221057049847044, 'samples': 16186880, 'steps': 31614, 'loss/train': 1.8150585889816284} +03/05/2022 02:37:15 - INFO - codeparrot_training - Step 31615: {'lr': 0.0004522074499511299, 'samples': 16187392, 'steps': 31615, 'loss/train': 1.8745017051696777} +03/05/2022 02:37:15 - INFO - codeparrot_training - Skipping example with length 698 (seq_length=1024) +03/05/2022 02:37:20 - INFO - codeparrot_training - Step 31616: {'lr': 0.0004522043293126778, 'samples': 16187904, 'steps': 31616, 'loss/train': 1.9404397010803223} +03/05/2022 02:37:23 - INFO - codeparrot_training - Step 31617: {'lr': 0.00045220120858311557, 'samples': 16188416, 'steps': 31617, 'loss/train': 1.2991234064102173} +03/05/2022 02:37:23 - INFO - codeparrot_training - Skipping example with length 911 (seq_length=1024) +03/05/2022 02:37:28 - INFO - codeparrot_training - Step 31618: {'lr': 0.0004521980877624446, 'samples': 16188928, 'steps': 31618, 'loss/train': 1.9995251893997192} +03/05/2022 02:37:31 - INFO - codeparrot_training - Step 31619: {'lr': 0.0004521949668506663, 'samples': 16189440, 'steps': 31619, 'loss/train': 0.3885086476802826} +03/05/2022 02:37:32 - INFO - codeparrot_training - Skipping example with length 73 (seq_length=1024) +03/05/2022 02:37:37 - INFO - codeparrot_training - Step 31620: {'lr': 0.00045219184584778207, 'samples': 16189952, 'steps': 31620, 'loss/train': 2.1185600757598877} +03/05/2022 02:37:40 - INFO - codeparrot_training - Step 31621: {'lr': 0.0004521887247537933, 'samples': 16190464, 'steps': 31621, 'loss/train': 1.615657925605774} +03/05/2022 02:37:42 - INFO - codeparrot_training - Skipping example with length 442 (seq_length=1024) +03/05/2022 02:37:45 - INFO - codeparrot_training - Step 31622: {'lr': 0.00045218560356870144, 'samples': 16190976, 'steps': 31622, 'loss/train': 0.8194131851196289} +03/05/2022 02:37:48 - INFO - codeparrot_training - Step 31623: {'lr': 0.0004521824822925078, 'samples': 16191488, 'steps': 31623, 'loss/train': 1.7549269199371338} +03/05/2022 02:37:50 - INFO - codeparrot_training - Skipping example with length 252 (seq_length=1024) +03/05/2022 02:37:54 - INFO - codeparrot_training - Step 31624: {'lr': 0.00045217936092521396, 'samples': 16192000, 'steps': 31624, 'loss/train': 2.2579245567321777} +03/05/2022 02:37:57 - INFO - codeparrot_training - Step 31625: {'lr': 0.00045217623946682114, 'samples': 16192512, 'steps': 31625, 'loss/train': 1.7576595544815063} +03/05/2022 02:37:58 - INFO - codeparrot_training - Skipping example with length 616 (seq_length=1024) +03/05/2022 02:38:02 - INFO - codeparrot_training - Step 31626: {'lr': 0.00045217311791733084, 'samples': 16193024, 'steps': 31626, 'loss/train': 2.0874361991882324} +03/05/2022 02:38:05 - INFO - codeparrot_training - Step 31627: {'lr': 0.00045216999627674436, 'samples': 16193536, 'steps': 31627, 'loss/train': 1.617950201034546} +03/05/2022 02:38:07 - INFO - codeparrot_training - Skipping example with length 186 (seq_length=1024) +03/05/2022 02:38:10 - INFO - codeparrot_training - Step 31628: {'lr': 0.0004521668745450633, 'samples': 16194048, 'steps': 31628, 'loss/train': 2.156216859817505} +03/05/2022 02:38:14 - INFO - codeparrot_training - Step 31629: {'lr': 0.00045216375272228907, 'samples': 16194560, 'steps': 31629, 'loss/train': 2.022632598876953} +03/05/2022 02:38:15 - INFO - codeparrot_training - Skipping example with length 747 (seq_length=1024) +03/05/2022 02:38:19 - INFO - codeparrot_training - Step 31630: {'lr': 0.00045216063080842287, 'samples': 16195072, 'steps': 31630, 'loss/train': 1.9324945211410522} +03/05/2022 02:38:22 - INFO - codeparrot_training - Step 31631: {'lr': 0.00045215750880346617, 'samples': 16195584, 'steps': 31631, 'loss/train': 0.046376414597034454} +03/05/2022 02:38:24 - INFO - codeparrot_training - Skipping example with length 221 (seq_length=1024) +03/05/2022 02:38:27 - INFO - codeparrot_training - Step 31632: {'lr': 0.00045215438670742045, 'samples': 16196096, 'steps': 31632, 'loss/train': 0.10948921740055084} +03/05/2022 02:38:31 - INFO - codeparrot_training - Step 31633: {'lr': 0.00045215126452028705, 'samples': 16196608, 'steps': 31633, 'loss/train': 2.4237914085388184} +03/05/2022 02:38:32 - INFO - codeparrot_training - Skipping example with length 889 (seq_length=1024) +03/05/2022 02:38:36 - INFO - codeparrot_training - Step 31634: {'lr': 0.00045214814224206744, 'samples': 16197120, 'steps': 31634, 'loss/train': 0.959520697593689} +03/05/2022 02:38:39 - INFO - codeparrot_training - Step 31635: {'lr': 0.00045214501987276304, 'samples': 16197632, 'steps': 31635, 'loss/train': 1.5569958686828613} +03/05/2022 02:38:40 - INFO - codeparrot_training - Skipping example with length 367 (seq_length=1024) +03/05/2022 02:38:44 - INFO - codeparrot_training - Step 31636: {'lr': 0.0004521418974123751, 'samples': 16198144, 'steps': 31636, 'loss/train': 1.9874142408370972} +03/05/2022 02:38:47 - INFO - codeparrot_training - Step 31637: {'lr': 0.00045213877486090524, 'samples': 16198656, 'steps': 31637, 'loss/train': 0.5747865438461304} +03/05/2022 02:38:48 - INFO - codeparrot_training - Skipping example with length 192 (seq_length=1024) +03/05/2022 02:38:53 - INFO - codeparrot_training - Step 31638: {'lr': 0.00045213565221835473, 'samples': 16199168, 'steps': 31638, 'loss/train': 1.9332669973373413} +03/05/2022 02:38:56 - INFO - codeparrot_training - Step 31639: {'lr': 0.00045213252948472505, 'samples': 16199680, 'steps': 31639, 'loss/train': 1.9183270931243896} +03/05/2022 02:38:57 - INFO - codeparrot_training - Skipping example with length 320 (seq_length=1024) +03/05/2022 02:39:01 - INFO - codeparrot_training - Step 31640: {'lr': 0.0004521294066600175, 'samples': 16200192, 'steps': 31640, 'loss/train': 1.2080668210983276} +03/05/2022 02:39:04 - INFO - codeparrot_training - Step 31641: {'lr': 0.0004521262837442336, 'samples': 16200704, 'steps': 31641, 'loss/train': 2.2235372066497803} +03/05/2022 02:39:05 - INFO - codeparrot_training - Skipping example with length 112 (seq_length=1024) +03/05/2022 02:39:09 - INFO - codeparrot_training - Step 31642: {'lr': 0.0004521231607373747, 'samples': 16201216, 'steps': 31642, 'loss/train': 1.5852410793304443} +03/05/2022 02:39:13 - INFO - codeparrot_training - Step 31643: {'lr': 0.00045212003763944226, 'samples': 16201728, 'steps': 31643, 'loss/train': 1.962286114692688} +03/05/2022 02:39:13 - INFO - codeparrot_training - Skipping example with length 880 (seq_length=1024) +03/05/2022 02:39:18 - INFO - codeparrot_training - Step 31644: {'lr': 0.00045211691445043765, 'samples': 16202240, 'steps': 31644, 'loss/train': 1.8435064554214478} +03/05/2022 02:39:21 - INFO - codeparrot_training - Step 31645: {'lr': 0.0004521137911703622, 'samples': 16202752, 'steps': 31645, 'loss/train': 1.9495258331298828} +03/05/2022 02:39:21 - INFO - codeparrot_training - Skipping example with length 220 (seq_length=1024) +03/05/2022 02:39:26 - INFO - codeparrot_training - Step 31646: {'lr': 0.0004521106677992175, 'samples': 16203264, 'steps': 31646, 'loss/train': 2.007026195526123} +03/05/2022 02:39:29 - INFO - codeparrot_training - Step 31647: {'lr': 0.0004521075443370048, 'samples': 16203776, 'steps': 31647, 'loss/train': 1.3651809692382812} +03/05/2022 02:39:30 - INFO - codeparrot_training - Skipping example with length 510 (seq_length=1024) +03/05/2022 02:39:35 - INFO - codeparrot_training - Step 31648: {'lr': 0.0004521044207837256, 'samples': 16204288, 'steps': 31648, 'loss/train': 1.7581672668457031} +03/05/2022 02:39:38 - INFO - codeparrot_training - Step 31649: {'lr': 0.0004521012971393812, 'samples': 16204800, 'steps': 31649, 'loss/train': 1.9649947881698608} +03/05/2022 02:39:38 - INFO - codeparrot_training - Skipping example with length 934 (seq_length=1024) +03/05/2022 02:39:43 - INFO - codeparrot_training - Step 31650: {'lr': 0.0004520981734039731, 'samples': 16205312, 'steps': 31650, 'loss/train': 1.0028561353683472} +03/05/2022 02:39:46 - INFO - codeparrot_training - Step 31651: {'lr': 0.0004520950495775027, 'samples': 16205824, 'steps': 31651, 'loss/train': 2.3872528076171875} +03/05/2022 02:39:46 - INFO - codeparrot_training - Skipping example with length 1002 (seq_length=1024) +03/05/2022 02:39:52 - INFO - codeparrot_training - Step 31652: {'lr': 0.00045209192565997137, 'samples': 16206336, 'steps': 31652, 'loss/train': 2.0773656368255615} +03/05/2022 02:39:55 - INFO - codeparrot_training - Step 31653: {'lr': 0.00045208880165138054, 'samples': 16206848, 'steps': 31653, 'loss/train': 1.9626826047897339} +03/05/2022 02:39:55 - INFO - codeparrot_training - Skipping example with length 108 (seq_length=1024) +03/05/2022 02:40:00 - INFO - codeparrot_training - Step 31654: {'lr': 0.0004520856775517316, 'samples': 16207360, 'steps': 31654, 'loss/train': 3.0475759506225586} +03/05/2022 02:40:03 - INFO - codeparrot_training - Skipping example with length 154 (seq_length=1024) +03/05/2022 02:40:05 - INFO - codeparrot_training - Step 31655: {'lr': 0.00045208255336102597, 'samples': 16207872, 'steps': 31655, 'loss/train': 2.127302646636963} +03/05/2022 02:40:08 - INFO - codeparrot_training - Step 31656: {'lr': 0.0004520794290792651, 'samples': 16208384, 'steps': 31656, 'loss/train': 1.8837140798568726} +03/05/2022 02:40:11 - INFO - codeparrot_training - Skipping example with length 363 (seq_length=1024) +03/05/2022 02:40:14 - INFO - codeparrot_training - Step 31657: {'lr': 0.0004520763047064503, 'samples': 16208896, 'steps': 31657, 'loss/train': 1.559601068496704} +03/05/2022 02:40:17 - INFO - codeparrot_training - Step 31658: {'lr': 0.0004520731802425831, 'samples': 16209408, 'steps': 31658, 'loss/train': 1.8940517902374268} +03/05/2022 02:40:20 - INFO - codeparrot_training - Skipping example with length 221 (seq_length=1024) +03/05/2022 02:40:22 - INFO - codeparrot_training - Step 31659: {'lr': 0.0004520700556876648, 'samples': 16209920, 'steps': 31659, 'loss/train': 1.4561841487884521} +03/05/2022 02:40:25 - INFO - codeparrot_training - Step 31660: {'lr': 0.0004520669310416969, 'samples': 16210432, 'steps': 31660, 'loss/train': 1.7505598068237305} +03/05/2022 02:40:28 - INFO - codeparrot_training - Skipping example with length 908 (seq_length=1024) +03/05/2022 02:40:31 - INFO - codeparrot_training - Step 31661: {'lr': 0.0004520638063046807, 'samples': 16210944, 'steps': 31661, 'loss/train': 1.4576059579849243} +03/05/2022 02:40:34 - INFO - codeparrot_training - Step 31662: {'lr': 0.0004520606814766177, 'samples': 16211456, 'steps': 31662, 'loss/train': 1.0030043125152588} +03/05/2022 02:40:36 - INFO - codeparrot_training - Skipping example with length 354 (seq_length=1024) +03/05/2022 02:40:39 - INFO - codeparrot_training - Step 31663: {'lr': 0.00045205755655750924, 'samples': 16211968, 'steps': 31663, 'loss/train': 1.9131088256835938} +03/05/2022 02:40:42 - INFO - codeparrot_training - Step 31664: {'lr': 0.0004520544315473568, 'samples': 16212480, 'steps': 31664, 'loss/train': 1.380644679069519} +03/05/2022 02:40:44 - INFO - codeparrot_training - Skipping example with length 317 (seq_length=1024) +03/05/2022 02:40:47 - INFO - codeparrot_training - Step 31665: {'lr': 0.00045205130644616177, 'samples': 16212992, 'steps': 31665, 'loss/train': 1.4131038188934326} +03/05/2022 02:40:51 - INFO - codeparrot_training - Step 31666: {'lr': 0.0004520481812539255, 'samples': 16213504, 'steps': 31666, 'loss/train': 1.496529221534729} +03/05/2022 02:40:53 - INFO - codeparrot_training - Skipping example with length 886 (seq_length=1024) +03/05/2022 02:40:56 - INFO - codeparrot_training - Step 31667: {'lr': 0.00045204505597064943, 'samples': 16214016, 'steps': 31667, 'loss/train': 0.12706409394741058} +03/05/2022 02:40:59 - INFO - codeparrot_training - Step 31668: {'lr': 0.00045204193059633505, 'samples': 16214528, 'steps': 31668, 'loss/train': 2.0271198749542236} +03/05/2022 02:41:01 - INFO - codeparrot_training - Skipping example with length 591 (seq_length=1024) +03/05/2022 02:41:04 - INFO - codeparrot_training - Step 31669: {'lr': 0.0004520388051309836, 'samples': 16215040, 'steps': 31669, 'loss/train': 2.3709213733673096} +03/05/2022 02:41:07 - INFO - codeparrot_training - Step 31670: {'lr': 0.00045203567957459657, 'samples': 16215552, 'steps': 31670, 'loss/train': 1.4888590574264526} +03/05/2022 02:41:09 - INFO - codeparrot_training - Skipping example with length 697 (seq_length=1024) +03/05/2022 02:41:13 - INFO - codeparrot_training - Step 31671: {'lr': 0.00045203255392717545, 'samples': 16216064, 'steps': 31671, 'loss/train': 2.06488037109375} +03/05/2022 02:41:16 - INFO - codeparrot_training - Step 31672: {'lr': 0.00045202942818872157, 'samples': 16216576, 'steps': 31672, 'loss/train': 1.5083506107330322} +03/05/2022 02:41:18 - INFO - codeparrot_training - Skipping example with length 859 (seq_length=1024) +03/05/2022 02:41:21 - INFO - codeparrot_training - Step 31673: {'lr': 0.0004520263023592363, 'samples': 16217088, 'steps': 31673, 'loss/train': 1.8850589990615845} +03/05/2022 02:41:24 - INFO - codeparrot_training - Step 31674: {'lr': 0.00045202317643872113, 'samples': 16217600, 'steps': 31674, 'loss/train': 2.0380096435546875} +03/05/2022 02:41:26 - INFO - codeparrot_training - Skipping example with length 340 (seq_length=1024) +03/05/2022 02:41:29 - INFO - codeparrot_training - Step 31675: {'lr': 0.00045202005042717743, 'samples': 16218112, 'steps': 31675, 'loss/train': 2.1981077194213867} +03/05/2022 02:41:32 - INFO - codeparrot_training - Step 31676: {'lr': 0.0004520169243246066, 'samples': 16218624, 'steps': 31676, 'loss/train': 1.7429442405700684} +03/05/2022 02:41:34 - INFO - codeparrot_training - Skipping example with length 1011 (seq_length=1024) +03/05/2022 02:41:38 - INFO - codeparrot_training - Step 31677: {'lr': 0.0004520137981310101, 'samples': 16219136, 'steps': 31677, 'loss/train': 1.3953373432159424} +03/05/2022 02:41:41 - INFO - codeparrot_training - Step 31678: {'lr': 0.0004520106718463893, 'samples': 16219648, 'steps': 31678, 'loss/train': 1.905089259147644} +03/05/2022 02:41:42 - INFO - codeparrot_training - Skipping example with length 587 (seq_length=1024) +03/05/2022 02:41:46 - INFO - codeparrot_training - Step 31679: {'lr': 0.0004520075454707456, 'samples': 16220160, 'steps': 31679, 'loss/train': 1.4570354223251343} +03/05/2022 02:41:49 - INFO - codeparrot_training - Step 31680: {'lr': 0.0004520044190040804, 'samples': 16220672, 'steps': 31680, 'loss/train': 1.72770357131958} +03/05/2022 02:41:51 - INFO - codeparrot_training - Skipping example with length 212 (seq_length=1024) +03/05/2022 02:41:55 - INFO - codeparrot_training - Step 31681: {'lr': 0.0004520012924463951, 'samples': 16221184, 'steps': 31681, 'loss/train': 0.7951334118843079} +03/05/2022 02:41:58 - INFO - codeparrot_training - Step 31682: {'lr': 0.0004519981657976912, 'samples': 16221696, 'steps': 31682, 'loss/train': 1.2828333377838135} +03/05/2022 02:41:59 - INFO - codeparrot_training - Skipping example with length 586 (seq_length=1024) +03/05/2022 02:42:03 - INFO - codeparrot_training - Step 31683: {'lr': 0.00045199503905797, 'samples': 16222208, 'steps': 31683, 'loss/train': 1.8788996934890747} +03/05/2022 02:42:06 - INFO - codeparrot_training - Step 31684: {'lr': 0.0004519919122272329, 'samples': 16222720, 'steps': 31684, 'loss/train': 2.659221887588501} +03/05/2022 02:42:07 - INFO - codeparrot_training - Skipping example with length 155 (seq_length=1024) +03/05/2022 02:42:11 - INFO - codeparrot_training - Step 31685: {'lr': 0.00045198878530548146, 'samples': 16223232, 'steps': 31685, 'loss/train': 2.2966699600219727} +03/05/2022 02:42:15 - INFO - codeparrot_training - Step 31686: {'lr': 0.0004519856582927169, 'samples': 16223744, 'steps': 31686, 'loss/train': 1.558124303817749} +03/05/2022 02:42:16 - INFO - codeparrot_training - Skipping example with length 58 (seq_length=1024) +03/05/2022 02:42:20 - INFO - codeparrot_training - Step 31687: {'lr': 0.00045198253118894084, 'samples': 16224256, 'steps': 31687, 'loss/train': 2.451099157333374} +03/05/2022 02:42:23 - INFO - codeparrot_training - Step 31688: {'lr': 0.0004519794039941545, 'samples': 16224768, 'steps': 31688, 'loss/train': 1.467653512954712} +03/05/2022 02:42:24 - INFO - codeparrot_training - Skipping example with length 81 (seq_length=1024) +03/05/2022 02:42:28 - INFO - codeparrot_training - Step 31689: {'lr': 0.0004519762767083593, 'samples': 16225280, 'steps': 31689, 'loss/train': 1.9793176651000977} +03/05/2022 02:42:32 - INFO - codeparrot_training - Step 31690: {'lr': 0.00045197314933155677, 'samples': 16225792, 'steps': 31690, 'loss/train': 1.5835257768630981} +03/05/2022 02:42:33 - INFO - codeparrot_training - Skipping example with length 121 (seq_length=1024) +03/05/2022 02:42:37 - INFO - codeparrot_training - Step 31691: {'lr': 0.0004519700218637482, 'samples': 16226304, 'steps': 31691, 'loss/train': 1.8030756711959839} +03/05/2022 02:42:40 - INFO - codeparrot_training - Step 31692: {'lr': 0.00045196689430493516, 'samples': 16226816, 'steps': 31692, 'loss/train': 1.190625548362732} +03/05/2022 02:42:41 - INFO - codeparrot_training - Skipping example with length 390 (seq_length=1024) +03/05/2022 02:42:45 - INFO - codeparrot_training - Step 31693: {'lr': 0.00045196376665511883, 'samples': 16227328, 'steps': 31693, 'loss/train': 0.9631977081298828} +03/05/2022 02:42:48 - INFO - codeparrot_training - Step 31694: {'lr': 0.00045196063891430086, 'samples': 16227840, 'steps': 31694, 'loss/train': 1.2497475147247314} +03/05/2022 02:42:50 - INFO - codeparrot_training - Skipping example with length 730 (seq_length=1024) +03/05/2022 02:42:54 - INFO - codeparrot_training - Step 31695: {'lr': 0.0004519575110824825, 'samples': 16228352, 'steps': 31695, 'loss/train': 1.792426347732544} +03/05/2022 02:42:57 - INFO - codeparrot_training - Step 31696: {'lr': 0.0004519543831596652, 'samples': 16228864, 'steps': 31696, 'loss/train': 1.5987141132354736} +03/05/2022 02:42:58 - INFO - codeparrot_training - Skipping example with length 529 (seq_length=1024) +03/05/2022 02:43:02 - INFO - codeparrot_training - Step 31697: {'lr': 0.0004519512551458503, 'samples': 16229376, 'steps': 31697, 'loss/train': 2.129547119140625} +03/05/2022 02:43:05 - INFO - codeparrot_training - Step 31698: {'lr': 0.0004519481270410394, 'samples': 16229888, 'steps': 31698, 'loss/train': 2.1524972915649414} +03/05/2022 02:43:06 - INFO - codeparrot_training - Skipping example with length 799 (seq_length=1024) +03/05/2022 02:43:11 - INFO - codeparrot_training - Step 31699: {'lr': 0.00045194499884523376, 'samples': 16230400, 'steps': 31699, 'loss/train': 2.0305118560791016} +03/05/2022 02:43:14 - INFO - codeparrot_training - Step 31700: {'lr': 0.0004519418705584348, 'samples': 16230912, 'steps': 31700, 'loss/train': 0.8260295391082764} +03/05/2022 02:43:15 - INFO - codeparrot_training - Skipping example with length 700 (seq_length=1024) +03/05/2022 02:43:19 - INFO - codeparrot_training - Step 31701: {'lr': 0.0004519387421806439, 'samples': 16231424, 'steps': 31701, 'loss/train': 2.1808745861053467} +03/05/2022 02:43:22 - INFO - codeparrot_training - Step 31702: {'lr': 0.0004519356137118625, 'samples': 16231936, 'steps': 31702, 'loss/train': 1.8498154878616333} +03/05/2022 02:43:24 - INFO - codeparrot_training - Skipping example with length 120 (seq_length=1024) +03/05/2022 02:43:28 - INFO - codeparrot_training - Step 31703: {'lr': 0.00045193248515209216, 'samples': 16232448, 'steps': 31703, 'loss/train': 1.867157220840454} +03/05/2022 02:43:31 - INFO - codeparrot_training - Step 31704: {'lr': 0.0004519293565013341, 'samples': 16232960, 'steps': 31704, 'loss/train': 1.7759273052215576} +03/05/2022 02:43:32 - INFO - codeparrot_training - Skipping example with length 703 (seq_length=1024) +03/05/2022 02:43:36 - INFO - codeparrot_training - Step 31705: {'lr': 0.0004519262277595898, 'samples': 16233472, 'steps': 31705, 'loss/train': 1.4876981973648071} +03/05/2022 02:43:39 - INFO - codeparrot_training - Step 31706: {'lr': 0.0004519230989268606, 'samples': 16233984, 'steps': 31706, 'loss/train': 1.9603303670883179} +03/05/2022 02:43:40 - INFO - codeparrot_training - Skipping example with length 818 (seq_length=1024) +03/05/2022 02:43:45 - INFO - codeparrot_training - Step 31707: {'lr': 0.000451919970003148, 'samples': 16234496, 'steps': 31707, 'loss/train': 1.3129453659057617} +03/05/2022 02:43:48 - INFO - codeparrot_training - Step 31708: {'lr': 0.0004519168409884534, 'samples': 16235008, 'steps': 31708, 'loss/train': 1.6527740955352783} +03/05/2022 02:43:49 - INFO - codeparrot_training - Skipping example with length 241 (seq_length=1024) +03/05/2022 02:43:53 - INFO - codeparrot_training - Step 31709: {'lr': 0.00045191371188277817, 'samples': 16235520, 'steps': 31709, 'loss/train': 1.511582851409912} +03/05/2022 02:43:56 - INFO - codeparrot_training - Step 31710: {'lr': 0.0004519105826861237, 'samples': 16236032, 'steps': 31710, 'loss/train': 1.9950817823410034} +03/05/2022 02:43:58 - INFO - codeparrot_training - Skipping example with length 722 (seq_length=1024) +03/05/2022 02:44:02 - INFO - codeparrot_training - Step 31711: {'lr': 0.0004519074533984915, 'samples': 16236544, 'steps': 31711, 'loss/train': 1.0954766273498535} +03/05/2022 02:44:05 - INFO - codeparrot_training - Step 31712: {'lr': 0.0004519043240198829, 'samples': 16237056, 'steps': 31712, 'loss/train': 2.137829303741455} +03/05/2022 02:44:08 - INFO - codeparrot_training - Step 31713: {'lr': 0.0004519011945502993, 'samples': 16237568, 'steps': 31713, 'loss/train': 1.3465287685394287} +03/05/2022 02:44:08 - INFO - codeparrot_training - Skipping example with length 74 (seq_length=1024) +03/05/2022 02:44:14 - INFO - codeparrot_training - Step 31714: {'lr': 0.00045189806498974216, 'samples': 16238080, 'steps': 31714, 'loss/train': 1.7914372682571411} +03/05/2022 02:44:17 - INFO - codeparrot_training - Skipping example with length 667 (seq_length=1024) +03/05/2022 02:44:19 - INFO - codeparrot_training - Step 31715: {'lr': 0.00045189493533821285, 'samples': 16238592, 'steps': 31715, 'loss/train': 1.8237380981445312} +03/05/2022 02:44:22 - INFO - codeparrot_training - Step 31716: {'lr': 0.0004518918055957128, 'samples': 16239104, 'steps': 31716, 'loss/train': 2.1610751152038574} +03/05/2022 02:44:25 - INFO - codeparrot_training - Skipping example with length 197 (seq_length=1024) +03/05/2022 02:44:27 - INFO - codeparrot_training - Step 31717: {'lr': 0.0004518886757622435, 'samples': 16239616, 'steps': 31717, 'loss/train': 1.9940295219421387} +03/05/2022 02:44:31 - INFO - codeparrot_training - Step 31718: {'lr': 0.0004518855458378062, 'samples': 16240128, 'steps': 31718, 'loss/train': 1.4362796545028687} +03/05/2022 02:44:33 - INFO - codeparrot_training - Skipping example with length 100 (seq_length=1024) +03/05/2022 02:44:36 - INFO - codeparrot_training - Step 31719: {'lr': 0.0004518824158224023, 'samples': 16240640, 'steps': 31719, 'loss/train': 1.6215218305587769} +03/05/2022 02:44:39 - INFO - codeparrot_training - Step 31720: {'lr': 0.00045187928571603343, 'samples': 16241152, 'steps': 31720, 'loss/train': 1.430087924003601} +03/05/2022 02:44:41 - INFO - codeparrot_training - Skipping example with length 433 (seq_length=1024) +03/05/2022 02:44:44 - INFO - codeparrot_training - Step 31721: {'lr': 0.0004518761555187008, 'samples': 16241664, 'steps': 31721, 'loss/train': 2.02836012840271} +03/05/2022 02:44:47 - INFO - codeparrot_training - Step 31722: {'lr': 0.00045187302523040597, 'samples': 16242176, 'steps': 31722, 'loss/train': 1.0167558193206787} +03/05/2022 02:44:50 - INFO - codeparrot_training - Skipping example with length 948 (seq_length=1024) +03/05/2022 02:44:53 - INFO - codeparrot_training - Step 31723: {'lr': 0.00045186989485115014, 'samples': 16242688, 'steps': 31723, 'loss/train': 1.7651481628417969} +03/05/2022 02:44:56 - INFO - codeparrot_training - Step 31724: {'lr': 0.000451866764380935, 'samples': 16243200, 'steps': 31724, 'loss/train': 0.2187340259552002} +03/05/2022 02:44:58 - INFO - codeparrot_training - Skipping example with length 756 (seq_length=1024) +03/05/2022 02:45:01 - INFO - codeparrot_training - Step 31725: {'lr': 0.0004518636338197617, 'samples': 16243712, 'steps': 31725, 'loss/train': 1.924948811531067} +03/05/2022 02:45:04 - INFO - codeparrot_training - Step 31726: {'lr': 0.00045186050316763186, 'samples': 16244224, 'steps': 31726, 'loss/train': 1.245557188987732} +03/05/2022 02:45:06 - INFO - codeparrot_training - Skipping example with length 128 (seq_length=1024) +03/05/2022 02:45:10 - INFO - codeparrot_training - Step 31727: {'lr': 0.0004518573724245467, 'samples': 16244736, 'steps': 31727, 'loss/train': 1.7461291551589966} +03/05/2022 02:45:13 - INFO - codeparrot_training - Step 31728: {'lr': 0.00045185424159050776, 'samples': 16245248, 'steps': 31728, 'loss/train': 2.007668972015381} +03/05/2022 02:45:15 - INFO - codeparrot_training - Skipping example with length 259 (seq_length=1024) +03/05/2022 02:45:18 - INFO - codeparrot_training - Step 31729: {'lr': 0.00045185111066551643, 'samples': 16245760, 'steps': 31729, 'loss/train': 1.9318382740020752} +03/05/2022 02:45:21 - INFO - codeparrot_training - Step 31730: {'lr': 0.0004518479796495741, 'samples': 16246272, 'steps': 31730, 'loss/train': 4.010793209075928} +03/05/2022 02:45:23 - INFO - codeparrot_training - Skipping example with length 266 (seq_length=1024) +03/05/2022 02:45:27 - INFO - codeparrot_training - Step 31731: {'lr': 0.00045184484854268216, 'samples': 16246784, 'steps': 31731, 'loss/train': 1.8899635076522827} +03/05/2022 02:45:30 - INFO - codeparrot_training - Step 31732: {'lr': 0.00045184171734484203, 'samples': 16247296, 'steps': 31732, 'loss/train': 1.649454116821289} +03/05/2022 02:45:33 - INFO - codeparrot_training - Step 31733: {'lr': 0.00045183858605605517, 'samples': 16247808, 'steps': 31733, 'loss/train': 2.162670135498047} +03/05/2022 02:45:33 - INFO - codeparrot_training - Skipping example with length 90 (seq_length=1024) +03/05/2022 02:45:39 - INFO - codeparrot_training - Step 31734: {'lr': 0.00045183545467632295, 'samples': 16248320, 'steps': 31734, 'loss/train': 1.5207518339157104} +03/05/2022 02:45:42 - INFO - codeparrot_training - Step 31735: {'lr': 0.0004518323232056468, 'samples': 16248832, 'steps': 31735, 'loss/train': 1.4781872034072876} +03/05/2022 02:45:47 - INFO - codeparrot_training - Step 31736: {'lr': 0.0004518291916440281, 'samples': 16249344, 'steps': 31736, 'loss/train': 1.7404606342315674} +03/05/2022 02:45:50 - INFO - codeparrot_training - Step 31737: {'lr': 0.0004518260599914683, 'samples': 16249856, 'steps': 31737, 'loss/train': 2.054672956466675} +03/05/2022 02:45:50 - INFO - codeparrot_training - Skipping example with length 889 (seq_length=1024) +03/05/2022 02:45:55 - INFO - codeparrot_training - Step 31738: {'lr': 0.0004518229282479688, 'samples': 16250368, 'steps': 31738, 'loss/train': 1.5744974613189697} +03/05/2022 02:45:58 - INFO - codeparrot_training - Skipping example with length 596 (seq_length=1024) +03/05/2022 02:46:01 - INFO - codeparrot_training - Step 31739: {'lr': 0.000451819796413531, 'samples': 16250880, 'steps': 31739, 'loss/train': 1.680079460144043} +03/05/2022 02:46:04 - INFO - codeparrot_training - Step 31740: {'lr': 0.0004518166644881563, 'samples': 16251392, 'steps': 31740, 'loss/train': 1.8072750568389893} +03/05/2022 02:46:07 - INFO - codeparrot_training - Step 31741: {'lr': 0.0004518135324718461, 'samples': 16251904, 'steps': 31741, 'loss/train': 1.5976402759552002} +03/05/2022 02:46:07 - INFO - codeparrot_training - Skipping example with length 676 (seq_length=1024) +03/05/2022 02:46:13 - INFO - codeparrot_training - Step 31742: {'lr': 0.00045181040036460185, 'samples': 16252416, 'steps': 31742, 'loss/train': 2.039569854736328} +03/05/2022 02:46:16 - INFO - codeparrot_training - Step 31743: {'lr': 0.0004518072681664249, 'samples': 16252928, 'steps': 31743, 'loss/train': 1.698258638381958} +03/05/2022 02:46:16 - INFO - codeparrot_training - Skipping example with length 786 (seq_length=1024) +03/05/2022 02:46:21 - INFO - codeparrot_training - Step 31744: {'lr': 0.0004518041358773168, 'samples': 16253440, 'steps': 31744, 'loss/train': 1.7008917331695557} +03/05/2022 02:46:24 - INFO - codeparrot_training - Step 31745: {'lr': 0.0004518010034972788, 'samples': 16253952, 'steps': 31745, 'loss/train': 1.7665826082229614} +03/05/2022 02:46:24 - INFO - codeparrot_training - Skipping example with length 64 (seq_length=1024) +03/05/2022 02:46:30 - INFO - codeparrot_training - Step 31746: {'lr': 0.0004517978710263124, 'samples': 16254464, 'steps': 31746, 'loss/train': 1.3124279975891113} +03/05/2022 02:46:33 - INFO - codeparrot_training - Step 31747: {'lr': 0.0004517947384644191, 'samples': 16254976, 'steps': 31747, 'loss/train': 1.766959309577942} +03/05/2022 02:46:33 - INFO - codeparrot_training - Skipping example with length 737 (seq_length=1024) +03/05/2022 02:46:38 - INFO - codeparrot_training - Step 31748: {'lr': 0.00045179160581160005, 'samples': 16255488, 'steps': 31748, 'loss/train': 1.5297390222549438} +03/05/2022 02:46:41 - INFO - codeparrot_training - Step 31749: {'lr': 0.0004517884730678569, 'samples': 16256000, 'steps': 31749, 'loss/train': 2.06141996383667} +03/05/2022 02:46:41 - INFO - codeparrot_training - Skipping example with length 977 (seq_length=1024) +03/05/2022 02:46:46 - INFO - codeparrot_training - Step 31750: {'lr': 0.00045178534023319097, 'samples': 16256512, 'steps': 31750, 'loss/train': 1.2325838804244995} +03/05/2022 02:46:49 - INFO - codeparrot_training - Skipping example with length 355 (seq_length=1024) +03/05/2022 02:46:52 - INFO - codeparrot_training - Step 31751: {'lr': 0.00045178220730760367, 'samples': 16257024, 'steps': 31751, 'loss/train': 1.4560389518737793} +03/05/2022 02:46:55 - INFO - codeparrot_training - Step 31752: {'lr': 0.0004517790742910964, 'samples': 16257536, 'steps': 31752, 'loss/train': 1.7231682538986206} +03/05/2022 02:46:58 - INFO - codeparrot_training - Skipping example with length 378 (seq_length=1024) +03/05/2022 02:47:00 - INFO - codeparrot_training - Step 31753: {'lr': 0.0004517759411836706, 'samples': 16258048, 'steps': 31753, 'loss/train': 2.8942039012908936} +03/05/2022 02:47:03 - INFO - codeparrot_training - Step 31754: {'lr': 0.0004517728079853277, 'samples': 16258560, 'steps': 31754, 'loss/train': 0.2740870714187622} +03/05/2022 02:47:06 - INFO - codeparrot_training - Skipping example with length 786 (seq_length=1024) +03/05/2022 02:47:09 - INFO - codeparrot_training - Step 31755: {'lr': 0.0004517696746960691, 'samples': 16259072, 'steps': 31755, 'loss/train': 2.1802561283111572} +03/05/2022 02:47:12 - INFO - codeparrot_training - Step 31756: {'lr': 0.00045176654131589617, 'samples': 16259584, 'steps': 31756, 'loss/train': 1.7064852714538574} +03/05/2022 02:47:15 - INFO - codeparrot_training - Skipping example with length 821 (seq_length=1024) +03/05/2022 02:47:17 - INFO - codeparrot_training - Step 31757: {'lr': 0.0004517634078448103, 'samples': 16260096, 'steps': 31757, 'loss/train': 1.633244514465332} +03/05/2022 02:47:20 - INFO - codeparrot_training - Step 31758: {'lr': 0.0004517602742828131, 'samples': 16260608, 'steps': 31758, 'loss/train': 1.0179920196533203} +03/05/2022 02:47:23 - INFO - codeparrot_training - Skipping example with length 462 (seq_length=1024) +03/05/2022 02:47:25 - INFO - codeparrot_training - Step 31759: {'lr': 0.0004517571406299057, 'samples': 16261120, 'steps': 31759, 'loss/train': 0.5536475777626038} +03/05/2022 02:47:29 - INFO - codeparrot_training - Step 31760: {'lr': 0.0004517540068860897, 'samples': 16261632, 'steps': 31760, 'loss/train': 1.843300461769104} +03/05/2022 02:47:31 - INFO - codeparrot_training - Skipping example with length 255 (seq_length=1024) +03/05/2022 02:47:34 - INFO - codeparrot_training - Step 31761: {'lr': 0.0004517508730513664, 'samples': 16262144, 'steps': 31761, 'loss/train': 1.1719732284545898} +03/05/2022 02:47:37 - INFO - codeparrot_training - Step 31762: {'lr': 0.00045174773912573735, 'samples': 16262656, 'steps': 31762, 'loss/train': 1.827906847000122} +03/05/2022 02:47:40 - INFO - codeparrot_training - Skipping example with length 275 (seq_length=1024) +03/05/2022 02:47:42 - INFO - codeparrot_training - Step 31763: {'lr': 0.00045174460510920386, 'samples': 16263168, 'steps': 31763, 'loss/train': 2.518206834793091} +03/05/2022 02:47:45 - INFO - codeparrot_training - Step 31764: {'lr': 0.00045174147100176734, 'samples': 16263680, 'steps': 31764, 'loss/train': 1.5004510879516602} +03/05/2022 02:47:48 - INFO - codeparrot_training - Skipping example with length 397 (seq_length=1024) +03/05/2022 02:47:51 - INFO - codeparrot_training - Step 31765: {'lr': 0.00045173833680342925, 'samples': 16264192, 'steps': 31765, 'loss/train': 1.0793771743774414} +03/05/2022 02:47:54 - INFO - codeparrot_training - Step 31766: {'lr': 0.00045173520251419095, 'samples': 16264704, 'steps': 31766, 'loss/train': 1.4264402389526367} +03/05/2022 02:47:56 - INFO - codeparrot_training - Skipping example with length 647 (seq_length=1024) +03/05/2022 02:47:59 - INFO - codeparrot_training - Step 31767: {'lr': 0.0004517320681340539, 'samples': 16265216, 'steps': 31767, 'loss/train': 1.2054189443588257} +03/05/2022 02:48:03 - INFO - codeparrot_training - Step 31768: {'lr': 0.0004517289336630195, 'samples': 16265728, 'steps': 31768, 'loss/train': 1.71027410030365} +03/05/2022 02:48:05 - INFO - codeparrot_training - Skipping example with length 739 (seq_length=1024) +03/05/2022 02:48:08 - INFO - codeparrot_training - Step 31769: {'lr': 0.0004517257991010891, 'samples': 16266240, 'steps': 31769, 'loss/train': 1.573933720588684} +03/05/2022 02:48:11 - INFO - codeparrot_training - Step 31770: {'lr': 0.0004517226644482642, 'samples': 16266752, 'steps': 31770, 'loss/train': 2.0494937896728516} +03/05/2022 02:48:14 - INFO - codeparrot_training - Skipping example with length 279 (seq_length=1024) +03/05/2022 02:48:16 - INFO - codeparrot_training - Step 31771: {'lr': 0.00045171952970454623, 'samples': 16267264, 'steps': 31771, 'loss/train': 2.298218250274658} +03/05/2022 02:48:20 - INFO - codeparrot_training - Step 31772: {'lr': 0.0004517163948699365, 'samples': 16267776, 'steps': 31772, 'loss/train': 0.05792680382728577} +03/05/2022 02:48:22 - INFO - codeparrot_training - Skipping example with length 137 (seq_length=1024) +03/05/2022 02:48:25 - INFO - codeparrot_training - Step 31773: {'lr': 0.00045171325994443644, 'samples': 16268288, 'steps': 31773, 'loss/train': 1.6810221672058105} +03/05/2022 02:48:28 - INFO - codeparrot_training - Step 31774: {'lr': 0.00045171012492804753, 'samples': 16268800, 'steps': 31774, 'loss/train': 1.402950644493103} +03/05/2022 02:48:30 - INFO - codeparrot_training - Skipping example with length 981 (seq_length=1024) +03/05/2022 02:48:33 - INFO - codeparrot_training - Step 31775: {'lr': 0.0004517069898207712, 'samples': 16269312, 'steps': 31775, 'loss/train': 1.2547709941864014} +03/05/2022 02:48:36 - INFO - codeparrot_training - Step 31776: {'lr': 0.00045170385462260876, 'samples': 16269824, 'steps': 31776, 'loss/train': 1.9468953609466553} +03/05/2022 02:48:39 - INFO - codeparrot_training - Skipping example with length 600 (seq_length=1024) +03/05/2022 02:48:42 - INFO - codeparrot_training - Step 31777: {'lr': 0.0004517007193335617, 'samples': 16270336, 'steps': 31777, 'loss/train': 1.9092763662338257} +03/05/2022 02:48:45 - INFO - codeparrot_training - Step 31778: {'lr': 0.0004516975839536314, 'samples': 16270848, 'steps': 31778, 'loss/train': 1.630836844444275} +03/05/2022 02:48:47 - INFO - codeparrot_training - Skipping example with length 626 (seq_length=1024) +03/05/2022 02:48:50 - INFO - codeparrot_training - Step 31779: {'lr': 0.0004516944484828193, 'samples': 16271360, 'steps': 31779, 'loss/train': 0.8185743093490601} +03/05/2022 02:48:53 - INFO - codeparrot_training - Step 31780: {'lr': 0.0004516913129211268, 'samples': 16271872, 'steps': 31780, 'loss/train': 1.7097927331924438} +03/05/2022 02:48:55 - INFO - codeparrot_training - Skipping example with length 242 (seq_length=1024) +03/05/2022 02:48:59 - INFO - codeparrot_training - Step 31781: {'lr': 0.00045168817726855525, 'samples': 16272384, 'steps': 31781, 'loss/train': 1.8957138061523438} +03/05/2022 02:49:02 - INFO - codeparrot_training - Step 31782: {'lr': 0.0004516850415251061, 'samples': 16272896, 'steps': 31782, 'loss/train': 1.4866905212402344} +03/05/2022 02:49:03 - INFO - codeparrot_training - Skipping example with length 435 (seq_length=1024) +03/05/2022 02:49:07 - INFO - codeparrot_training - Step 31783: {'lr': 0.0004516819056907809, 'samples': 16273408, 'steps': 31783, 'loss/train': 2.675497531890869} +03/05/2022 02:49:10 - INFO - codeparrot_training - Step 31784: {'lr': 0.0004516787697655809, 'samples': 16273920, 'steps': 31784, 'loss/train': 1.717115044593811} +03/05/2022 02:49:12 - INFO - codeparrot_training - Skipping example with length 100 (seq_length=1024) +03/05/2022 02:49:16 - INFO - codeparrot_training - Step 31785: {'lr': 0.0004516756337495075, 'samples': 16274432, 'steps': 31785, 'loss/train': 2.263826847076416} +03/05/2022 02:49:19 - INFO - codeparrot_training - Step 31786: {'lr': 0.0004516724976425622, 'samples': 16274944, 'steps': 31786, 'loss/train': 1.6937733888626099} +03/05/2022 02:49:21 - INFO - codeparrot_training - Skipping example with length 1004 (seq_length=1024) +03/05/2022 02:49:24 - INFO - codeparrot_training - Step 31787: {'lr': 0.0004516693614447464, 'samples': 16275456, 'steps': 31787, 'loss/train': 2.688793420791626} +03/05/2022 02:49:27 - INFO - codeparrot_training - Step 31788: {'lr': 0.0004516662251560615, 'samples': 16275968, 'steps': 31788, 'loss/train': 1.3521760702133179} +03/05/2022 02:49:30 - INFO - codeparrot_training - Skipping example with length 769 (seq_length=1024) +03/05/2022 02:49:32 - INFO - codeparrot_training - Step 31789: {'lr': 0.0004516630887765089, 'samples': 16276480, 'steps': 31789, 'loss/train': 2.153630018234253} +03/05/2022 02:49:35 - INFO - codeparrot_training - Step 31790: {'lr': 0.00045165995230609003, 'samples': 16276992, 'steps': 31790, 'loss/train': 1.2454617023468018} +03/05/2022 02:49:38 - INFO - codeparrot_training - Skipping example with length 139 (seq_length=1024) +03/05/2022 02:49:41 - INFO - codeparrot_training - Step 31791: {'lr': 0.0004516568157448063, 'samples': 16277504, 'steps': 31791, 'loss/train': 1.1172261238098145} +03/05/2022 02:49:44 - INFO - codeparrot_training - Step 31792: {'lr': 0.00045165367909265916, 'samples': 16278016, 'steps': 31792, 'loss/train': 0.7798632979393005} +03/05/2022 02:49:47 - INFO - codeparrot_training - Skipping example with length 758 (seq_length=1024) +03/05/2022 02:49:49 - INFO - codeparrot_training - Step 31793: {'lr': 0.00045165054234964984, 'samples': 16278528, 'steps': 31793, 'loss/train': 2.2542359828948975} +03/05/2022 02:49:53 - INFO - codeparrot_training - Step 31794: {'lr': 0.0004516474055157801, 'samples': 16279040, 'steps': 31794, 'loss/train': 1.832531213760376} +03/05/2022 02:49:55 - INFO - codeparrot_training - Skipping example with length 878 (seq_length=1024) +03/05/2022 02:49:58 - INFO - codeparrot_training - Step 31795: {'lr': 0.000451644268591051, 'samples': 16279552, 'steps': 31795, 'loss/train': 1.1278120279312134} +03/05/2022 02:50:01 - INFO - codeparrot_training - Step 31796: {'lr': 0.00045164113157546414, 'samples': 16280064, 'steps': 31796, 'loss/train': 1.618048071861267} +03/05/2022 02:50:04 - INFO - codeparrot_training - Skipping example with length 801 (seq_length=1024) +03/05/2022 02:50:06 - INFO - codeparrot_training - Step 31797: {'lr': 0.0004516379944690209, 'samples': 16280576, 'steps': 31797, 'loss/train': 1.7062360048294067} +03/05/2022 02:50:09 - INFO - codeparrot_training - Step 31798: {'lr': 0.0004516348572717227, 'samples': 16281088, 'steps': 31798, 'loss/train': 1.5274795293807983} +03/05/2022 02:50:12 - INFO - codeparrot_training - Skipping example with length 142 (seq_length=1024) +03/05/2022 02:50:15 - INFO - codeparrot_training - Step 31799: {'lr': 0.000451631719983571, 'samples': 16281600, 'steps': 31799, 'loss/train': 1.377568006515503} +03/05/2022 02:50:18 - INFO - codeparrot_training - Step 31800: {'lr': 0.00045162858260456705, 'samples': 16282112, 'steps': 31800, 'loss/train': 1.6362025737762451} +03/05/2022 02:50:20 - INFO - codeparrot_training - Skipping example with length 111 (seq_length=1024) +03/05/2022 02:50:23 - INFO - codeparrot_training - Step 31801: {'lr': 0.0004516254451347125, 'samples': 16282624, 'steps': 31801, 'loss/train': 1.8461443185806274} +03/05/2022 02:50:26 - INFO - codeparrot_training - Step 31802: {'lr': 0.0004516223075740085, 'samples': 16283136, 'steps': 31802, 'loss/train': 0.619382917881012} +03/05/2022 02:50:29 - INFO - codeparrot_training - Skipping example with length 804 (seq_length=1024) +03/05/2022 02:50:32 - INFO - codeparrot_training - Step 31803: {'lr': 0.00045161916992245664, 'samples': 16283648, 'steps': 31803, 'loss/train': 0.8664124608039856} +03/05/2022 02:50:35 - INFO - codeparrot_training - Step 31804: {'lr': 0.0004516160321800584, 'samples': 16284160, 'steps': 31804, 'loss/train': 0.5236685872077942} +03/05/2022 02:50:37 - INFO - codeparrot_training - Skipping example with length 834 (seq_length=1024) +03/05/2022 02:50:40 - INFO - codeparrot_training - Step 31805: {'lr': 0.000451612894346815, 'samples': 16284672, 'steps': 31805, 'loss/train': 1.8693708181381226} +03/05/2022 02:50:43 - INFO - codeparrot_training - Step 31806: {'lr': 0.00045160975642272795, 'samples': 16285184, 'steps': 31806, 'loss/train': 1.828359603881836} +03/05/2022 02:50:46 - INFO - codeparrot_training - Skipping example with length 663 (seq_length=1024) +03/05/2022 02:50:49 - INFO - codeparrot_training - Step 31807: {'lr': 0.0004516066184077986, 'samples': 16285696, 'steps': 31807, 'loss/train': 0.054384298622608185} +03/05/2022 02:50:52 - INFO - codeparrot_training - Step 31808: {'lr': 0.0004516034803020285, 'samples': 16286208, 'steps': 31808, 'loss/train': 1.6048599481582642} +03/05/2022 02:50:55 - INFO - codeparrot_training - Skipping example with length 83 (seq_length=1024) +03/05/2022 02:50:57 - INFO - codeparrot_training - Step 31809: {'lr': 0.0004516003421054189, 'samples': 16286720, 'steps': 31809, 'loss/train': 1.9228047132492065} +03/05/2022 02:51:01 - INFO - codeparrot_training - Step 31810: {'lr': 0.0004515972038179714, 'samples': 16287232, 'steps': 31810, 'loss/train': 1.960437297821045} +03/05/2022 02:51:03 - INFO - codeparrot_training - Skipping example with length 899 (seq_length=1024) +03/05/2022 02:51:06 - INFO - codeparrot_training - Step 31811: {'lr': 0.0004515940654396872, 'samples': 16287744, 'steps': 31811, 'loss/train': 1.6252107620239258} +03/05/2022 02:51:09 - INFO - codeparrot_training - Step 31812: {'lr': 0.00045159092697056794, 'samples': 16288256, 'steps': 31812, 'loss/train': 1.6809409856796265} +03/05/2022 02:51:11 - INFO - codeparrot_training - Skipping example with length 210 (seq_length=1024) +03/05/2022 02:51:14 - INFO - codeparrot_training - Step 31813: {'lr': 0.00045158778841061483, 'samples': 16288768, 'steps': 31813, 'loss/train': 1.8418540954589844} +03/05/2022 02:51:18 - INFO - codeparrot_training - Step 31814: {'lr': 0.0004515846497598294, 'samples': 16289280, 'steps': 31814, 'loss/train': 1.7240734100341797} +03/05/2022 02:51:20 - INFO - codeparrot_training - Skipping example with length 475 (seq_length=1024) +03/05/2022 02:51:23 - INFO - codeparrot_training - Step 31815: {'lr': 0.000451581511018213, 'samples': 16289792, 'steps': 31815, 'loss/train': 1.0928095579147339} +03/05/2022 02:51:26 - INFO - codeparrot_training - Step 31816: {'lr': 0.00045157837218576713, 'samples': 16290304, 'steps': 31816, 'loss/train': 1.6573946475982666} +03/05/2022 02:51:28 - INFO - codeparrot_training - Skipping example with length 540 (seq_length=1024) +03/05/2022 02:51:31 - INFO - codeparrot_training - Step 31817: {'lr': 0.00045157523326249316, 'samples': 16290816, 'steps': 31817, 'loss/train': 1.8898624181747437} +03/05/2022 02:51:35 - INFO - codeparrot_training - Step 31818: {'lr': 0.00045157209424839253, 'samples': 16291328, 'steps': 31818, 'loss/train': 1.8430675268173218} +03/05/2022 02:51:37 - INFO - codeparrot_training - Skipping example with length 549 (seq_length=1024) +03/05/2022 02:51:40 - INFO - codeparrot_training - Step 31819: {'lr': 0.0004515689551434665, 'samples': 16291840, 'steps': 31819, 'loss/train': 1.8320001363754272} +03/05/2022 02:51:43 - INFO - codeparrot_training - Step 31820: {'lr': 0.00045156581594771675, 'samples': 16292352, 'steps': 31820, 'loss/train': 2.5847766399383545} +03/05/2022 02:51:45 - INFO - codeparrot_training - Skipping example with length 481 (seq_length=1024) +03/05/2022 02:51:48 - INFO - codeparrot_training - Step 31821: {'lr': 0.00045156267666114446, 'samples': 16292864, 'steps': 31821, 'loss/train': 1.9770170450210571} +03/05/2022 02:51:51 - INFO - codeparrot_training - Step 31822: {'lr': 0.0004515595372837512, 'samples': 16293376, 'steps': 31822, 'loss/train': 1.488275408744812} +03/05/2022 02:51:53 - INFO - codeparrot_training - Skipping example with length 615 (seq_length=1024) +03/05/2022 02:51:57 - INFO - codeparrot_training - Step 31823: {'lr': 0.00045155639781553825, 'samples': 16293888, 'steps': 31823, 'loss/train': 1.2861467599868774} +03/05/2022 02:52:00 - INFO - codeparrot_training - Step 31824: {'lr': 0.00045155325825650715, 'samples': 16294400, 'steps': 31824, 'loss/train': 1.4563275575637817} +03/05/2022 02:52:02 - INFO - codeparrot_training - Skipping example with length 509 (seq_length=1024) +03/05/2022 02:52:06 - INFO - codeparrot_training - Step 31825: {'lr': 0.00045155011860665927, 'samples': 16294912, 'steps': 31825, 'loss/train': 2.0736804008483887} +03/05/2022 02:52:09 - INFO - codeparrot_training - Step 31826: {'lr': 0.00045154697886599606, 'samples': 16295424, 'steps': 31826, 'loss/train': 1.8365153074264526} +03/05/2022 02:52:12 - INFO - codeparrot_training - Step 31827: {'lr': 0.0004515438390345188, 'samples': 16295936, 'steps': 31827, 'loss/train': 0.157594695687294} +03/05/2022 02:52:12 - INFO - codeparrot_training - Skipping example with length 855 (seq_length=1024) +03/05/2022 02:52:17 - INFO - codeparrot_training - Step 31828: {'lr': 0.00045154069911222905, 'samples': 16296448, 'steps': 31828, 'loss/train': 1.3065181970596313} +03/05/2022 02:52:20 - INFO - codeparrot_training - Skipping example with length 582 (seq_length=1024) +03/05/2022 02:52:23 - INFO - codeparrot_training - Step 31829: {'lr': 0.0004515375590991281, 'samples': 16296960, 'steps': 31829, 'loss/train': 2.2466864585876465} +03/05/2022 02:52:26 - INFO - codeparrot_training - Step 31830: {'lr': 0.0004515344189952175, 'samples': 16297472, 'steps': 31830, 'loss/train': 2.1473350524902344} +03/05/2022 02:52:29 - INFO - codeparrot_training - Skipping example with length 220 (seq_length=1024) +03/05/2022 02:52:31 - INFO - codeparrot_training - Step 31831: {'lr': 0.0004515312788004986, 'samples': 16297984, 'steps': 31831, 'loss/train': 1.6698858737945557} +03/05/2022 02:52:34 - INFO - codeparrot_training - Step 31832: {'lr': 0.00045152813851497274, 'samples': 16298496, 'steps': 31832, 'loss/train': 0.07000356167554855} +03/05/2022 02:52:37 - INFO - codeparrot_training - Skipping example with length 631 (seq_length=1024) +03/05/2022 02:52:40 - INFO - codeparrot_training - Step 31833: {'lr': 0.0004515249981386416, 'samples': 16299008, 'steps': 31833, 'loss/train': 1.4705886840820312} +03/05/2022 02:52:43 - INFO - codeparrot_training - Step 31834: {'lr': 0.0004515218576715062, 'samples': 16299520, 'steps': 31834, 'loss/train': 1.3666563034057617} +03/05/2022 02:52:45 - INFO - codeparrot_training - Skipping example with length 827 (seq_length=1024) +03/05/2022 02:52:48 - INFO - codeparrot_training - Step 31835: {'lr': 0.00045151871711356827, 'samples': 16300032, 'steps': 31835, 'loss/train': 1.2498530149459839} +03/05/2022 02:52:51 - INFO - codeparrot_training - Step 31836: {'lr': 0.0004515155764648291, 'samples': 16300544, 'steps': 31836, 'loss/train': 1.845923662185669} +03/05/2022 02:52:53 - INFO - codeparrot_training - Skipping example with length 886 (seq_length=1024) +03/05/2022 02:52:57 - INFO - codeparrot_training - Step 31837: {'lr': 0.0004515124357252901, 'samples': 16301056, 'steps': 31837, 'loss/train': 1.0130943059921265} +03/05/2022 02:53:00 - INFO - codeparrot_training - Step 31838: {'lr': 0.0004515092948949527, 'samples': 16301568, 'steps': 31838, 'loss/train': 1.9048171043395996} +03/05/2022 02:53:02 - INFO - codeparrot_training - Skipping example with length 292 (seq_length=1024) +03/05/2022 02:53:05 - INFO - codeparrot_training - Step 31839: {'lr': 0.00045150615397381835, 'samples': 16302080, 'steps': 31839, 'loss/train': 1.3387864828109741} +03/05/2022 02:53:08 - INFO - codeparrot_training - Step 31840: {'lr': 0.0004515030129618884, 'samples': 16302592, 'steps': 31840, 'loss/train': 1.932776689529419} +03/05/2022 02:53:11 - INFO - codeparrot_training - Skipping example with length 342 (seq_length=1024) +03/05/2022 02:53:14 - INFO - codeparrot_training - Step 31841: {'lr': 0.0004514998718591643, 'samples': 16303104, 'steps': 31841, 'loss/train': 1.77843177318573} +03/05/2022 02:53:17 - INFO - codeparrot_training - Step 31842: {'lr': 0.0004514967306656475, 'samples': 16303616, 'steps': 31842, 'loss/train': 1.7404714822769165} +03/05/2022 02:53:19 - INFO - codeparrot_training - Skipping example with length 32 (seq_length=1024) +03/05/2022 02:53:22 - INFO - codeparrot_training - Step 31843: {'lr': 0.0004514935893813394, 'samples': 16304128, 'steps': 31843, 'loss/train': 1.1077680587768555} +03/05/2022 02:53:26 - INFO - codeparrot_training - Step 31844: {'lr': 0.00045149044800624135, 'samples': 16304640, 'steps': 31844, 'loss/train': 1.3739569187164307} +03/05/2022 02:53:28 - INFO - codeparrot_training - Skipping example with length 337 (seq_length=1024) +03/05/2022 02:53:31 - INFO - codeparrot_training - Step 31845: {'lr': 0.0004514873065403549, 'samples': 16305152, 'steps': 31845, 'loss/train': 1.5432828664779663} +03/05/2022 02:53:34 - INFO - codeparrot_training - Step 31846: {'lr': 0.0004514841649836813, 'samples': 16305664, 'steps': 31846, 'loss/train': 1.8257838487625122} +03/05/2022 02:53:37 - INFO - codeparrot_training - Skipping example with length 317 (seq_length=1024) +03/05/2022 02:53:39 - INFO - codeparrot_training - Step 31847: {'lr': 0.000451481023336222, 'samples': 16306176, 'steps': 31847, 'loss/train': 1.4391939640045166} +03/05/2022 02:53:43 - INFO - codeparrot_training - Step 31848: {'lr': 0.0004514778815979785, 'samples': 16306688, 'steps': 31848, 'loss/train': 2.4059624671936035} +03/05/2022 02:53:45 - INFO - codeparrot_training - Skipping example with length 548 (seq_length=1024) +03/05/2022 02:53:48 - INFO - codeparrot_training - Step 31849: {'lr': 0.0004514747397689522, 'samples': 16307200, 'steps': 31849, 'loss/train': 1.5942658185958862} +03/05/2022 02:53:51 - INFO - codeparrot_training - Step 31850: {'lr': 0.0004514715978491445, 'samples': 16307712, 'steps': 31850, 'loss/train': 1.565090298652649} +03/05/2022 02:53:53 - INFO - codeparrot_training - Skipping example with length 208 (seq_length=1024) +03/05/2022 02:53:56 - INFO - codeparrot_training - Step 31851: {'lr': 0.0004514684558385568, 'samples': 16308224, 'steps': 31851, 'loss/train': 1.8012075424194336} +03/05/2022 02:53:59 - INFO - codeparrot_training - Step 31852: {'lr': 0.0004514653137371905, 'samples': 16308736, 'steps': 31852, 'loss/train': 1.3229076862335205} +03/05/2022 02:54:02 - INFO - codeparrot_training - Skipping example with length 133 (seq_length=1024) +03/05/2022 02:54:05 - INFO - codeparrot_training - Step 31853: {'lr': 0.000451462171545047, 'samples': 16309248, 'steps': 31853, 'loss/train': 1.7128969430923462} +03/05/2022 02:54:08 - INFO - codeparrot_training - Step 31854: {'lr': 0.00045145902926212785, 'samples': 16309760, 'steps': 31854, 'loss/train': 1.7368899583816528} +03/05/2022 02:54:10 - INFO - codeparrot_training - Skipping example with length 568 (seq_length=1024) +03/05/2022 02:54:13 - INFO - codeparrot_training - Step 31855: {'lr': 0.0004514558868884343, 'samples': 16310272, 'steps': 31855, 'loss/train': 1.469285249710083} +03/05/2022 02:54:16 - INFO - codeparrot_training - Step 31856: {'lr': 0.00045145274442396786, 'samples': 16310784, 'steps': 31856, 'loss/train': 1.583849310874939} +03/05/2022 02:54:19 - INFO - codeparrot_training - Skipping example with length 332 (seq_length=1024) +03/05/2022 02:54:21 - INFO - codeparrot_training - Step 31857: {'lr': 0.00045144960186872996, 'samples': 16311296, 'steps': 31857, 'loss/train': 0.09570786356925964} +03/05/2022 02:54:25 - INFO - codeparrot_training - Step 31858: {'lr': 0.0004514464592227219, 'samples': 16311808, 'steps': 31858, 'loss/train': 1.2518233060836792} +03/05/2022 02:54:27 - INFO - codeparrot_training - Skipping example with length 319 (seq_length=1024) +03/05/2022 02:54:30 - INFO - codeparrot_training - Step 31859: {'lr': 0.0004514433164859453, 'samples': 16312320, 'steps': 31859, 'loss/train': 0.09363142400979996} +03/05/2022 02:54:33 - INFO - codeparrot_training - Step 31860: {'lr': 0.0004514401736584013, 'samples': 16312832, 'steps': 31860, 'loss/train': 2.0139875411987305} +03/05/2022 02:54:35 - INFO - codeparrot_training - Skipping example with length 971 (seq_length=1024) +03/05/2022 02:54:39 - INFO - codeparrot_training - Step 31861: {'lr': 0.0004514370307400916, 'samples': 16313344, 'steps': 31861, 'loss/train': 2.1147162914276123} +03/05/2022 02:54:42 - INFO - codeparrot_training - Step 31862: {'lr': 0.00045143388773101733, 'samples': 16313856, 'steps': 31862, 'loss/train': 1.9519046545028687} +03/05/2022 02:54:44 - INFO - codeparrot_training - Skipping example with length 607 (seq_length=1024) +03/05/2022 02:54:47 - INFO - codeparrot_training - Step 31863: {'lr': 0.0004514307446311802, 'samples': 16314368, 'steps': 31863, 'loss/train': 2.2852942943573} +03/05/2022 02:54:50 - INFO - codeparrot_training - Step 31864: {'lr': 0.0004514276014405814, 'samples': 16314880, 'steps': 31864, 'loss/train': 2.569105863571167} +03/05/2022 02:54:52 - INFO - codeparrot_training - Skipping example with length 911 (seq_length=1024) +03/05/2022 02:54:56 - INFO - codeparrot_training - Step 31865: {'lr': 0.00045142445815922244, 'samples': 16315392, 'steps': 31865, 'loss/train': 1.76587975025177} +03/05/2022 02:54:59 - INFO - codeparrot_training - Step 31866: {'lr': 0.0004514213147871047, 'samples': 16315904, 'steps': 31866, 'loss/train': 0.7369840145111084} +03/05/2022 02:55:00 - INFO - codeparrot_training - Skipping example with length 421 (seq_length=1024) +03/05/2022 02:55:04 - INFO - codeparrot_training - Step 31867: {'lr': 0.00045141817132422974, 'samples': 16316416, 'steps': 31867, 'loss/train': 1.6868627071380615} +03/05/2022 02:55:07 - INFO - codeparrot_training - Step 31868: {'lr': 0.0004514150277705988, 'samples': 16316928, 'steps': 31868, 'loss/train': 1.293117642402649} +03/05/2022 02:55:09 - INFO - codeparrot_training - Skipping example with length 214 (seq_length=1024) +03/05/2022 02:55:12 - INFO - codeparrot_training - Step 31869: {'lr': 0.0004514118841262133, 'samples': 16317440, 'steps': 31869, 'loss/train': 1.6722594499588013} +03/05/2022 02:55:15 - INFO - codeparrot_training - Step 31870: {'lr': 0.0004514087403910748, 'samples': 16317952, 'steps': 31870, 'loss/train': 0.3640415370464325} +03/05/2022 02:55:17 - INFO - codeparrot_training - Skipping example with length 701 (seq_length=1024) +03/05/2022 02:55:21 - INFO - codeparrot_training - Step 31871: {'lr': 0.00045140559656518456, 'samples': 16318464, 'steps': 31871, 'loss/train': 1.4758586883544922} +03/05/2022 02:55:24 - INFO - codeparrot_training - Step 31872: {'lr': 0.0004514024526485441, 'samples': 16318976, 'steps': 31872, 'loss/train': 1.2275573015213013} +03/05/2022 02:55:25 - INFO - codeparrot_training - Skipping example with length 932 (seq_length=1024) +03/05/2022 02:55:29 - INFO - codeparrot_training - Step 31873: {'lr': 0.0004513993086411548, 'samples': 16319488, 'steps': 31873, 'loss/train': 1.9309337139129639} +03/05/2022 02:55:32 - INFO - codeparrot_training - Step 31874: {'lr': 0.00045139616454301806, 'samples': 16320000, 'steps': 31874, 'loss/train': 0.6806849241256714} +03/05/2022 02:55:34 - INFO - codeparrot_training - Skipping example with length 655 (seq_length=1024) +03/05/2022 02:55:38 - INFO - codeparrot_training - Step 31875: {'lr': 0.00045139302035413534, 'samples': 16320512, 'steps': 31875, 'loss/train': 1.2036634683609009} +03/05/2022 02:55:41 - INFO - codeparrot_training - Step 31876: {'lr': 0.00045138987607450803, 'samples': 16321024, 'steps': 31876, 'loss/train': 1.948067307472229} +03/05/2022 02:55:42 - INFO - codeparrot_training - Skipping example with length 892 (seq_length=1024) +03/05/2022 02:55:46 - INFO - codeparrot_training - Step 31877: {'lr': 0.00045138673170413756, 'samples': 16321536, 'steps': 31877, 'loss/train': 2.4430065155029297} +03/05/2022 02:55:49 - INFO - codeparrot_training - Step 31878: {'lr': 0.0004513835872430253, 'samples': 16322048, 'steps': 31878, 'loss/train': 0.8089848160743713} +03/05/2022 02:55:51 - INFO - codeparrot_training - Skipping example with length 765 (seq_length=1024) +03/05/2022 02:55:55 - INFO - codeparrot_training - Step 31879: {'lr': 0.0004513804426911727, 'samples': 16322560, 'steps': 31879, 'loss/train': 1.3781253099441528} +03/05/2022 02:55:58 - INFO - codeparrot_training - Step 31880: {'lr': 0.00045137729804858124, 'samples': 16323072, 'steps': 31880, 'loss/train': 1.7367064952850342} +03/05/2022 02:55:59 - INFO - codeparrot_training - Skipping example with length 490 (seq_length=1024) +03/05/2022 02:56:03 - INFO - codeparrot_training - Step 31881: {'lr': 0.00045137415331525225, 'samples': 16323584, 'steps': 31881, 'loss/train': 1.9250236749649048} +03/05/2022 02:56:06 - INFO - codeparrot_training - Step 31882: {'lr': 0.0004513710084911872, 'samples': 16324096, 'steps': 31882, 'loss/train': 1.8302488327026367} +03/05/2022 02:56:08 - INFO - codeparrot_training - Skipping example with length 319 (seq_length=1024) +03/05/2022 02:56:12 - INFO - codeparrot_training - Step 31883: {'lr': 0.00045136786357638736, 'samples': 16324608, 'steps': 31883, 'loss/train': 2.6210012435913086} +03/05/2022 02:56:15 - INFO - codeparrot_training - Step 31884: {'lr': 0.00045136471857085435, 'samples': 16325120, 'steps': 31884, 'loss/train': 0.5416684746742249} +03/05/2022 02:56:16 - INFO - codeparrot_training - Skipping example with length 79 (seq_length=1024) +03/05/2022 02:56:20 - INFO - codeparrot_training - Step 31885: {'lr': 0.0004513615734745895, 'samples': 16325632, 'steps': 31885, 'loss/train': 1.5893045663833618} +03/05/2022 02:56:23 - INFO - codeparrot_training - Step 31886: {'lr': 0.00045135842828759426, 'samples': 16326144, 'steps': 31886, 'loss/train': 1.335083246231079} +03/05/2022 02:56:26 - INFO - codeparrot_training - Skipping example with length 984 (seq_length=1024) +03/05/2022 02:56:29 - INFO - codeparrot_training - Step 31887: {'lr': 0.00045135528300987006, 'samples': 16326656, 'steps': 31887, 'loss/train': 0.7847394347190857} +03/05/2022 02:56:32 - INFO - codeparrot_training - Step 31888: {'lr': 0.00045135213764141814, 'samples': 16327168, 'steps': 31888, 'loss/train': 1.9699671268463135} +03/05/2022 02:56:35 - INFO - codeparrot_training - Skipping example with length 829 (seq_length=1024) +03/05/2022 02:56:37 - INFO - codeparrot_training - Step 31889: {'lr': 0.00045134899218224014, 'samples': 16327680, 'steps': 31889, 'loss/train': 2.086529016494751} +03/05/2022 02:56:40 - INFO - codeparrot_training - Step 31890: {'lr': 0.0004513458466323374, 'samples': 16328192, 'steps': 31890, 'loss/train': 1.7125701904296875} +03/05/2022 02:56:43 - INFO - codeparrot_training - Skipping example with length 904 (seq_length=1024) +03/05/2022 02:56:46 - INFO - codeparrot_training - Step 31891: {'lr': 0.0004513427009917113, 'samples': 16328704, 'steps': 31891, 'loss/train': 2.791313886642456} +03/05/2022 02:56:49 - INFO - codeparrot_training - Step 31892: {'lr': 0.0004513395552603633, 'samples': 16329216, 'steps': 31892, 'loss/train': 2.0405433177948} +03/05/2022 02:56:51 - INFO - codeparrot_training - Skipping example with length 588 (seq_length=1024) +03/05/2022 02:56:54 - INFO - codeparrot_training - Step 31893: {'lr': 0.0004513364094382948, 'samples': 16329728, 'steps': 31893, 'loss/train': 1.044501543045044} +03/05/2022 02:56:57 - INFO - codeparrot_training - Step 31894: {'lr': 0.00045133326352550724, 'samples': 16330240, 'steps': 31894, 'loss/train': 0.7635440826416016} +03/05/2022 02:57:00 - INFO - codeparrot_training - Skipping example with length 636 (seq_length=1024) +03/05/2022 02:57:03 - INFO - codeparrot_training - Step 31895: {'lr': 0.000451330117522002, 'samples': 16330752, 'steps': 31895, 'loss/train': 2.0208373069763184} +03/05/2022 02:57:06 - INFO - codeparrot_training - Step 31896: {'lr': 0.00045132697142778044, 'samples': 16331264, 'steps': 31896, 'loss/train': 1.7065905332565308} +03/05/2022 02:57:08 - INFO - codeparrot_training - Skipping example with length 279 (seq_length=1024) +03/05/2022 02:57:11 - INFO - codeparrot_training - Step 31897: {'lr': 0.0004513238252428442, 'samples': 16331776, 'steps': 31897, 'loss/train': 1.441049337387085} +03/05/2022 02:57:14 - INFO - codeparrot_training - Step 31898: {'lr': 0.0004513206789671945, 'samples': 16332288, 'steps': 31898, 'loss/train': 0.9508504867553711} +03/05/2022 02:57:17 - INFO - codeparrot_training - Skipping example with length 453 (seq_length=1024) +03/05/2022 02:57:19 - INFO - codeparrot_training - Step 31899: {'lr': 0.00045131753260083276, 'samples': 16332800, 'steps': 31899, 'loss/train': 1.6174496412277222} +03/05/2022 02:57:23 - INFO - codeparrot_training - Step 31900: {'lr': 0.0004513143861437605, 'samples': 16333312, 'steps': 31900, 'loss/train': 2.327481508255005} +03/05/2022 02:57:25 - INFO - codeparrot_training - Skipping example with length 81 (seq_length=1024) +03/05/2022 02:57:28 - INFO - codeparrot_training - Step 31901: {'lr': 0.00045131123959597905, 'samples': 16333824, 'steps': 31901, 'loss/train': 1.7458815574645996} +03/05/2022 02:57:31 - INFO - codeparrot_training - Step 31902: {'lr': 0.0004513080929574899, 'samples': 16334336, 'steps': 31902, 'loss/train': 1.8604228496551514} +03/05/2022 02:57:34 - INFO - codeparrot_training - Skipping example with length 978 (seq_length=1024) +03/05/2022 02:57:36 - INFO - codeparrot_training - Step 31903: {'lr': 0.0004513049462282943, 'samples': 16334848, 'steps': 31903, 'loss/train': 0.8403961062431335} +03/05/2022 02:57:39 - INFO - codeparrot_training - Step 31904: {'lr': 0.00045130179940839395, 'samples': 16335360, 'steps': 31904, 'loss/train': 1.2440351247787476} +03/05/2022 02:57:42 - INFO - codeparrot_training - Skipping example with length 279 (seq_length=1024) +03/05/2022 02:57:45 - INFO - codeparrot_training - Step 31905: {'lr': 0.00045129865249779, 'samples': 16335872, 'steps': 31905, 'loss/train': 1.4054588079452515} +03/05/2022 02:57:48 - INFO - codeparrot_training - Step 31906: {'lr': 0.0004512955054964841, 'samples': 16336384, 'steps': 31906, 'loss/train': 0.8889415860176086} +03/05/2022 02:57:51 - INFO - codeparrot_training - Skipping example with length 229 (seq_length=1024) +03/05/2022 02:57:53 - INFO - codeparrot_training - Step 31907: {'lr': 0.0004512923584044775, 'samples': 16336896, 'steps': 31907, 'loss/train': 1.014445185661316} +03/05/2022 02:57:56 - INFO - codeparrot_training - Step 31908: {'lr': 0.0004512892112217717, 'samples': 16337408, 'steps': 31908, 'loss/train': 1.7877353429794312} +03/05/2022 02:57:59 - INFO - codeparrot_training - Skipping example with length 513 (seq_length=1024) +03/05/2022 02:58:02 - INFO - codeparrot_training - Step 31909: {'lr': 0.00045128606394836805, 'samples': 16337920, 'steps': 31909, 'loss/train': 1.9404898881912231} +03/05/2022 02:58:05 - INFO - codeparrot_training - Step 31910: {'lr': 0.00045128291658426796, 'samples': 16338432, 'steps': 31910, 'loss/train': 0.6479689478874207} +03/05/2022 02:58:08 - INFO - codeparrot_training - Skipping example with length 753 (seq_length=1024) +03/05/2022 02:58:10 - INFO - codeparrot_training - Step 31911: {'lr': 0.00045127976912947296, 'samples': 16338944, 'steps': 31911, 'loss/train': 0.15872105956077576} +03/05/2022 02:58:14 - INFO - codeparrot_training - Step 31912: {'lr': 0.00045127662158398434, 'samples': 16339456, 'steps': 31912, 'loss/train': 2.273942470550537} +03/05/2022 02:58:16 - INFO - codeparrot_training - Skipping example with length 697 (seq_length=1024) +03/05/2022 02:58:19 - INFO - codeparrot_training - Step 31913: {'lr': 0.00045127347394780367, 'samples': 16339968, 'steps': 31913, 'loss/train': 2.3919310569763184} +03/05/2022 02:58:22 - INFO - codeparrot_training - Step 31914: {'lr': 0.00045127032622093225, 'samples': 16340480, 'steps': 31914, 'loss/train': 1.34188973903656} +03/05/2022 02:58:25 - INFO - codeparrot_training - Skipping example with length 273 (seq_length=1024) +03/05/2022 02:58:27 - INFO - codeparrot_training - Step 31915: {'lr': 0.0004512671784033715, 'samples': 16340992, 'steps': 31915, 'loss/train': 1.8171836137771606} +03/05/2022 02:58:30 - INFO - codeparrot_training - Step 31916: {'lr': 0.00045126403049512286, 'samples': 16341504, 'steps': 31916, 'loss/train': 1.0759696960449219} +03/05/2022 02:58:33 - INFO - codeparrot_training - Skipping example with length 687 (seq_length=1024) +03/05/2022 02:58:36 - INFO - codeparrot_training - Step 31917: {'lr': 0.0004512608824961878, 'samples': 16342016, 'steps': 31917, 'loss/train': 1.2252100706100464} +03/05/2022 02:58:39 - INFO - codeparrot_training - Step 31918: {'lr': 0.00045125773440656756, 'samples': 16342528, 'steps': 31918, 'loss/train': 1.8207192420959473} +03/05/2022 02:58:41 - INFO - codeparrot_training - Skipping example with length 893 (seq_length=1024) +03/05/2022 02:58:44 - INFO - codeparrot_training - Step 31919: {'lr': 0.0004512545862262638, 'samples': 16343040, 'steps': 31919, 'loss/train': 1.904942512512207} +03/05/2022 02:58:47 - INFO - codeparrot_training - Step 31920: {'lr': 0.0004512514379552779, 'samples': 16343552, 'steps': 31920, 'loss/train': 1.6376686096191406} +03/05/2022 02:58:50 - INFO - codeparrot_training - Skipping example with length 516 (seq_length=1024) +03/05/2022 02:58:52 - INFO - codeparrot_training - Step 31921: {'lr': 0.0004512482895936111, 'samples': 16344064, 'steps': 31921, 'loss/train': 1.5099483728408813} +03/05/2022 02:58:56 - INFO - codeparrot_training - Step 31922: {'lr': 0.00045124514114126493, 'samples': 16344576, 'steps': 31922, 'loss/train': 2.0737662315368652} +03/05/2022 02:58:58 - INFO - codeparrot_training - Skipping example with length 104 (seq_length=1024) +03/05/2022 02:59:01 - INFO - codeparrot_training - Step 31923: {'lr': 0.0004512419925982408, 'samples': 16345088, 'steps': 31923, 'loss/train': 1.7070953845977783} +03/05/2022 02:59:04 - INFO - codeparrot_training - Step 31924: {'lr': 0.0004512388439645402, 'samples': 16345600, 'steps': 31924, 'loss/train': 2.2826290130615234} +03/05/2022 02:59:06 - INFO - codeparrot_training - Skipping example with length 838 (seq_length=1024) +03/05/2022 02:59:09 - INFO - codeparrot_training - Step 31925: {'lr': 0.00045123569524016446, 'samples': 16346112, 'steps': 31925, 'loss/train': 1.769502878189087} +03/05/2022 02:59:12 - INFO - codeparrot_training - Step 31926: {'lr': 0.00045123254642511504, 'samples': 16346624, 'steps': 31926, 'loss/train': 1.940051555633545} +03/05/2022 02:59:15 - INFO - codeparrot_training - Skipping example with length 708 (seq_length=1024) +03/05/2022 02:59:18 - INFO - codeparrot_training - Step 31927: {'lr': 0.0004512293975193933, 'samples': 16347136, 'steps': 31927, 'loss/train': 0.769180417060852} +03/05/2022 02:59:21 - INFO - codeparrot_training - Step 31928: {'lr': 0.0004512262485230007, 'samples': 16347648, 'steps': 31928, 'loss/train': 2.6771113872528076} +03/05/2022 02:59:23 - INFO - codeparrot_training - Skipping example with length 594 (seq_length=1024) +03/05/2022 02:59:26 - INFO - codeparrot_training - Step 31929: {'lr': 0.00045122309943593865, 'samples': 16348160, 'steps': 31929, 'loss/train': 2.009106159210205} +03/05/2022 02:59:29 - INFO - codeparrot_training - Step 31930: {'lr': 0.0004512199502582086, 'samples': 16348672, 'steps': 31930, 'loss/train': 0.8217947483062744} +03/05/2022 02:59:31 - INFO - codeparrot_training - Skipping example with length 849 (seq_length=1024) +03/05/2022 02:59:34 - INFO - codeparrot_training - Step 31931: {'lr': 0.00045121680098981186, 'samples': 16349184, 'steps': 31931, 'loss/train': 0.3093494176864624} +03/05/2022 02:59:38 - INFO - codeparrot_training - Step 31932: {'lr': 0.00045121365163075007, 'samples': 16349696, 'steps': 31932, 'loss/train': 0.16149555146694183} +03/05/2022 02:59:40 - INFO - codeparrot_training - Skipping example with length 933 (seq_length=1024) +03/05/2022 02:59:43 - INFO - codeparrot_training - Step 31933: {'lr': 0.0004512105021810244, 'samples': 16350208, 'steps': 31933, 'loss/train': 0.8143050670623779} +03/05/2022 02:59:46 - INFO - codeparrot_training - Step 31934: {'lr': 0.0004512073526406365, 'samples': 16350720, 'steps': 31934, 'loss/train': 1.5129972696304321} +03/05/2022 02:59:48 - INFO - codeparrot_training - Skipping example with length 219 (seq_length=1024) +03/05/2022 02:59:51 - INFO - codeparrot_training - Step 31935: {'lr': 0.0004512042030095876, 'samples': 16351232, 'steps': 31935, 'loss/train': 1.7157049179077148} +03/05/2022 02:59:55 - INFO - codeparrot_training - Step 31936: {'lr': 0.0004512010532878792, 'samples': 16351744, 'steps': 31936, 'loss/train': 1.8498201370239258} +03/05/2022 02:59:56 - INFO - codeparrot_training - Skipping example with length 307 (seq_length=1024) +03/05/2022 03:00:00 - INFO - codeparrot_training - Step 31937: {'lr': 0.0004511979034755127, 'samples': 16352256, 'steps': 31937, 'loss/train': 1.2360297441482544} +03/05/2022 03:00:03 - INFO - codeparrot_training - Step 31938: {'lr': 0.0004511947535724895, 'samples': 16352768, 'steps': 31938, 'loss/train': 1.9999516010284424} +03/05/2022 03:00:05 - INFO - codeparrot_training - Skipping example with length 916 (seq_length=1024) +03/05/2022 03:00:08 - INFO - codeparrot_training - Step 31939: {'lr': 0.00045119160357881105, 'samples': 16353280, 'steps': 31939, 'loss/train': 1.838710904121399} +03/05/2022 03:00:11 - INFO - codeparrot_training - Step 31940: {'lr': 0.0004511884534944789, 'samples': 16353792, 'steps': 31940, 'loss/train': 1.921875} +03/05/2022 03:00:13 - INFO - codeparrot_training - Skipping example with length 514 (seq_length=1024) +03/05/2022 03:00:17 - INFO - codeparrot_training - Step 31941: {'lr': 0.0004511853033194942, 'samples': 16354304, 'steps': 31941, 'loss/train': 1.2046767473220825} +03/05/2022 03:00:20 - INFO - codeparrot_training - Step 31942: {'lr': 0.00045118215305385855, 'samples': 16354816, 'steps': 31942, 'loss/train': 2.4072768688201904} +03/05/2022 03:00:21 - INFO - codeparrot_training - Skipping example with length 939 (seq_length=1024) +03/05/2022 03:00:25 - INFO - codeparrot_training - Step 31943: {'lr': 0.0004511790026975733, 'samples': 16355328, 'steps': 31943, 'loss/train': 1.9124397039413452} +03/05/2022 03:00:28 - INFO - codeparrot_training - Step 31944: {'lr': 0.00045117585225063996, 'samples': 16355840, 'steps': 31944, 'loss/train': 1.20439612865448} +03/05/2022 03:00:30 - INFO - codeparrot_training - Skipping example with length 606 (seq_length=1024) +03/05/2022 03:00:34 - INFO - codeparrot_training - Step 31945: {'lr': 0.0004511727017130598, 'samples': 16356352, 'steps': 31945, 'loss/train': 2.1158857345581055} +03/05/2022 03:00:37 - INFO - codeparrot_training - Step 31946: {'lr': 0.00045116955108483436, 'samples': 16356864, 'steps': 31946, 'loss/train': 1.375718355178833} +03/05/2022 03:00:38 - INFO - codeparrot_training - Skipping example with length 331 (seq_length=1024) +03/05/2022 03:00:42 - INFO - codeparrot_training - Step 31947: {'lr': 0.00045116640036596507, 'samples': 16357376, 'steps': 31947, 'loss/train': 1.270947813987732} +03/05/2022 03:00:45 - INFO - codeparrot_training - Step 31948: {'lr': 0.0004511632495564533, 'samples': 16357888, 'steps': 31948, 'loss/train': 1.7259471416473389} +03/05/2022 03:00:47 - INFO - codeparrot_training - Skipping example with length 738 (seq_length=1024) +03/05/2022 03:00:51 - INFO - codeparrot_training - Step 31949: {'lr': 0.00045116009865630034, 'samples': 16358400, 'steps': 31949, 'loss/train': 1.0533421039581299} +03/05/2022 03:00:54 - INFO - codeparrot_training - Step 31950: {'lr': 0.0004511569476655079, 'samples': 16358912, 'steps': 31950, 'loss/train': 1.9342403411865234} +03/05/2022 03:00:56 - INFO - codeparrot_training - Skipping example with length 209 (seq_length=1024) +03/05/2022 03:00:59 - INFO - codeparrot_training - Step 31951: {'lr': 0.00045115379658407717, 'samples': 16359424, 'steps': 31951, 'loss/train': 1.0411666631698608} +03/05/2022 03:01:02 - INFO - codeparrot_training - Step 31952: {'lr': 0.0004511506454120097, 'samples': 16359936, 'steps': 31952, 'loss/train': 2.016972064971924} +03/05/2022 03:01:04 - INFO - codeparrot_training - Skipping example with length 258 (seq_length=1024) +03/05/2022 03:01:08 - INFO - codeparrot_training - Step 31953: {'lr': 0.00045114749414930676, 'samples': 16360448, 'steps': 31953, 'loss/train': 1.6155586242675781} +03/05/2022 03:01:11 - INFO - codeparrot_training - Step 31954: {'lr': 0.00045114434279596994, 'samples': 16360960, 'steps': 31954, 'loss/train': 2.150050640106201} +03/05/2022 03:01:14 - INFO - codeparrot_training - Step 31955: {'lr': 0.0004511411913520006, 'samples': 16361472, 'steps': 31955, 'loss/train': 1.2652933597564697} +03/05/2022 03:01:15 - INFO - codeparrot_training - Skipping example with length 148 (seq_length=1024) +03/05/2022 03:01:20 - INFO - codeparrot_training - Step 31956: {'lr': 0.0004511380398174001, 'samples': 16361984, 'steps': 31956, 'loss/train': 2.127192735671997} +03/05/2022 03:01:23 - INFO - codeparrot_training - Step 31957: {'lr': 0.00045113488819216983, 'samples': 16362496, 'steps': 31957, 'loss/train': 1.540175199508667} +03/05/2022 03:01:24 - INFO - codeparrot_training - Skipping example with length 800 (seq_length=1024) +03/05/2022 03:01:28 - INFO - codeparrot_training - Step 31958: {'lr': 0.00045113173647631143, 'samples': 16363008, 'steps': 31958, 'loss/train': 1.9785131216049194} +03/05/2022 03:01:31 - INFO - codeparrot_training - Step 31959: {'lr': 0.0004511285846698261, 'samples': 16363520, 'steps': 31959, 'loss/train': 3.0094780921936035} +03/05/2022 03:01:32 - INFO - codeparrot_training - Skipping example with length 256 (seq_length=1024) +03/05/2022 03:01:37 - INFO - codeparrot_training - Step 31960: {'lr': 0.0004511254327727153, 'samples': 16364032, 'steps': 31960, 'loss/train': 2.643731117248535} +03/05/2022 03:01:40 - INFO - codeparrot_training - Step 31961: {'lr': 0.00045112228078498053, 'samples': 16364544, 'steps': 31961, 'loss/train': 1.668400764465332} +03/05/2022 03:01:41 - INFO - codeparrot_training - Skipping example with length 278 (seq_length=1024) +03/05/2022 03:01:45 - INFO - codeparrot_training - Step 31962: {'lr': 0.0004511191287066232, 'samples': 16365056, 'steps': 31962, 'loss/train': 1.620114803314209} +03/05/2022 03:01:48 - INFO - codeparrot_training - Step 31963: {'lr': 0.00045111597653764456, 'samples': 16365568, 'steps': 31963, 'loss/train': 2.171884298324585} +03/05/2022 03:01:49 - INFO - codeparrot_training - Skipping example with length 317 (seq_length=1024) +03/05/2022 03:01:54 - INFO - codeparrot_training - Step 31964: {'lr': 0.00045111282427804636, 'samples': 16366080, 'steps': 31964, 'loss/train': 2.3800129890441895} +03/05/2022 03:01:57 - INFO - codeparrot_training - Step 31965: {'lr': 0.0004511096719278297, 'samples': 16366592, 'steps': 31965, 'loss/train': 1.117672324180603} +03/05/2022 03:01:58 - INFO - codeparrot_training - Skipping example with length 746 (seq_length=1024) +03/05/2022 03:02:02 - INFO - codeparrot_training - Step 31966: {'lr': 0.0004511065194869961, 'samples': 16367104, 'steps': 31966, 'loss/train': 1.6424318552017212} +03/05/2022 03:02:05 - INFO - codeparrot_training - Step 31967: {'lr': 0.00045110336695554707, 'samples': 16367616, 'steps': 31967, 'loss/train': 2.04544997215271} +03/05/2022 03:02:06 - INFO - codeparrot_training - Skipping example with length 474 (seq_length=1024) +03/05/2022 03:02:11 - INFO - codeparrot_training - Step 31968: {'lr': 0.0004511002143334839, 'samples': 16368128, 'steps': 31968, 'loss/train': 1.5337709188461304} +03/05/2022 03:02:14 - INFO - codeparrot_training - Step 31969: {'lr': 0.0004510970616208081, 'samples': 16368640, 'steps': 31969, 'loss/train': 1.6760246753692627} +03/05/2022 03:02:14 - INFO - codeparrot_training - Skipping example with length 283 (seq_length=1024) +03/05/2022 03:02:19 - INFO - codeparrot_training - Step 31970: {'lr': 0.0004510939088175211, 'samples': 16369152, 'steps': 31970, 'loss/train': 1.6577661037445068} +03/05/2022 03:02:22 - INFO - codeparrot_training - Step 31971: {'lr': 0.00045109075592362433, 'samples': 16369664, 'steps': 31971, 'loss/train': 1.203108549118042} +03/05/2022 03:02:22 - INFO - codeparrot_training - Skipping example with length 463 (seq_length=1024) +03/05/2022 03:02:27 - INFO - codeparrot_training - Step 31972: {'lr': 0.0004510876029391191, 'samples': 16370176, 'steps': 31972, 'loss/train': 1.574049472808838} +03/05/2022 03:02:31 - INFO - codeparrot_training - Step 31973: {'lr': 0.00045108444986400687, 'samples': 16370688, 'steps': 31973, 'loss/train': 2.646047592163086} +03/05/2022 03:02:31 - INFO - codeparrot_training - Skipping example with length 1018 (seq_length=1024) +03/05/2022 03:02:36 - INFO - codeparrot_training - Step 31974: {'lr': 0.0004510812966982892, 'samples': 16371200, 'steps': 31974, 'loss/train': 0.47657230496406555} +03/05/2022 03:02:39 - INFO - codeparrot_training - Step 31975: {'lr': 0.0004510781434419673, 'samples': 16371712, 'steps': 31975, 'loss/train': 0.2866252362728119} +03/05/2022 03:02:40 - INFO - codeparrot_training - Skipping example with length 579 (seq_length=1024) +03/05/2022 03:02:45 - INFO - codeparrot_training - Step 31976: {'lr': 0.0004510749900950427, 'samples': 16372224, 'steps': 31976, 'loss/train': 1.8011785745620728} +03/05/2022 03:02:48 - INFO - codeparrot_training - Step 31977: {'lr': 0.00045107183665751686, 'samples': 16372736, 'steps': 31977, 'loss/train': 1.935043454170227} +03/05/2022 03:02:48 - INFO - codeparrot_training - Skipping example with length 116 (seq_length=1024) +03/05/2022 03:02:53 - INFO - codeparrot_training - Step 31978: {'lr': 0.00045106868312939116, 'samples': 16373248, 'steps': 31978, 'loss/train': 1.5222426652908325} +03/05/2022 03:02:56 - INFO - codeparrot_training - Step 31979: {'lr': 0.0004510655295106669, 'samples': 16373760, 'steps': 31979, 'loss/train': 2.7634658813476562} +03/05/2022 03:02:56 - INFO - codeparrot_training - Skipping example with length 176 (seq_length=1024) +03/05/2022 03:03:02 - INFO - codeparrot_training - Step 31980: {'lr': 0.00045106237580134573, 'samples': 16374272, 'steps': 31980, 'loss/train': 3.5076136589050293} +03/05/2022 03:03:05 - INFO - codeparrot_training - Step 31981: {'lr': 0.000451059222001429, 'samples': 16374784, 'steps': 31981, 'loss/train': 0.8543733954429626} +03/05/2022 03:03:05 - INFO - codeparrot_training - Skipping example with length 582 (seq_length=1024) +03/05/2022 03:03:10 - INFO - codeparrot_training - Step 31982: {'lr': 0.0004510560681109179, 'samples': 16375296, 'steps': 31982, 'loss/train': 2.0498600006103516} +03/05/2022 03:03:13 - INFO - codeparrot_training - Step 31983: {'lr': 0.0004510529141298142, 'samples': 16375808, 'steps': 31983, 'loss/train': 1.1351772546768188} +03/05/2022 03:03:13 - INFO - codeparrot_training - Skipping example with length 65 (seq_length=1024) +03/05/2022 03:03:18 - INFO - codeparrot_training - Step 31984: {'lr': 0.00045104976005811917, 'samples': 16376320, 'steps': 31984, 'loss/train': 2.2497880458831787} +03/05/2022 03:03:21 - INFO - codeparrot_training - Step 31985: {'lr': 0.00045104660589583413, 'samples': 16376832, 'steps': 31985, 'loss/train': 1.893570899963379} +03/05/2022 03:03:22 - INFO - codeparrot_training - Skipping example with length 193 (seq_length=1024) +03/05/2022 03:03:27 - INFO - codeparrot_training - Step 31986: {'lr': 0.0004510434516429606, 'samples': 16377344, 'steps': 31986, 'loss/train': 1.8835066556930542} +03/05/2022 03:03:30 - INFO - codeparrot_training - Step 31987: {'lr': 0.0004510402972995, 'samples': 16377856, 'steps': 31987, 'loss/train': 2.057553768157959} +03/05/2022 03:03:30 - INFO - codeparrot_training - Skipping example with length 121 (seq_length=1024) +03/05/2022 03:03:35 - INFO - codeparrot_training - Step 31988: {'lr': 0.0004510371428654538, 'samples': 16378368, 'steps': 31988, 'loss/train': 1.7688745260238647} +03/05/2022 03:03:38 - INFO - codeparrot_training - Skipping example with length 247 (seq_length=1024) +03/05/2022 03:03:40 - INFO - codeparrot_training - Step 31989: {'lr': 0.00045103398834082334, 'samples': 16378880, 'steps': 31989, 'loss/train': 2.055570602416992} +03/05/2022 03:03:44 - INFO - codeparrot_training - Step 31990: {'lr': 0.00045103083372561003, 'samples': 16379392, 'steps': 31990, 'loss/train': 2.4414494037628174} +03/05/2022 03:03:46 - INFO - codeparrot_training - Skipping example with length 456 (seq_length=1024) +03/05/2022 03:03:49 - INFO - codeparrot_training - Step 31991: {'lr': 0.0004510276790198153, 'samples': 16379904, 'steps': 31991, 'loss/train': 1.2987937927246094} +03/05/2022 03:03:52 - INFO - codeparrot_training - Step 31992: {'lr': 0.00045102452422344065, 'samples': 16380416, 'steps': 31992, 'loss/train': 1.8898197412490845} +03/05/2022 03:03:55 - INFO - codeparrot_training - Skipping example with length 469 (seq_length=1024) +03/05/2022 03:03:57 - INFO - codeparrot_training - Step 31993: {'lr': 0.0004510213693364875, 'samples': 16380928, 'steps': 31993, 'loss/train': 1.2637690305709839} +03/05/2022 03:04:00 - INFO - codeparrot_training - Step 31994: {'lr': 0.0004510182143589572, 'samples': 16381440, 'steps': 31994, 'loss/train': 1.151983618736267} +03/05/2022 03:04:03 - INFO - codeparrot_training - Skipping example with length 831 (seq_length=1024) +03/05/2022 03:04:06 - INFO - codeparrot_training - Step 31995: {'lr': 0.0004510150592908511, 'samples': 16381952, 'steps': 31995, 'loss/train': 1.811228632926941} +03/05/2022 03:04:09 - INFO - codeparrot_training - Step 31996: {'lr': 0.00045101190413217085, 'samples': 16382464, 'steps': 31996, 'loss/train': 1.4244699478149414} +03/05/2022 03:04:11 - INFO - codeparrot_training - Skipping example with length 206 (seq_length=1024) +03/05/2022 03:04:14 - INFO - codeparrot_training - Step 31997: {'lr': 0.0004510087488829177, 'samples': 16382976, 'steps': 31997, 'loss/train': 1.6233900785446167} +03/05/2022 03:04:17 - INFO - codeparrot_training - Step 31998: {'lr': 0.000451005593543093, 'samples': 16383488, 'steps': 31998, 'loss/train': 2.252574920654297} +03/05/2022 03:04:20 - INFO - codeparrot_training - Skipping example with length 402 (seq_length=1024) +03/05/2022 03:04:23 - INFO - codeparrot_training - Step 31999: {'lr': 0.00045100243811269834, 'samples': 16384000, 'steps': 31999, 'loss/train': 2.0426595211029053} +03/05/2022 03:04:26 - INFO - codeparrot_training - Step 32000: {'lr': 0.00045099928259173516, 'samples': 16384512, 'steps': 32000, 'loss/train': 0.8855448961257935} +03/05/2022 03:04:29 - INFO - codeparrot_training - Skipping example with length 138 (seq_length=1024) +03/05/2022 03:04:31 - INFO - codeparrot_training - Step 32001: {'lr': 0.0004509961269802048, 'samples': 16385024, 'steps': 32001, 'loss/train': 1.4176315069198608} +03/05/2022 03:04:34 - INFO - codeparrot_training - Step 32002: {'lr': 0.00045099297127810855, 'samples': 16385536, 'steps': 32002, 'loss/train': 6.000682353973389} +03/05/2022 03:04:37 - INFO - codeparrot_training - Skipping example with length 202 (seq_length=1024) +03/05/2022 03:04:39 - INFO - codeparrot_training - Step 32003: {'lr': 0.0004509898154854481, 'samples': 16386048, 'steps': 32003, 'loss/train': 1.8179643154144287} +03/05/2022 03:04:43 - INFO - codeparrot_training - Step 32004: {'lr': 0.00045098665960222474, 'samples': 16386560, 'steps': 32004, 'loss/train': 2.8642096519470215} +03/05/2022 03:04:45 - INFO - codeparrot_training - Skipping example with length 366 (seq_length=1024) +03/05/2022 03:04:48 - INFO - codeparrot_training - Step 32005: {'lr': 0.00045098350362843975, 'samples': 16387072, 'steps': 32005, 'loss/train': 1.7400468587875366} +03/05/2022 03:04:51 - INFO - codeparrot_training - Step 32006: {'lr': 0.0004509803475640948, 'samples': 16387584, 'steps': 32006, 'loss/train': 1.5226988792419434} +03/05/2022 03:04:54 - INFO - codeparrot_training - Skipping example with length 259 (seq_length=1024) +03/05/2022 03:04:56 - INFO - codeparrot_training - Step 32007: {'lr': 0.00045097719140919126, 'samples': 16388096, 'steps': 32007, 'loss/train': 1.3183097839355469} +03/05/2022 03:04:59 - INFO - codeparrot_training - Step 32008: {'lr': 0.0004509740351637304, 'samples': 16388608, 'steps': 32008, 'loss/train': 0.863994836807251} +03/05/2022 03:05:02 - INFO - codeparrot_training - Skipping example with length 337 (seq_length=1024) +03/05/2022 03:05:05 - INFO - codeparrot_training - Step 32009: {'lr': 0.0004509708788277138, 'samples': 16389120, 'steps': 32009, 'loss/train': 1.5725955963134766} +03/05/2022 03:05:08 - INFO - codeparrot_training - Step 32010: {'lr': 0.0004509677224011428, 'samples': 16389632, 'steps': 32010, 'loss/train': 0.5772419571876526} +03/05/2022 03:05:10 - INFO - codeparrot_training - Skipping example with length 69 (seq_length=1024) +03/05/2022 03:05:13 - INFO - codeparrot_training - Step 32011: {'lr': 0.00045096456588401883, 'samples': 16390144, 'steps': 32011, 'loss/train': 1.0410505533218384} +03/05/2022 03:05:16 - INFO - codeparrot_training - Step 32012: {'lr': 0.0004509614092763434, 'samples': 16390656, 'steps': 32012, 'loss/train': 2.3063197135925293} +03/05/2022 03:05:19 - INFO - codeparrot_training - Skipping example with length 464 (seq_length=1024) +03/05/2022 03:05:22 - INFO - codeparrot_training - Step 32013: {'lr': 0.00045095825257811776, 'samples': 16391168, 'steps': 32013, 'loss/train': 1.93497633934021} +03/05/2022 03:05:25 - INFO - codeparrot_training - Step 32014: {'lr': 0.00045095509578934353, 'samples': 16391680, 'steps': 32014, 'loss/train': 1.7996841669082642} +03/05/2022 03:05:27 - INFO - codeparrot_training - Skipping example with length 277 (seq_length=1024) +03/05/2022 03:05:30 - INFO - codeparrot_training - Step 32015: {'lr': 0.00045095193891002194, 'samples': 16392192, 'steps': 32015, 'loss/train': 1.7910690307617188} +03/05/2022 03:05:33 - INFO - codeparrot_training - Step 32016: {'lr': 0.00045094878194015456, 'samples': 16392704, 'steps': 32016, 'loss/train': 1.9506921768188477} +03/05/2022 03:05:36 - INFO - codeparrot_training - Skipping example with length 652 (seq_length=1024) +03/05/2022 03:05:39 - INFO - codeparrot_training - Step 32017: {'lr': 0.0004509456248797428, 'samples': 16393216, 'steps': 32017, 'loss/train': 2.1983065605163574} +03/05/2022 03:05:42 - INFO - codeparrot_training - Step 32018: {'lr': 0.000450942467728788, 'samples': 16393728, 'steps': 32018, 'loss/train': 1.274975061416626} +03/05/2022 03:05:45 - INFO - codeparrot_training - Step 32019: {'lr': 0.00045093931048729156, 'samples': 16394240, 'steps': 32019, 'loss/train': 1.5938899517059326} +03/05/2022 03:05:45 - INFO - codeparrot_training - Skipping example with length 594 (seq_length=1024) +03/05/2022 03:05:50 - INFO - codeparrot_training - Step 32020: {'lr': 0.00045093615315525506, 'samples': 16394752, 'steps': 32020, 'loss/train': 0.08673045784235} +03/05/2022 03:05:54 - INFO - codeparrot_training - Step 32021: {'lr': 0.00045093299573267977, 'samples': 16395264, 'steps': 32021, 'loss/train': 1.2798175811767578} +03/05/2022 03:05:54 - INFO - codeparrot_training - Skipping example with length 573 (seq_length=1024) +03/05/2022 03:05:59 - INFO - codeparrot_training - Step 32022: {'lr': 0.00045092983821956725, 'samples': 16395776, 'steps': 32022, 'loss/train': 2.2171990871429443} +03/05/2022 03:06:02 - INFO - codeparrot_training - Step 32023: {'lr': 0.00045092668061591875, 'samples': 16396288, 'steps': 32023, 'loss/train': 1.9794648885726929} +03/05/2022 03:06:02 - INFO - codeparrot_training - Skipping example with length 513 (seq_length=1024) +03/05/2022 03:06:07 - INFO - codeparrot_training - Step 32024: {'lr': 0.00045092352292173585, 'samples': 16396800, 'steps': 32024, 'loss/train': 1.6061415672302246} +03/05/2022 03:06:10 - INFO - codeparrot_training - Step 32025: {'lr': 0.00045092036513701985, 'samples': 16397312, 'steps': 32025, 'loss/train': 1.6197881698608398} +03/05/2022 03:06:11 - INFO - codeparrot_training - Skipping example with length 327 (seq_length=1024) +03/05/2022 03:06:16 - INFO - codeparrot_training - Step 32026: {'lr': 0.0004509172072617723, 'samples': 16397824, 'steps': 32026, 'loss/train': 1.9297541379928589} +03/05/2022 03:06:19 - INFO - codeparrot_training - Step 32027: {'lr': 0.00045091404929599455, 'samples': 16398336, 'steps': 32027, 'loss/train': 1.1923638582229614} +03/05/2022 03:06:19 - INFO - codeparrot_training - Skipping example with length 786 (seq_length=1024) +03/05/2022 03:06:24 - INFO - codeparrot_training - Step 32028: {'lr': 0.00045091089123968796, 'samples': 16398848, 'steps': 32028, 'loss/train': 2.594214916229248} +03/05/2022 03:06:27 - INFO - codeparrot_training - Step 32029: {'lr': 0.0004509077330928541, 'samples': 16399360, 'steps': 32029, 'loss/train': 1.6268155574798584} +03/05/2022 03:06:27 - INFO - codeparrot_training - Skipping example with length 620 (seq_length=1024) +03/05/2022 03:06:33 - INFO - codeparrot_training - Step 32030: {'lr': 0.0004509045748554943, 'samples': 16399872, 'steps': 32030, 'loss/train': 2.0086452960968018} +03/05/2022 03:06:36 - INFO - codeparrot_training - Step 32031: {'lr': 0.00045090141652760995, 'samples': 16400384, 'steps': 32031, 'loss/train': 1.6971648931503296} +03/05/2022 03:06:36 - INFO - codeparrot_training - Skipping example with length 974 (seq_length=1024) +03/05/2022 03:06:41 - INFO - codeparrot_training - Step 32032: {'lr': 0.0004508982581092026, 'samples': 16400896, 'steps': 32032, 'loss/train': 0.9273979663848877} +03/05/2022 03:06:44 - INFO - codeparrot_training - Step 32033: {'lr': 0.00045089509960027354, 'samples': 16401408, 'steps': 32033, 'loss/train': 2.099200487136841} +03/05/2022 03:06:45 - INFO - codeparrot_training - Skipping example with length 918 (seq_length=1024) +03/05/2022 03:06:50 - INFO - codeparrot_training - Step 32034: {'lr': 0.00045089194100082433, 'samples': 16401920, 'steps': 32034, 'loss/train': 2.1232099533081055} +03/05/2022 03:06:53 - INFO - codeparrot_training - Step 32035: {'lr': 0.00045088878231085616, 'samples': 16402432, 'steps': 32035, 'loss/train': 2.4728918075561523} +03/05/2022 03:06:53 - INFO - codeparrot_training - Skipping example with length 257 (seq_length=1024) +03/05/2022 03:06:58 - INFO - codeparrot_training - Step 32036: {'lr': 0.00045088562353037077, 'samples': 16402944, 'steps': 32036, 'loss/train': 0.8891081809997559} +03/05/2022 03:07:01 - INFO - codeparrot_training - Step 32037: {'lr': 0.00045088246465936936, 'samples': 16403456, 'steps': 32037, 'loss/train': 1.6939873695373535} +03/05/2022 03:07:02 - INFO - codeparrot_training - Skipping example with length 240 (seq_length=1024) +03/05/2022 03:07:06 - INFO - codeparrot_training - Step 32038: {'lr': 0.0004508793056978534, 'samples': 16403968, 'steps': 32038, 'loss/train': 1.4837018251419067} +03/05/2022 03:07:10 - INFO - codeparrot_training - Step 32039: {'lr': 0.00045087614664582424, 'samples': 16404480, 'steps': 32039, 'loss/train': 1.4713070392608643} +03/05/2022 03:07:10 - INFO - codeparrot_training - Skipping example with length 310 (seq_length=1024) +03/05/2022 03:07:15 - INFO - codeparrot_training - Step 32040: {'lr': 0.0004508729875032834, 'samples': 16404992, 'steps': 32040, 'loss/train': 1.4132156372070312} +03/05/2022 03:07:18 - INFO - codeparrot_training - Step 32041: {'lr': 0.0004508698282702324, 'samples': 16405504, 'steps': 32041, 'loss/train': 2.021090269088745} +03/05/2022 03:07:19 - INFO - codeparrot_training - Skipping example with length 936 (seq_length=1024) +03/05/2022 03:07:23 - INFO - codeparrot_training - Step 32042: {'lr': 0.0004508666689466725, 'samples': 16406016, 'steps': 32042, 'loss/train': 1.9056329727172852} +03/05/2022 03:07:27 - INFO - codeparrot_training - Step 32043: {'lr': 0.00045086350953260526, 'samples': 16406528, 'steps': 32043, 'loss/train': 1.1744017601013184} +03/05/2022 03:07:27 - INFO - codeparrot_training - Skipping example with length 43 (seq_length=1024) +03/05/2022 03:07:32 - INFO - codeparrot_training - Step 32044: {'lr': 0.0004508603500280319, 'samples': 16407040, 'steps': 32044, 'loss/train': 1.8305118083953857} +03/05/2022 03:07:35 - INFO - codeparrot_training - Step 32045: {'lr': 0.00045085719043295406, 'samples': 16407552, 'steps': 32045, 'loss/train': 0.06139529123902321} +03/05/2022 03:07:35 - INFO - codeparrot_training - Skipping example with length 995 (seq_length=1024) +03/05/2022 03:07:40 - INFO - codeparrot_training - Step 32046: {'lr': 0.00045085403074737295, 'samples': 16408064, 'steps': 32046, 'loss/train': 2.9418563842773438} +03/05/2022 03:07:43 - INFO - codeparrot_training - Step 32047: {'lr': 0.0004508508709712902, 'samples': 16408576, 'steps': 32047, 'loss/train': 1.8753360509872437} +03/05/2022 03:07:43 - INFO - codeparrot_training - Skipping example with length 424 (seq_length=1024) +03/05/2022 03:07:49 - INFO - codeparrot_training - Step 32048: {'lr': 0.00045084771110470717, 'samples': 16409088, 'steps': 32048, 'loss/train': 1.6443184614181519} +03/05/2022 03:07:52 - INFO - codeparrot_training - Step 32049: {'lr': 0.00045084455114762525, 'samples': 16409600, 'steps': 32049, 'loss/train': 0.7787325978279114} +03/05/2022 03:07:52 - INFO - codeparrot_training - Skipping example with length 965 (seq_length=1024) +03/05/2022 03:07:57 - INFO - codeparrot_training - Step 32050: {'lr': 0.00045084139110004585, 'samples': 16410112, 'steps': 32050, 'loss/train': 1.8579407930374146} +03/05/2022 03:08:00 - INFO - codeparrot_training - Step 32051: {'lr': 0.0004508382309619704, 'samples': 16410624, 'steps': 32051, 'loss/train': 1.9255794286727905} +03/05/2022 03:08:01 - INFO - codeparrot_training - Skipping example with length 694 (seq_length=1024) +03/05/2022 03:08:06 - INFO - codeparrot_training - Step 32052: {'lr': 0.0004508350707334004, 'samples': 16411136, 'steps': 32052, 'loss/train': 1.5080236196517944} +03/05/2022 03:08:09 - INFO - codeparrot_training - Step 32053: {'lr': 0.00045083191041433713, 'samples': 16411648, 'steps': 32053, 'loss/train': 2.131565809249878} +03/05/2022 03:08:09 - INFO - codeparrot_training - Skipping example with length 225 (seq_length=1024) +03/05/2022 03:08:14 - INFO - codeparrot_training - Step 32054: {'lr': 0.00045082875000478214, 'samples': 16412160, 'steps': 32054, 'loss/train': 1.1241240501403809} +03/05/2022 03:08:17 - INFO - codeparrot_training - Step 32055: {'lr': 0.0004508255895047368, 'samples': 16412672, 'steps': 32055, 'loss/train': 1.5277467966079712} +03/05/2022 03:08:17 - INFO - codeparrot_training - Skipping example with length 927 (seq_length=1024) +03/05/2022 03:08:23 - INFO - codeparrot_training - Step 32056: {'lr': 0.0004508224289142026, 'samples': 16413184, 'steps': 32056, 'loss/train': 2.0874884128570557} +03/05/2022 03:08:26 - INFO - codeparrot_training - Step 32057: {'lr': 0.0004508192682331809, 'samples': 16413696, 'steps': 32057, 'loss/train': 0.8028739094734192} +03/05/2022 03:08:26 - INFO - codeparrot_training - Skipping example with length 102 (seq_length=1024) +03/05/2022 03:08:31 - INFO - codeparrot_training - Step 32058: {'lr': 0.0004508161074616731, 'samples': 16414208, 'steps': 32058, 'loss/train': 1.8901517391204834} +03/05/2022 03:08:34 - INFO - codeparrot_training - Step 32059: {'lr': 0.0004508129465996806, 'samples': 16414720, 'steps': 32059, 'loss/train': 1.7314239740371704} +03/05/2022 03:08:34 - INFO - codeparrot_training - Skipping example with length 7 (seq_length=1024) +03/05/2022 03:08:39 - INFO - codeparrot_training - Step 32060: {'lr': 0.00045080978564720505, 'samples': 16415232, 'steps': 32060, 'loss/train': 1.623302936553955} +03/05/2022 03:08:42 - INFO - codeparrot_training - Skipping example with length 216 (seq_length=1024) +03/05/2022 03:08:45 - INFO - codeparrot_training - Step 32061: {'lr': 0.0004508066246042476, 'samples': 16415744, 'steps': 32061, 'loss/train': 1.3772215843200684} +03/05/2022 03:08:48 - INFO - codeparrot_training - Step 32062: {'lr': 0.0004508034634708098, 'samples': 16416256, 'steps': 32062, 'loss/train': 2.013273239135742} +03/05/2022 03:08:51 - INFO - codeparrot_training - Step 32063: {'lr': 0.0004508003022468931, 'samples': 16416768, 'steps': 32063, 'loss/train': 0.7460302114486694} +03/05/2022 03:08:52 - INFO - codeparrot_training - Skipping example with length 395 (seq_length=1024) +03/05/2022 03:08:57 - INFO - codeparrot_training - Step 32064: {'lr': 0.00045079714093249887, 'samples': 16417280, 'steps': 32064, 'loss/train': 2.743365526199341} +03/05/2022 03:09:00 - INFO - codeparrot_training - Step 32065: {'lr': 0.00045079397952762845, 'samples': 16417792, 'steps': 32065, 'loss/train': 1.7845908403396606} +03/05/2022 03:09:00 - INFO - codeparrot_training - Skipping example with length 147 (seq_length=1024) +03/05/2022 03:09:05 - INFO - codeparrot_training - Step 32066: {'lr': 0.0004507908180322835, 'samples': 16418304, 'steps': 32066, 'loss/train': 1.0195339918136597} +03/05/2022 03:09:08 - INFO - codeparrot_training - Step 32067: {'lr': 0.00045078765644646524, 'samples': 16418816, 'steps': 32067, 'loss/train': 0.47019922733306885} +03/05/2022 03:09:09 - INFO - codeparrot_training - Skipping example with length 399 (seq_length=1024) +03/05/2022 03:09:13 - INFO - codeparrot_training - Step 32068: {'lr': 0.00045078449477017516, 'samples': 16419328, 'steps': 32068, 'loss/train': 1.6027827262878418} +03/05/2022 03:09:16 - INFO - codeparrot_training - Step 32069: {'lr': 0.0004507813330034147, 'samples': 16419840, 'steps': 32069, 'loss/train': 1.9164011478424072} +03/05/2022 03:09:17 - INFO - codeparrot_training - Skipping example with length 126 (seq_length=1024) +03/05/2022 03:09:22 - INFO - codeparrot_training - Step 32070: {'lr': 0.00045077817114618526, 'samples': 16420352, 'steps': 32070, 'loss/train': 1.0379717350006104} +03/05/2022 03:09:25 - INFO - codeparrot_training - Step 32071: {'lr': 0.00045077500919848826, 'samples': 16420864, 'steps': 32071, 'loss/train': 0.3108794391155243} +03/05/2022 03:09:25 - INFO - codeparrot_training - Skipping example with length 134 (seq_length=1024) +03/05/2022 03:09:30 - INFO - codeparrot_training - Step 32072: {'lr': 0.00045077184716032516, 'samples': 16421376, 'steps': 32072, 'loss/train': 0.29869237542152405} +03/05/2022 03:09:33 - INFO - codeparrot_training - Step 32073: {'lr': 0.0004507686850316973, 'samples': 16421888, 'steps': 32073, 'loss/train': 0.6080016493797302} +03/05/2022 03:09:34 - INFO - codeparrot_training - Skipping example with length 699 (seq_length=1024) +03/05/2022 03:09:39 - INFO - codeparrot_training - Step 32074: {'lr': 0.00045076552281260625, 'samples': 16422400, 'steps': 32074, 'loss/train': 1.23614501953125} +03/05/2022 03:09:42 - INFO - codeparrot_training - Step 32075: {'lr': 0.0004507623605030533, 'samples': 16422912, 'steps': 32075, 'loss/train': 1.9865936040878296} +03/05/2022 03:09:42 - INFO - codeparrot_training - Skipping example with length 150 (seq_length=1024) +03/05/2022 03:09:47 - INFO - codeparrot_training - Step 32076: {'lr': 0.00045075919810304, 'samples': 16423424, 'steps': 32076, 'loss/train': 1.4212244749069214} +03/05/2022 03:09:50 - INFO - codeparrot_training - Step 32077: {'lr': 0.0004507560356125676, 'samples': 16423936, 'steps': 32077, 'loss/train': 2.2919249534606934} +03/05/2022 03:09:51 - INFO - codeparrot_training - Skipping example with length 793 (seq_length=1024) +03/05/2022 03:09:56 - INFO - codeparrot_training - Step 32078: {'lr': 0.0004507528730316377, 'samples': 16424448, 'steps': 32078, 'loss/train': 6.587907791137695} +03/05/2022 03:09:59 - INFO - codeparrot_training - Step 32079: {'lr': 0.0004507497103602517, 'samples': 16424960, 'steps': 32079, 'loss/train': 1.9072664976119995} +03/05/2022 03:10:00 - INFO - codeparrot_training - Skipping example with length 801 (seq_length=1024) +03/05/2022 03:10:05 - INFO - codeparrot_training - Step 32080: {'lr': 0.00045074654759841087, 'samples': 16425472, 'steps': 32080, 'loss/train': 1.9068021774291992} +03/05/2022 03:10:08 - INFO - codeparrot_training - Step 32081: {'lr': 0.00045074338474611683, 'samples': 16425984, 'steps': 32081, 'loss/train': 2.1290552616119385} +03/05/2022 03:10:11 - INFO - codeparrot_training - Step 32082: {'lr': 0.00045074022180337085, 'samples': 16426496, 'steps': 32082, 'loss/train': 1.9639488458633423} +03/05/2022 03:10:12 - INFO - codeparrot_training - Skipping example with length 356 (seq_length=1024) +03/05/2022 03:10:16 - INFO - codeparrot_training - Step 32083: {'lr': 0.0004507370587701745, 'samples': 16427008, 'steps': 32083, 'loss/train': 1.4790430068969727} +03/05/2022 03:10:20 - INFO - codeparrot_training - Step 32084: {'lr': 0.000450733895646529, 'samples': 16427520, 'steps': 32084, 'loss/train': 2.458078384399414} +03/05/2022 03:10:20 - INFO - codeparrot_training - Skipping example with length 370 (seq_length=1024) +03/05/2022 03:10:25 - INFO - codeparrot_training - Step 32085: {'lr': 0.00045073073243243603, 'samples': 16428032, 'steps': 32085, 'loss/train': 1.3728265762329102} +03/05/2022 03:10:28 - INFO - codeparrot_training - Step 32086: {'lr': 0.0004507275691278968, 'samples': 16428544, 'steps': 32086, 'loss/train': 1.599483847618103} +03/05/2022 03:10:29 - INFO - codeparrot_training - Skipping example with length 190 (seq_length=1024) +03/05/2022 03:10:33 - INFO - codeparrot_training - Step 32087: {'lr': 0.00045072440573291293, 'samples': 16429056, 'steps': 32087, 'loss/train': 1.1276015043258667} +03/05/2022 03:10:36 - INFO - codeparrot_training - Step 32088: {'lr': 0.0004507212422474857, 'samples': 16429568, 'steps': 32088, 'loss/train': 2.040832042694092} +03/05/2022 03:10:38 - INFO - codeparrot_training - Skipping example with length 201 (seq_length=1024) +03/05/2022 03:10:42 - INFO - codeparrot_training - Step 32089: {'lr': 0.0004507180786716165, 'samples': 16430080, 'steps': 32089, 'loss/train': 1.717200517654419} +03/05/2022 03:10:45 - INFO - codeparrot_training - Step 32090: {'lr': 0.00045071491500530694, 'samples': 16430592, 'steps': 32090, 'loss/train': 1.8143031597137451} +03/05/2022 03:10:46 - INFO - codeparrot_training - Skipping example with length 20 (seq_length=1024) +03/05/2022 03:10:50 - INFO - codeparrot_training - Step 32091: {'lr': 0.0004507117512485582, 'samples': 16431104, 'steps': 32091, 'loss/train': 1.9190293550491333} +03/05/2022 03:10:53 - INFO - codeparrot_training - Step 32092: {'lr': 0.000450708587401372, 'samples': 16431616, 'steps': 32092, 'loss/train': 1.321264386177063} +03/05/2022 03:10:54 - INFO - codeparrot_training - Skipping example with length 679 (seq_length=1024) +03/05/2022 03:10:59 - INFO - codeparrot_training - Step 32093: {'lr': 0.0004507054234637495, 'samples': 16432128, 'steps': 32093, 'loss/train': 2.015144109725952} +03/05/2022 03:11:02 - INFO - codeparrot_training - Step 32094: {'lr': 0.0004507022594356922, 'samples': 16432640, 'steps': 32094, 'loss/train': 1.2830841541290283} +03/05/2022 03:11:02 - INFO - codeparrot_training - Skipping example with length 741 (seq_length=1024) +03/05/2022 03:11:07 - INFO - codeparrot_training - Step 32095: {'lr': 0.00045069909531720166, 'samples': 16433152, 'steps': 32095, 'loss/train': 1.311087965965271} +03/05/2022 03:11:10 - INFO - codeparrot_training - Step 32096: {'lr': 0.0004506959311082792, 'samples': 16433664, 'steps': 32096, 'loss/train': 2.7646584510803223} +03/05/2022 03:11:12 - INFO - codeparrot_training - Skipping example with length 418 (seq_length=1024) +03/05/2022 03:11:16 - INFO - codeparrot_training - Step 32097: {'lr': 0.00045069276680892624, 'samples': 16434176, 'steps': 32097, 'loss/train': 2.0605690479278564} +03/05/2022 03:11:19 - INFO - codeparrot_training - Step 32098: {'lr': 0.00045068960241914413, 'samples': 16434688, 'steps': 32098, 'loss/train': 1.7242608070373535} +03/05/2022 03:11:20 - INFO - codeparrot_training - Skipping example with length 876 (seq_length=1024) +03/05/2022 03:11:24 - INFO - codeparrot_training - Step 32099: {'lr': 0.00045068643793893447, 'samples': 16435200, 'steps': 32099, 'loss/train': 1.7715922594070435} +03/05/2022 03:11:27 - INFO - codeparrot_training - Step 32100: {'lr': 0.0004506832733682986, 'samples': 16435712, 'steps': 32100, 'loss/train': 0.8491368889808655} +03/05/2022 03:11:28 - INFO - codeparrot_training - Skipping example with length 433 (seq_length=1024) +03/05/2022 03:11:32 - INFO - codeparrot_training - Step 32101: {'lr': 0.00045068010870723783, 'samples': 16436224, 'steps': 32101, 'loss/train': 2.4156553745269775} +03/05/2022 03:11:36 - INFO - codeparrot_training - Step 32102: {'lr': 0.00045067694395575385, 'samples': 16436736, 'steps': 32102, 'loss/train': 1.5904183387756348} +03/05/2022 03:11:37 - INFO - codeparrot_training - Skipping example with length 595 (seq_length=1024) +03/05/2022 03:11:41 - INFO - codeparrot_training - Step 32103: {'lr': 0.0004506737791138479, 'samples': 16437248, 'steps': 32103, 'loss/train': 1.099422812461853} +03/05/2022 03:11:44 - INFO - codeparrot_training - Step 32104: {'lr': 0.00045067061418152136, 'samples': 16437760, 'steps': 32104, 'loss/train': 1.9458777904510498} +03/05/2022 03:11:45 - INFO - codeparrot_training - Skipping example with length 954 (seq_length=1024) +03/05/2022 03:11:49 - INFO - codeparrot_training - Step 32105: {'lr': 0.00045066744915877585, 'samples': 16438272, 'steps': 32105, 'loss/train': 2.10386323928833} +03/05/2022 03:11:53 - INFO - codeparrot_training - Step 32106: {'lr': 0.0004506642840456126, 'samples': 16438784, 'steps': 32106, 'loss/train': 1.757859468460083} +03/05/2022 03:11:54 - INFO - codeparrot_training - Skipping example with length 157 (seq_length=1024) +03/05/2022 03:11:58 - INFO - codeparrot_training - Step 32107: {'lr': 0.00045066111884203315, 'samples': 16439296, 'steps': 32107, 'loss/train': 1.5780664682388306} +03/05/2022 03:12:01 - INFO - codeparrot_training - Step 32108: {'lr': 0.0004506579535480389, 'samples': 16439808, 'steps': 32108, 'loss/train': 1.497854232788086} +03/05/2022 03:12:02 - INFO - codeparrot_training - Skipping example with length 97 (seq_length=1024) +03/05/2022 03:12:06 - INFO - codeparrot_training - Step 32109: {'lr': 0.00045065478816363124, 'samples': 16440320, 'steps': 32109, 'loss/train': 2.388638496398926} +03/05/2022 03:12:09 - INFO - codeparrot_training - Step 32110: {'lr': 0.00045065162268881164, 'samples': 16440832, 'steps': 32110, 'loss/train': 1.997281789779663} +03/05/2022 03:12:10 - INFO - codeparrot_training - Skipping example with length 1014 (seq_length=1024) +03/05/2022 03:12:15 - INFO - codeparrot_training - Step 32111: {'lr': 0.0004506484571235816, 'samples': 16441344, 'steps': 32111, 'loss/train': 1.5788021087646484} +03/05/2022 03:12:18 - INFO - codeparrot_training - Step 32112: {'lr': 0.00045064529146794234, 'samples': 16441856, 'steps': 32112, 'loss/train': 2.4255483150482178} +03/05/2022 03:12:19 - INFO - codeparrot_training - Skipping example with length 98 (seq_length=1024) +03/05/2022 03:12:23 - INFO - codeparrot_training - Step 32113: {'lr': 0.0004506421257218955, 'samples': 16442368, 'steps': 32113, 'loss/train': 2.302644729614258} +03/05/2022 03:12:27 - INFO - codeparrot_training - Step 32114: {'lr': 0.00045063895988544235, 'samples': 16442880, 'steps': 32114, 'loss/train': 2.1795966625213623} +03/05/2022 03:12:28 - INFO - codeparrot_training - Skipping example with length 103 (seq_length=1024) +03/05/2022 03:12:32 - INFO - codeparrot_training - Step 32115: {'lr': 0.00045063579395858444, 'samples': 16443392, 'steps': 32115, 'loss/train': 1.6226500272750854} +03/05/2022 03:12:35 - INFO - codeparrot_training - Step 32116: {'lr': 0.0004506326279413231, 'samples': 16443904, 'steps': 32116, 'loss/train': 1.461987018585205} +03/05/2022 03:12:36 - INFO - codeparrot_training - Skipping example with length 308 (seq_length=1024) +03/05/2022 03:12:40 - INFO - codeparrot_training - Step 32117: {'lr': 0.0004506294618336598, 'samples': 16444416, 'steps': 32117, 'loss/train': 1.177091121673584} +03/05/2022 03:12:43 - INFO - codeparrot_training - Step 32118: {'lr': 0.00045062629563559595, 'samples': 16444928, 'steps': 32118, 'loss/train': 1.8922208547592163} +03/05/2022 03:12:45 - INFO - codeparrot_training - Skipping example with length 899 (seq_length=1024) +03/05/2022 03:12:49 - INFO - codeparrot_training - Step 32119: {'lr': 0.00045062312934713303, 'samples': 16445440, 'steps': 32119, 'loss/train': 1.8817964792251587} +03/05/2022 03:12:52 - INFO - codeparrot_training - Step 32120: {'lr': 0.00045061996296827237, 'samples': 16445952, 'steps': 32120, 'loss/train': 1.4593420028686523} +03/05/2022 03:12:54 - INFO - codeparrot_training - Skipping example with length 1019 (seq_length=1024) +03/05/2022 03:12:57 - INFO - codeparrot_training - Step 32121: {'lr': 0.00045061679649901543, 'samples': 16446464, 'steps': 32121, 'loss/train': 1.780485987663269} +03/05/2022 03:13:00 - INFO - codeparrot_training - Step 32122: {'lr': 0.00045061362993936374, 'samples': 16446976, 'steps': 32122, 'loss/train': 1.5574488639831543} +03/05/2022 03:13:02 - INFO - codeparrot_training - Skipping example with length 615 (seq_length=1024) +03/05/2022 03:13:05 - INFO - codeparrot_training - Step 32123: {'lr': 0.0004506104632893185, 'samples': 16447488, 'steps': 32123, 'loss/train': 2.1572587490081787} +03/05/2022 03:13:09 - INFO - codeparrot_training - Step 32124: {'lr': 0.00045060729654888143, 'samples': 16448000, 'steps': 32124, 'loss/train': 1.518384575843811} +03/05/2022 03:13:10 - INFO - codeparrot_training - Skipping example with length 497 (seq_length=1024) +03/05/2022 03:13:14 - INFO - codeparrot_training - Step 32125: {'lr': 0.00045060412971805375, 'samples': 16448512, 'steps': 32125, 'loss/train': 2.67118763923645} +03/05/2022 03:13:17 - INFO - codeparrot_training - Step 32126: {'lr': 0.00045060096279683694, 'samples': 16449024, 'steps': 32126, 'loss/train': 2.283170461654663} +03/05/2022 03:13:19 - INFO - codeparrot_training - Skipping example with length 184 (seq_length=1024) +03/05/2022 03:13:22 - INFO - codeparrot_training - Step 32127: {'lr': 0.0004505977957852325, 'samples': 16449536, 'steps': 32127, 'loss/train': 1.9854600429534912} +03/05/2022 03:13:26 - INFO - codeparrot_training - Step 32128: {'lr': 0.00045059462868324177, 'samples': 16450048, 'steps': 32128, 'loss/train': 2.2117459774017334} +03/05/2022 03:13:28 - INFO - codeparrot_training - Skipping example with length 349 (seq_length=1024) +03/05/2022 03:13:31 - INFO - codeparrot_training - Step 32129: {'lr': 0.00045059146149086605, 'samples': 16450560, 'steps': 32129, 'loss/train': 1.4528615474700928} +03/05/2022 03:13:34 - INFO - codeparrot_training - Step 32130: {'lr': 0.00045058829420810707, 'samples': 16451072, 'steps': 32130, 'loss/train': 1.0567272901535034} +03/05/2022 03:13:37 - INFO - codeparrot_training - Skipping example with length 338 (seq_length=1024) +03/05/2022 03:13:39 - INFO - codeparrot_training - Step 32131: {'lr': 0.00045058512683496607, 'samples': 16451584, 'steps': 32131, 'loss/train': 2.081271171569824} +03/05/2022 03:13:42 - INFO - codeparrot_training - Step 32132: {'lr': 0.00045058195937144446, 'samples': 16452096, 'steps': 32132, 'loss/train': 1.5891145467758179} +03/05/2022 03:13:45 - INFO - codeparrot_training - Skipping example with length 469 (seq_length=1024) +03/05/2022 03:13:48 - INFO - codeparrot_training - Step 32133: {'lr': 0.00045057879181754375, 'samples': 16452608, 'steps': 32133, 'loss/train': 1.8834021091461182} +03/05/2022 03:13:51 - INFO - codeparrot_training - Step 32134: {'lr': 0.0004505756241732653, 'samples': 16453120, 'steps': 32134, 'loss/train': 1.3042086362838745} +03/05/2022 03:13:53 - INFO - codeparrot_training - Skipping example with length 970 (seq_length=1024) +03/05/2022 03:13:56 - INFO - codeparrot_training - Step 32135: {'lr': 0.0004505724564386106, 'samples': 16453632, 'steps': 32135, 'loss/train': 1.8343548774719238} +03/05/2022 03:13:59 - INFO - codeparrot_training - Step 32136: {'lr': 0.00045056928861358106, 'samples': 16454144, 'steps': 32136, 'loss/train': 2.023365020751953} +03/05/2022 03:14:02 - INFO - codeparrot_training - Skipping example with length 140 (seq_length=1024) +03/05/2022 03:14:05 - INFO - codeparrot_training - Step 32137: {'lr': 0.000450566120698178, 'samples': 16454656, 'steps': 32137, 'loss/train': 1.7368501424789429} +03/05/2022 03:14:08 - INFO - codeparrot_training - Step 32138: {'lr': 0.0004505629526924031, 'samples': 16455168, 'steps': 32138, 'loss/train': 2.8090903759002686} +03/05/2022 03:14:10 - INFO - codeparrot_training - Skipping example with length 471 (seq_length=1024) +03/05/2022 03:14:13 - INFO - codeparrot_training - Step 32139: {'lr': 0.0004505597845962575, 'samples': 16455680, 'steps': 32139, 'loss/train': 2.1710009574890137} +03/05/2022 03:14:16 - INFO - codeparrot_training - Step 32140: {'lr': 0.0004505566164097428, 'samples': 16456192, 'steps': 32140, 'loss/train': 1.9724067449569702} +03/05/2022 03:14:19 - INFO - codeparrot_training - Skipping example with length 836 (seq_length=1024) +03/05/2022 03:14:21 - INFO - codeparrot_training - Step 32141: {'lr': 0.0004505534481328604, 'samples': 16456704, 'steps': 32141, 'loss/train': 0.9738463759422302} +03/05/2022 03:14:25 - INFO - codeparrot_training - Step 32142: {'lr': 0.0004505502797656117, 'samples': 16457216, 'steps': 32142, 'loss/train': 0.8872283101081848} +03/05/2022 03:14:27 - INFO - codeparrot_training - Skipping example with length 588 (seq_length=1024) +03/05/2022 03:14:30 - INFO - codeparrot_training - Step 32143: {'lr': 0.00045054711130799806, 'samples': 16457728, 'steps': 32143, 'loss/train': 1.1109455823898315} +03/05/2022 03:14:33 - INFO - codeparrot_training - Step 32144: {'lr': 0.00045054394276002106, 'samples': 16458240, 'steps': 32144, 'loss/train': 1.1003745794296265} +03/05/2022 03:14:35 - INFO - codeparrot_training - Skipping example with length 17 (seq_length=1024) +03/05/2022 03:14:38 - INFO - codeparrot_training - Step 32145: {'lr': 0.00045054077412168215, 'samples': 16458752, 'steps': 32145, 'loss/train': 2.4092071056365967} +03/05/2022 03:14:41 - INFO - codeparrot_training - Step 32146: {'lr': 0.0004505376053929825, 'samples': 16459264, 'steps': 32146, 'loss/train': 1.9454472064971924} +03/05/2022 03:14:44 - INFO - codeparrot_training - Skipping example with length 683 (seq_length=1024) +03/05/2022 03:14:47 - INFO - codeparrot_training - Step 32147: {'lr': 0.0004505344365739238, 'samples': 16459776, 'steps': 32147, 'loss/train': 2.153879165649414} +03/05/2022 03:14:50 - INFO - codeparrot_training - Step 32148: {'lr': 0.0004505312676645073, 'samples': 16460288, 'steps': 32148, 'loss/train': 2.1145272254943848} +03/05/2022 03:14:52 - INFO - codeparrot_training - Skipping example with length 677 (seq_length=1024) +03/05/2022 03:14:55 - INFO - codeparrot_training - Step 32149: {'lr': 0.00045052809866473454, 'samples': 16460800, 'steps': 32149, 'loss/train': 0.2470967024564743} +03/05/2022 03:14:58 - INFO - codeparrot_training - Step 32150: {'lr': 0.00045052492957460696, 'samples': 16461312, 'steps': 32150, 'loss/train': 2.1979258060455322} +03/05/2022 03:15:00 - INFO - codeparrot_training - Skipping example with length 75 (seq_length=1024) +03/05/2022 03:15:03 - INFO - codeparrot_training - Step 32151: {'lr': 0.00045052176039412587, 'samples': 16461824, 'steps': 32151, 'loss/train': 0.9724978804588318} +03/05/2022 03:15:07 - INFO - codeparrot_training - Step 32152: {'lr': 0.0004505185911232928, 'samples': 16462336, 'steps': 32152, 'loss/train': 1.855562448501587} +03/05/2022 03:15:08 - INFO - codeparrot_training - Skipping example with length 468 (seq_length=1024) +03/05/2022 03:15:12 - INFO - codeparrot_training - Step 32153: {'lr': 0.00045051542176210914, 'samples': 16462848, 'steps': 32153, 'loss/train': 2.0042941570281982} +03/05/2022 03:15:15 - INFO - codeparrot_training - Step 32154: {'lr': 0.0004505122523105764, 'samples': 16463360, 'steps': 32154, 'loss/train': 0.3884555995464325} +03/05/2022 03:15:17 - INFO - codeparrot_training - Skipping example with length 392 (seq_length=1024) +03/05/2022 03:15:20 - INFO - codeparrot_training - Step 32155: {'lr': 0.00045050908276869585, 'samples': 16463872, 'steps': 32155, 'loss/train': 2.0705671310424805} +03/05/2022 03:15:23 - INFO - codeparrot_training - Step 32156: {'lr': 0.0004505059131364689, 'samples': 16464384, 'steps': 32156, 'loss/train': 2.1798617839813232} +03/05/2022 03:15:25 - INFO - codeparrot_training - Skipping example with length 824 (seq_length=1024) +03/05/2022 03:15:29 - INFO - codeparrot_training - Step 32157: {'lr': 0.00045050274341389726, 'samples': 16464896, 'steps': 32157, 'loss/train': 2.2720835208892822} +03/05/2022 03:15:32 - INFO - codeparrot_training - Step 32158: {'lr': 0.00045049957360098207, 'samples': 16465408, 'steps': 32158, 'loss/train': 0.6701028943061829} +03/05/2022 03:15:34 - INFO - codeparrot_training - Skipping example with length 807 (seq_length=1024) +03/05/2022 03:15:37 - INFO - codeparrot_training - Step 32159: {'lr': 0.0004504964036977249, 'samples': 16465920, 'steps': 32159, 'loss/train': 1.919608235359192} +03/05/2022 03:15:40 - INFO - codeparrot_training - Step 32160: {'lr': 0.00045049323370412723, 'samples': 16466432, 'steps': 32160, 'loss/train': 1.891566276550293} +03/05/2022 03:15:42 - INFO - codeparrot_training - Skipping example with length 436 (seq_length=1024) +03/05/2022 03:15:46 - INFO - codeparrot_training - Step 32161: {'lr': 0.0004504900636201903, 'samples': 16466944, 'steps': 32161, 'loss/train': 0.7414053678512573} +03/05/2022 03:15:49 - INFO - codeparrot_training - Step 32162: {'lr': 0.00045048689344591566, 'samples': 16467456, 'steps': 32162, 'loss/train': 1.5685561895370483} +03/05/2022 03:15:50 - INFO - codeparrot_training - Skipping example with length 864 (seq_length=1024) +03/05/2022 03:15:54 - INFO - codeparrot_training - Step 32163: {'lr': 0.0004504837231813047, 'samples': 16467968, 'steps': 32163, 'loss/train': 1.1673611402511597} +03/05/2022 03:15:57 - INFO - codeparrot_training - Step 32164: {'lr': 0.0004504805528263589, 'samples': 16468480, 'steps': 32164, 'loss/train': 1.5249865055084229} +03/05/2022 03:15:58 - INFO - codeparrot_training - Skipping example with length 944 (seq_length=1024) +03/05/2022 03:16:02 - INFO - codeparrot_training - Step 32165: {'lr': 0.00045047738238107967, 'samples': 16468992, 'steps': 32165, 'loss/train': 2.3334567546844482} +03/05/2022 03:16:06 - INFO - codeparrot_training - Step 32166: {'lr': 0.00045047421184546844, 'samples': 16469504, 'steps': 32166, 'loss/train': 2.0946598052978516} +03/05/2022 03:16:07 - INFO - codeparrot_training - Skipping example with length 810 (seq_length=1024) +03/05/2022 03:16:11 - INFO - codeparrot_training - Step 32167: {'lr': 0.0004504710412195265, 'samples': 16470016, 'steps': 32167, 'loss/train': 1.774285912513733} +03/05/2022 03:16:14 - INFO - codeparrot_training - Step 32168: {'lr': 0.00045046787050325555, 'samples': 16470528, 'steps': 32168, 'loss/train': 1.5887900590896606} +03/05/2022 03:16:15 - INFO - codeparrot_training - Skipping example with length 112 (seq_length=1024) +03/05/2022 03:16:19 - INFO - codeparrot_training - Step 32169: {'lr': 0.0004504646996966568, 'samples': 16471040, 'steps': 32169, 'loss/train': 1.6910507678985596} +03/05/2022 03:16:22 - INFO - codeparrot_training - Step 32170: {'lr': 0.0004504615287997318, 'samples': 16471552, 'steps': 32170, 'loss/train': 2.180844783782959} +03/05/2022 03:16:24 - INFO - codeparrot_training - Skipping example with length 779 (seq_length=1024) +03/05/2022 03:16:28 - INFO - codeparrot_training - Step 32171: {'lr': 0.00045045835781248184, 'samples': 16472064, 'steps': 32171, 'loss/train': 2.855029582977295} +03/05/2022 03:16:31 - INFO - codeparrot_training - Step 32172: {'lr': 0.0004504551867349085, 'samples': 16472576, 'steps': 32172, 'loss/train': 1.0955774784088135} +03/05/2022 03:16:33 - INFO - codeparrot_training - Skipping example with length 628 (seq_length=1024) +03/05/2022 03:16:36 - INFO - codeparrot_training - Step 32173: {'lr': 0.0004504520155670131, 'samples': 16473088, 'steps': 32173, 'loss/train': 1.2767086029052734} +03/05/2022 03:16:39 - INFO - codeparrot_training - Step 32174: {'lr': 0.0004504488443087972, 'samples': 16473600, 'steps': 32174, 'loss/train': 2.0411813259124756} +03/05/2022 03:16:41 - INFO - codeparrot_training - Skipping example with length 390 (seq_length=1024) +03/05/2022 03:16:45 - INFO - codeparrot_training - Step 32175: {'lr': 0.00045044567296026206, 'samples': 16474112, 'steps': 32175, 'loss/train': 1.4554191827774048} +03/05/2022 03:16:48 - INFO - codeparrot_training - Step 32176: {'lr': 0.0004504425015214092, 'samples': 16474624, 'steps': 32176, 'loss/train': 1.8240692615509033} +03/05/2022 03:16:49 - INFO - codeparrot_training - Skipping example with length 132 (seq_length=1024) +03/05/2022 03:16:53 - INFO - codeparrot_training - Step 32177: {'lr': 0.00045043932999224015, 'samples': 16475136, 'steps': 32177, 'loss/train': 1.536206841468811} +03/05/2022 03:16:56 - INFO - codeparrot_training - Step 32178: {'lr': 0.00045043615837275607, 'samples': 16475648, 'steps': 32178, 'loss/train': 1.7384963035583496} +03/05/2022 03:16:58 - INFO - codeparrot_training - Skipping example with length 888 (seq_length=1024) +03/05/2022 03:17:02 - INFO - codeparrot_training - Step 32179: {'lr': 0.0004504329866629586, 'samples': 16476160, 'steps': 32179, 'loss/train': 1.7710537910461426} +03/05/2022 03:17:05 - INFO - codeparrot_training - Step 32180: {'lr': 0.0004504298148628492, 'samples': 16476672, 'steps': 32180, 'loss/train': 2.001732587814331} +03/05/2022 03:17:07 - INFO - codeparrot_training - Skipping example with length 634 (seq_length=1024) +03/05/2022 03:17:10 - INFO - codeparrot_training - Step 32181: {'lr': 0.0004504266429724292, 'samples': 16477184, 'steps': 32181, 'loss/train': 1.115587830543518} +03/05/2022 03:17:14 - INFO - codeparrot_training - Step 32182: {'lr': 0.0004504234709917, 'samples': 16477696, 'steps': 32182, 'loss/train': 2.181873321533203} +03/05/2022 03:17:16 - INFO - codeparrot_training - Skipping example with length 471 (seq_length=1024) +03/05/2022 03:17:19 - INFO - codeparrot_training - Step 32183: {'lr': 0.00045042029892066306, 'samples': 16478208, 'steps': 32183, 'loss/train': 0.6127412915229797} +03/05/2022 03:17:22 - INFO - codeparrot_training - Step 32184: {'lr': 0.00045041712675931983, 'samples': 16478720, 'steps': 32184, 'loss/train': 0.10254140198230743} +03/05/2022 03:17:24 - INFO - codeparrot_training - Skipping example with length 600 (seq_length=1024) +03/05/2022 03:17:27 - INFO - codeparrot_training - Step 32185: {'lr': 0.0004504139545076717, 'samples': 16479232, 'steps': 32185, 'loss/train': 1.8352134227752686} +03/05/2022 03:17:30 - INFO - codeparrot_training - Step 32186: {'lr': 0.0004504107821657203, 'samples': 16479744, 'steps': 32186, 'loss/train': 2.150118112564087} +03/05/2022 03:17:32 - INFO - codeparrot_training - Skipping example with length 269 (seq_length=1024) +03/05/2022 03:17:36 - INFO - codeparrot_training - Step 32187: {'lr': 0.00045040760973346673, 'samples': 16480256, 'steps': 32187, 'loss/train': 2.707380533218384} +03/05/2022 03:17:39 - INFO - codeparrot_training - Step 32188: {'lr': 0.00045040443721091266, 'samples': 16480768, 'steps': 32188, 'loss/train': 1.8270772695541382} +03/05/2022 03:17:41 - INFO - codeparrot_training - Skipping example with length 746 (seq_length=1024) +03/05/2022 03:17:44 - INFO - codeparrot_training - Step 32189: {'lr': 0.0004504012645980594, 'samples': 16481280, 'steps': 32189, 'loss/train': 0.22897309064865112} +03/05/2022 03:17:47 - INFO - codeparrot_training - Step 32190: {'lr': 0.0004503980918949085, 'samples': 16481792, 'steps': 32190, 'loss/train': 1.241885781288147} +03/05/2022 03:17:49 - INFO - codeparrot_training - Skipping example with length 935 (seq_length=1024) +03/05/2022 03:17:53 - INFO - codeparrot_training - Step 32191: {'lr': 0.00045039491910146124, 'samples': 16482304, 'steps': 32191, 'loss/train': 1.7181458473205566} +03/05/2022 03:17:56 - INFO - codeparrot_training - Step 32192: {'lr': 0.00045039174621771915, 'samples': 16482816, 'steps': 32192, 'loss/train': 2.6758923530578613} +03/05/2022 03:17:57 - INFO - codeparrot_training - Skipping example with length 268 (seq_length=1024) +03/05/2022 03:18:01 - INFO - codeparrot_training - Step 32193: {'lr': 0.00045038857324368367, 'samples': 16483328, 'steps': 32193, 'loss/train': 0.6276638507843018} +03/05/2022 03:18:04 - INFO - codeparrot_training - Step 32194: {'lr': 0.0004503854001793561, 'samples': 16483840, 'steps': 32194, 'loss/train': 0.07944183051586151} +03/05/2022 03:18:06 - INFO - codeparrot_training - Skipping example with length 933 (seq_length=1024) +03/05/2022 03:18:10 - INFO - codeparrot_training - Step 32195: {'lr': 0.00045038222702473797, 'samples': 16484352, 'steps': 32195, 'loss/train': 2.2628095149993896} +03/05/2022 03:18:13 - INFO - codeparrot_training - Step 32196: {'lr': 0.0004503790537798308, 'samples': 16484864, 'steps': 32196, 'loss/train': 1.309360384941101} +03/05/2022 03:18:14 - INFO - codeparrot_training - Skipping example with length 335 (seq_length=1024) +03/05/2022 03:18:18 - INFO - codeparrot_training - Step 32197: {'lr': 0.00045037588044463586, 'samples': 16485376, 'steps': 32197, 'loss/train': 1.5654950141906738} +03/05/2022 03:18:21 - INFO - codeparrot_training - Step 32198: {'lr': 0.00045037270701915464, 'samples': 16485888, 'steps': 32198, 'loss/train': 2.325202226638794} +03/05/2022 03:18:22 - INFO - codeparrot_training - Skipping example with length 678 (seq_length=1024) +03/05/2022 03:18:26 - INFO - codeparrot_training - Step 32199: {'lr': 0.0004503695335033885, 'samples': 16486400, 'steps': 32199, 'loss/train': 1.2658920288085938} +03/05/2022 03:18:30 - INFO - codeparrot_training - Step 32200: {'lr': 0.00045036635989733904, 'samples': 16486912, 'steps': 32200, 'loss/train': 1.9737051725387573} +03/05/2022 03:18:31 - INFO - codeparrot_training - Skipping example with length 564 (seq_length=1024) +03/05/2022 03:18:35 - INFO - codeparrot_training - Step 32201: {'lr': 0.0004503631862010076, 'samples': 16487424, 'steps': 32201, 'loss/train': 1.3811358213424683} +03/05/2022 03:18:38 - INFO - codeparrot_training - Step 32202: {'lr': 0.0004503600124143955, 'samples': 16487936, 'steps': 32202, 'loss/train': 1.3133983612060547} +03/05/2022 03:18:39 - INFO - codeparrot_training - Skipping example with length 261 (seq_length=1024) +03/05/2022 03:18:43 - INFO - codeparrot_training - Step 32203: {'lr': 0.0004503568385375043, 'samples': 16488448, 'steps': 32203, 'loss/train': 1.7754358053207397} +03/05/2022 03:18:46 - INFO - codeparrot_training - Step 32204: {'lr': 0.00045035366457033546, 'samples': 16488960, 'steps': 32204, 'loss/train': 1.7398165464401245} +03/05/2022 03:18:47 - INFO - codeparrot_training - Skipping example with length 900 (seq_length=1024) +03/05/2022 03:18:52 - INFO - codeparrot_training - Step 32205: {'lr': 0.00045035049051289037, 'samples': 16489472, 'steps': 32205, 'loss/train': 1.4337958097457886} +03/05/2022 03:18:55 - INFO - codeparrot_training - Step 32206: {'lr': 0.00045034731636517036, 'samples': 16489984, 'steps': 32206, 'loss/train': 1.1567484140396118} +03/05/2022 03:18:55 - INFO - codeparrot_training - Skipping example with length 115 (seq_length=1024) +03/05/2022 03:19:00 - INFO - codeparrot_training - Step 32207: {'lr': 0.0004503441421271769, 'samples': 16490496, 'steps': 32207, 'loss/train': 1.896597981452942} +03/05/2022 03:19:03 - INFO - codeparrot_training - Step 32208: {'lr': 0.0004503409677989115, 'samples': 16491008, 'steps': 32208, 'loss/train': 1.7100908756256104} +03/05/2022 03:19:04 - INFO - codeparrot_training - Skipping example with length 1020 (seq_length=1024) +03/05/2022 03:19:08 - INFO - codeparrot_training - Step 32209: {'lr': 0.00045033779338037565, 'samples': 16491520, 'steps': 32209, 'loss/train': 1.4443621635437012} +03/05/2022 03:19:12 - INFO - codeparrot_training - Step 32210: {'lr': 0.0004503346188715706, 'samples': 16492032, 'steps': 32210, 'loss/train': 1.5934430360794067} +03/05/2022 03:19:12 - INFO - codeparrot_training - Skipping example with length 114 (seq_length=1024) +03/05/2022 03:19:17 - INFO - codeparrot_training - Step 32211: {'lr': 0.0004503314442724979, 'samples': 16492544, 'steps': 32211, 'loss/train': 1.5583096742630005} +03/05/2022 03:19:20 - INFO - codeparrot_training - Step 32212: {'lr': 0.0004503282695831589, 'samples': 16493056, 'steps': 32212, 'loss/train': 1.3145238161087036} +03/05/2022 03:19:21 - INFO - codeparrot_training - Skipping example with length 130 (seq_length=1024) +03/05/2022 03:19:25 - INFO - codeparrot_training - Step 32213: {'lr': 0.0004503250948035551, 'samples': 16493568, 'steps': 32213, 'loss/train': 1.9637290239334106} +03/05/2022 03:19:29 - INFO - codeparrot_training - Step 32214: {'lr': 0.0004503219199336879, 'samples': 16494080, 'steps': 32214, 'loss/train': 1.4416959285736084} +03/05/2022 03:19:29 - INFO - codeparrot_training - Skipping example with length 107 (seq_length=1024) +03/05/2022 03:19:34 - INFO - codeparrot_training - Step 32215: {'lr': 0.00045031874497355876, 'samples': 16494592, 'steps': 32215, 'loss/train': 0.8577883839607239} +03/05/2022 03:19:37 - INFO - codeparrot_training - Step 32216: {'lr': 0.000450315569923169, 'samples': 16495104, 'steps': 32216, 'loss/train': 2.0951616764068604} +03/05/2022 03:19:37 - INFO - codeparrot_training - Skipping example with length 340 (seq_length=1024) +03/05/2022 03:19:42 - INFO - codeparrot_training - Step 32217: {'lr': 0.00045031239478252017, 'samples': 16495616, 'steps': 32217, 'loss/train': 0.8503124117851257} +03/05/2022 03:19:46 - INFO - codeparrot_training - Step 32218: {'lr': 0.00045030921955161373, 'samples': 16496128, 'steps': 32218, 'loss/train': 2.3442375659942627} +03/05/2022 03:19:46 - INFO - codeparrot_training - Skipping example with length 219 (seq_length=1024) +03/05/2022 03:19:51 - INFO - codeparrot_training - Step 32219: {'lr': 0.000450306044230451, 'samples': 16496640, 'steps': 32219, 'loss/train': 1.560167670249939} +03/05/2022 03:19:54 - INFO - codeparrot_training - Step 32220: {'lr': 0.0004503028688190335, 'samples': 16497152, 'steps': 32220, 'loss/train': 1.4374396800994873} +03/05/2022 03:19:54 - INFO - codeparrot_training - Skipping example with length 17 (seq_length=1024) +03/05/2022 03:19:59 - INFO - codeparrot_training - Step 32221: {'lr': 0.00045029969331736254, 'samples': 16497664, 'steps': 32221, 'loss/train': 1.1682209968566895} +03/05/2022 03:20:02 - INFO - codeparrot_training - Step 32222: {'lr': 0.00045029651772543965, 'samples': 16498176, 'steps': 32222, 'loss/train': 1.8078739643096924} +03/05/2022 03:20:02 - INFO - codeparrot_training - Skipping example with length 801 (seq_length=1024) +03/05/2022 03:20:08 - INFO - codeparrot_training - Step 32223: {'lr': 0.0004502933420432662, 'samples': 16498688, 'steps': 32223, 'loss/train': 2.119680166244507} +03/05/2022 03:20:11 - INFO - codeparrot_training - Step 32224: {'lr': 0.0004502901662708437, 'samples': 16499200, 'steps': 32224, 'loss/train': 1.6902843713760376} +03/05/2022 03:20:12 - INFO - codeparrot_training - Skipping example with length 999 (seq_length=1024) +03/05/2022 03:20:16 - INFO - codeparrot_training - Step 32225: {'lr': 0.0004502869904081736, 'samples': 16499712, 'steps': 32225, 'loss/train': 1.5183053016662598} +03/05/2022 03:20:20 - INFO - codeparrot_training - Step 32226: {'lr': 0.00045028381445525725, 'samples': 16500224, 'steps': 32226, 'loss/train': 2.439406156539917} +03/05/2022 03:20:20 - INFO - codeparrot_training - Skipping example with length 944 (seq_length=1024) +03/05/2022 03:20:25 - INFO - codeparrot_training - Step 32227: {'lr': 0.0004502806384120961, 'samples': 16500736, 'steps': 32227, 'loss/train': 1.5894701480865479} +03/05/2022 03:20:28 - INFO - codeparrot_training - Step 32228: {'lr': 0.0004502774622786915, 'samples': 16501248, 'steps': 32228, 'loss/train': 2.3167834281921387} +03/05/2022 03:20:29 - INFO - codeparrot_training - Skipping example with length 645 (seq_length=1024) +03/05/2022 03:20:33 - INFO - codeparrot_training - Step 32229: {'lr': 0.00045027428605504507, 'samples': 16501760, 'steps': 32229, 'loss/train': 2.0827436447143555} +03/05/2022 03:20:37 - INFO - codeparrot_training - Step 32230: {'lr': 0.00045027110974115814, 'samples': 16502272, 'steps': 32230, 'loss/train': 1.519816279411316} +03/05/2022 03:20:37 - INFO - codeparrot_training - Skipping example with length 908 (seq_length=1024) +03/05/2022 03:20:42 - INFO - codeparrot_training - Step 32231: {'lr': 0.0004502679333370321, 'samples': 16502784, 'steps': 32231, 'loss/train': 1.6383501291275024} +03/05/2022 03:20:45 - INFO - codeparrot_training - Step 32232: {'lr': 0.0004502647568426684, 'samples': 16503296, 'steps': 32232, 'loss/train': 1.9301764965057373} +03/05/2022 03:20:46 - INFO - codeparrot_training - Skipping example with length 804 (seq_length=1024) +03/05/2022 03:20:50 - INFO - codeparrot_training - Step 32233: {'lr': 0.0004502615802580685, 'samples': 16503808, 'steps': 32233, 'loss/train': 2.0161755084991455} +03/05/2022 03:20:53 - INFO - codeparrot_training - Step 32234: {'lr': 0.0004502584035832338, 'samples': 16504320, 'steps': 32234, 'loss/train': 0.96965491771698} +03/05/2022 03:20:54 - INFO - codeparrot_training - Skipping example with length 775 (seq_length=1024) +03/05/2022 03:20:59 - INFO - codeparrot_training - Step 32235: {'lr': 0.00045025522681816586, 'samples': 16504832, 'steps': 32235, 'loss/train': 2.043834924697876} +03/05/2022 03:21:02 - INFO - codeparrot_training - Step 32236: {'lr': 0.0004502520499628659, 'samples': 16505344, 'steps': 32236, 'loss/train': 1.6013840436935425} +03/05/2022 03:21:02 - INFO - codeparrot_training - Skipping example with length 198 (seq_length=1024) +03/05/2022 03:21:07 - INFO - codeparrot_training - Step 32237: {'lr': 0.00045024887301733555, 'samples': 16505856, 'steps': 32237, 'loss/train': 2.0295398235321045} +03/05/2022 03:21:10 - INFO - codeparrot_training - Step 32238: {'lr': 0.0004502456959815761, 'samples': 16506368, 'steps': 32238, 'loss/train': 2.553128719329834} +03/05/2022 03:21:11 - INFO - codeparrot_training - Skipping example with length 1008 (seq_length=1024) +03/05/2022 03:21:15 - INFO - codeparrot_training - Step 32239: {'lr': 0.000450242518855589, 'samples': 16506880, 'steps': 32239, 'loss/train': 1.6728880405426025} +03/05/2022 03:21:19 - INFO - codeparrot_training - Step 32240: {'lr': 0.00045023934163937565, 'samples': 16507392, 'steps': 32240, 'loss/train': 1.971681833267212} +03/05/2022 03:21:19 - INFO - codeparrot_training - Skipping example with length 738 (seq_length=1024) +03/05/2022 03:21:24 - INFO - codeparrot_training - Step 32241: {'lr': 0.00045023616433293763, 'samples': 16507904, 'steps': 32241, 'loss/train': 2.336901903152466} +03/05/2022 03:21:27 - INFO - codeparrot_training - Step 32242: {'lr': 0.00045023298693627626, 'samples': 16508416, 'steps': 32242, 'loss/train': 1.8789466619491577} +03/05/2022 03:21:27 - INFO - codeparrot_training - Skipping example with length 540 (seq_length=1024) +03/05/2022 03:21:32 - INFO - codeparrot_training - Step 32243: {'lr': 0.000450229809449393, 'samples': 16508928, 'steps': 32243, 'loss/train': 1.7914034128189087} +03/05/2022 03:21:36 - INFO - codeparrot_training - Step 32244: {'lr': 0.00045022663187228927, 'samples': 16509440, 'steps': 32244, 'loss/train': 1.4560041427612305} +03/05/2022 03:21:36 - INFO - codeparrot_training - Skipping example with length 978 (seq_length=1024) +03/05/2022 03:21:41 - INFO - codeparrot_training - Step 32245: {'lr': 0.0004502234542049666, 'samples': 16509952, 'steps': 32245, 'loss/train': 1.5970028638839722} +03/05/2022 03:21:44 - INFO - codeparrot_training - Step 32246: {'lr': 0.00045022027644742624, 'samples': 16510464, 'steps': 32246, 'loss/train': 1.4289735555648804} +03/05/2022 03:21:44 - INFO - codeparrot_training - Skipping example with length 741 (seq_length=1024) +03/05/2022 03:21:49 - INFO - codeparrot_training - Step 32247: {'lr': 0.0004502170985996697, 'samples': 16510976, 'steps': 32247, 'loss/train': 1.6264692544937134} +03/05/2022 03:21:53 - INFO - codeparrot_training - Step 32248: {'lr': 0.00045021392066169844, 'samples': 16511488, 'steps': 32248, 'loss/train': 1.421189546585083} +03/05/2022 03:21:53 - INFO - codeparrot_training - Skipping example with length 439 (seq_length=1024) +03/05/2022 03:21:58 - INFO - codeparrot_training - Step 32249: {'lr': 0.0004502107426335139, 'samples': 16512000, 'steps': 32249, 'loss/train': 2.609271287918091} +03/05/2022 03:22:01 - INFO - codeparrot_training - Step 32250: {'lr': 0.0004502075645151175, 'samples': 16512512, 'steps': 32250, 'loss/train': 1.727664589881897} +03/05/2022 03:22:01 - INFO - codeparrot_training - Skipping example with length 673 (seq_length=1024) +03/05/2022 03:22:07 - INFO - codeparrot_training - Step 32251: {'lr': 0.0004502043863065106, 'samples': 16513024, 'steps': 32251, 'loss/train': 1.205125331878662} +03/05/2022 03:22:10 - INFO - codeparrot_training - Step 32252: {'lr': 0.00045020120800769474, 'samples': 16513536, 'steps': 32252, 'loss/train': 2.233844757080078} +03/05/2022 03:22:12 - INFO - codeparrot_training - Skipping example with length 718 (seq_length=1024) +03/05/2022 03:22:16 - INFO - codeparrot_training - Step 32253: {'lr': 0.0004501980296186713, 'samples': 16514048, 'steps': 32253, 'loss/train': 1.241442322731018} +03/05/2022 03:22:20 - INFO - codeparrot_training - Step 32254: {'lr': 0.0004501948511394417, 'samples': 16514560, 'steps': 32254, 'loss/train': 1.125423550605774} +03/05/2022 03:22:23 - INFO - codeparrot_training - Step 32255: {'lr': 0.0004501916725700074, 'samples': 16515072, 'steps': 32255, 'loss/train': 0.8903215527534485} +03/05/2022 03:22:25 - INFO - codeparrot_training - Skipping example with length 108 (seq_length=1024) +03/05/2022 03:22:28 - INFO - codeparrot_training - Step 32256: {'lr': 0.00045018849391036987, 'samples': 16515584, 'steps': 32256, 'loss/train': 0.8482746481895447} +03/05/2022 03:22:31 - INFO - codeparrot_training - Step 32257: {'lr': 0.00045018531516053046, 'samples': 16516096, 'steps': 32257, 'loss/train': 0.825526773929596} +03/05/2022 03:22:33 - INFO - codeparrot_training - Skipping example with length 102 (seq_length=1024) +03/05/2022 03:22:36 - INFO - codeparrot_training - Step 32258: {'lr': 0.0004501821363204906, 'samples': 16516608, 'steps': 32258, 'loss/train': 1.883768916130066} +03/05/2022 03:22:39 - INFO - codeparrot_training - Step 32259: {'lr': 0.00045017895739025185, 'samples': 16517120, 'steps': 32259, 'loss/train': 1.5496797561645508} +03/05/2022 03:22:41 - INFO - codeparrot_training - Skipping example with length 294 (seq_length=1024) +03/05/2022 03:22:45 - INFO - codeparrot_training - Step 32260: {'lr': 0.0004501757783698154, 'samples': 16517632, 'steps': 32260, 'loss/train': 1.793108582496643} +03/05/2022 03:22:48 - INFO - codeparrot_training - Step 32261: {'lr': 0.00045017259925918295, 'samples': 16518144, 'steps': 32261, 'loss/train': 1.7173904180526733} +03/05/2022 03:22:52 - INFO - codeparrot_training - Step 32262: {'lr': 0.0004501694200583558, 'samples': 16518656, 'steps': 32262, 'loss/train': 1.8365219831466675} +03/05/2022 03:22:52 - INFO - codeparrot_training - Skipping example with length 274 (seq_length=1024) +03/05/2022 03:22:57 - INFO - codeparrot_training - Step 32263: {'lr': 0.0004501662407673354, 'samples': 16519168, 'steps': 32263, 'loss/train': 2.000492572784424} +03/05/2022 03:23:00 - INFO - codeparrot_training - Step 32264: {'lr': 0.00045016306138612313, 'samples': 16519680, 'steps': 32264, 'loss/train': 1.648452877998352} +03/05/2022 03:23:00 - INFO - codeparrot_training - Skipping example with length 926 (seq_length=1024) +03/05/2022 03:23:05 - INFO - codeparrot_training - Step 32265: {'lr': 0.0004501598819147205, 'samples': 16520192, 'steps': 32265, 'loss/train': 0.06549766659736633} +03/05/2022 03:23:08 - INFO - codeparrot_training - Step 32266: {'lr': 0.00045015670235312895, 'samples': 16520704, 'steps': 32266, 'loss/train': 2.324337959289551} +03/05/2022 03:23:09 - INFO - codeparrot_training - Skipping example with length 784 (seq_length=1024) +03/05/2022 03:23:14 - INFO - codeparrot_training - Step 32267: {'lr': 0.0004501535227013498, 'samples': 16521216, 'steps': 32267, 'loss/train': 1.3472681045532227} +03/05/2022 03:23:17 - INFO - codeparrot_training - Step 32268: {'lr': 0.0004501503429593846, 'samples': 16521728, 'steps': 32268, 'loss/train': 1.4270840883255005} +03/05/2022 03:23:17 - INFO - codeparrot_training - Skipping example with length 707 (seq_length=1024) +03/05/2022 03:23:22 - INFO - codeparrot_training - Step 32269: {'lr': 0.0004501471631272348, 'samples': 16522240, 'steps': 32269, 'loss/train': 2.351712465286255} +03/05/2022 03:23:25 - INFO - codeparrot_training - Step 32270: {'lr': 0.00045014398320490173, 'samples': 16522752, 'steps': 32270, 'loss/train': 1.6424205303192139} +03/05/2022 03:23:25 - INFO - codeparrot_training - Skipping example with length 643 (seq_length=1024) +03/05/2022 03:23:30 - INFO - codeparrot_training - Step 32271: {'lr': 0.00045014080319238686, 'samples': 16523264, 'steps': 32271, 'loss/train': 1.97561776638031} +03/05/2022 03:23:34 - INFO - codeparrot_training - Step 32272: {'lr': 0.00045013762308969164, 'samples': 16523776, 'steps': 32272, 'loss/train': 2.1698272228240967} +03/05/2022 03:23:34 - INFO - codeparrot_training - Skipping example with length 261 (seq_length=1024) +03/05/2022 03:23:39 - INFO - codeparrot_training - Step 32273: {'lr': 0.00045013444289681757, 'samples': 16524288, 'steps': 32273, 'loss/train': 1.9056363105773926} +03/05/2022 03:23:42 - INFO - codeparrot_training - Skipping example with length 553 (seq_length=1024) +03/05/2022 03:23:44 - INFO - codeparrot_training - Step 32274: {'lr': 0.0004501312626137659, 'samples': 16524800, 'steps': 32274, 'loss/train': 1.9683963060379028} +03/05/2022 03:23:47 - INFO - codeparrot_training - Step 32275: {'lr': 0.0004501280822405382, 'samples': 16525312, 'steps': 32275, 'loss/train': 2.3114662170410156} +03/05/2022 03:23:50 - INFO - codeparrot_training - Skipping example with length 437 (seq_length=1024) +03/05/2022 03:23:52 - INFO - codeparrot_training - Step 32276: {'lr': 0.00045012490177713586, 'samples': 16525824, 'steps': 32276, 'loss/train': 0.7880001664161682} +03/05/2022 03:23:56 - INFO - codeparrot_training - Step 32277: {'lr': 0.00045012172122356036, 'samples': 16526336, 'steps': 32277, 'loss/train': 1.8203128576278687} +03/05/2022 03:23:59 - INFO - codeparrot_training - Step 32278: {'lr': 0.0004501185405798131, 'samples': 16526848, 'steps': 32278, 'loss/train': 1.8460109233856201} +03/05/2022 03:23:59 - INFO - codeparrot_training - Skipping example with length 875 (seq_length=1024) +03/05/2022 03:24:04 - INFO - codeparrot_training - Step 32279: {'lr': 0.00045011535984589544, 'samples': 16527360, 'steps': 32279, 'loss/train': 1.252022385597229} +03/05/2022 03:24:07 - INFO - codeparrot_training - Skipping example with length 90 (seq_length=1024) +03/05/2022 03:24:09 - INFO - codeparrot_training - Step 32280: {'lr': 0.000450112179021809, 'samples': 16527872, 'steps': 32280, 'loss/train': 1.2211589813232422} +03/05/2022 03:24:13 - INFO - codeparrot_training - Step 32281: {'lr': 0.00045010899810755506, 'samples': 16528384, 'steps': 32281, 'loss/train': 2.2352893352508545} +03/05/2022 03:24:15 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 03:24:18 - INFO - codeparrot_training - Step 32282: {'lr': 0.00045010581710313506, 'samples': 16528896, 'steps': 32282, 'loss/train': 1.7220207452774048} +03/05/2022 03:24:21 - INFO - codeparrot_training - Step 32283: {'lr': 0.0004501026360085505, 'samples': 16529408, 'steps': 32283, 'loss/train': 1.5309308767318726} +03/05/2022 03:24:24 - INFO - codeparrot_training - Step 32284: {'lr': 0.0004500994548238028, 'samples': 16529920, 'steps': 32284, 'loss/train': 2.028325080871582} +03/05/2022 03:24:25 - INFO - codeparrot_training - Skipping example with length 164 (seq_length=1024) +03/05/2022 03:24:29 - INFO - codeparrot_training - Step 32285: {'lr': 0.00045009627354889337, 'samples': 16530432, 'steps': 32285, 'loss/train': 1.9448999166488647} +03/05/2022 03:24:33 - INFO - codeparrot_training - Step 32286: {'lr': 0.0004500930921838236, 'samples': 16530944, 'steps': 32286, 'loss/train': 1.9928890466690063} +03/05/2022 03:24:33 - INFO - codeparrot_training - Skipping example with length 710 (seq_length=1024) +03/05/2022 03:24:38 - INFO - codeparrot_training - Step 32287: {'lr': 0.000450089910728595, 'samples': 16531456, 'steps': 32287, 'loss/train': 1.5635994672775269} +03/05/2022 03:24:41 - INFO - codeparrot_training - Step 32288: {'lr': 0.0004500867291832089, 'samples': 16531968, 'steps': 32288, 'loss/train': 2.0142176151275635} +03/05/2022 03:24:41 - INFO - codeparrot_training - Skipping example with length 101 (seq_length=1024) +03/05/2022 03:24:46 - INFO - codeparrot_training - Step 32289: {'lr': 0.00045008354754766687, 'samples': 16532480, 'steps': 32289, 'loss/train': 1.439382553100586} +03/05/2022 03:24:49 - INFO - codeparrot_training - Step 32290: {'lr': 0.0004500803658219703, 'samples': 16532992, 'steps': 32290, 'loss/train': 1.4623559713363647} +03/05/2022 03:24:50 - INFO - codeparrot_training - Skipping example with length 1011 (seq_length=1024) +03/05/2022 03:24:55 - INFO - codeparrot_training - Step 32291: {'lr': 0.0004500771840061206, 'samples': 16533504, 'steps': 32291, 'loss/train': 1.6388386487960815} +03/05/2022 03:24:58 - INFO - codeparrot_training - Step 32292: {'lr': 0.00045007400210011925, 'samples': 16534016, 'steps': 32292, 'loss/train': 3.134432077407837} +03/05/2022 03:24:59 - INFO - codeparrot_training - Skipping example with length 176 (seq_length=1024) +03/05/2022 03:25:03 - INFO - codeparrot_training - Step 32293: {'lr': 0.0004500708201039676, 'samples': 16534528, 'steps': 32293, 'loss/train': 0.8969138264656067} +03/05/2022 03:25:06 - INFO - codeparrot_training - Step 32294: {'lr': 0.0004500676380176671, 'samples': 16535040, 'steps': 32294, 'loss/train': 1.2729841470718384} +03/05/2022 03:25:07 - INFO - codeparrot_training - Skipping example with length 366 (seq_length=1024) +03/05/2022 03:25:12 - INFO - codeparrot_training - Step 32295: {'lr': 0.00045006445584121923, 'samples': 16535552, 'steps': 32295, 'loss/train': 1.509150505065918} +03/05/2022 03:25:15 - INFO - codeparrot_training - Step 32296: {'lr': 0.00045006127357462533, 'samples': 16536064, 'steps': 32296, 'loss/train': 2.2414145469665527} +03/05/2022 03:25:15 - INFO - codeparrot_training - Skipping example with length 620 (seq_length=1024) +03/05/2022 03:25:20 - INFO - codeparrot_training - Step 32297: {'lr': 0.000450058091217887, 'samples': 16536576, 'steps': 32297, 'loss/train': 2.2631585597991943} +03/05/2022 03:25:23 - INFO - codeparrot_training - Step 32298: {'lr': 0.0004500549087710056, 'samples': 16537088, 'steps': 32298, 'loss/train': 1.9179980754852295} +03/05/2022 03:25:23 - INFO - codeparrot_training - Skipping example with length 302 (seq_length=1024) +03/05/2022 03:25:28 - INFO - codeparrot_training - Step 32299: {'lr': 0.0004500517262339825, 'samples': 16537600, 'steps': 32299, 'loss/train': 2.2595155239105225} +03/05/2022 03:25:32 - INFO - codeparrot_training - Step 32300: {'lr': 0.0004500485436068191, 'samples': 16538112, 'steps': 32300, 'loss/train': 1.7985758781433105} +03/05/2022 03:25:32 - INFO - codeparrot_training - Skipping example with length 633 (seq_length=1024) +03/05/2022 03:25:37 - INFO - codeparrot_training - Step 32301: {'lr': 0.0004500453608895171, 'samples': 16538624, 'steps': 32301, 'loss/train': 1.3893694877624512} +03/05/2022 03:25:39 - INFO - codeparrot_training - Skipping example with length 246 (seq_length=1024) +03/05/2022 03:25:42 - INFO - codeparrot_training - Step 32302: {'lr': 0.00045004217808207757, 'samples': 16539136, 'steps': 32302, 'loss/train': 1.904556393623352} +03/05/2022 03:25:45 - INFO - codeparrot_training - Step 32303: {'lr': 0.0004500389951845022, 'samples': 16539648, 'steps': 32303, 'loss/train': 0.8378501534461975} +03/05/2022 03:25:48 - INFO - codeparrot_training - Skipping example with length 48 (seq_length=1024) +03/05/2022 03:25:50 - INFO - codeparrot_training - Step 32304: {'lr': 0.00045003581219679235, 'samples': 16540160, 'steps': 32304, 'loss/train': 1.7698394060134888} +03/05/2022 03:25:54 - INFO - codeparrot_training - Step 32305: {'lr': 0.00045003262911894943, 'samples': 16540672, 'steps': 32305, 'loss/train': 1.7045574188232422} +03/05/2022 03:25:56 - INFO - codeparrot_training - Skipping example with length 273 (seq_length=1024) +03/05/2022 03:25:59 - INFO - codeparrot_training - Step 32306: {'lr': 0.00045002944595097494, 'samples': 16541184, 'steps': 32306, 'loss/train': 1.4119954109191895} +03/05/2022 03:26:02 - INFO - codeparrot_training - Step 32307: {'lr': 0.00045002626269287024, 'samples': 16541696, 'steps': 32307, 'loss/train': 1.9988905191421509} +03/05/2022 03:26:05 - INFO - codeparrot_training - Skipping example with length 884 (seq_length=1024) +03/05/2022 03:26:07 - INFO - codeparrot_training - Step 32308: {'lr': 0.00045002307934463673, 'samples': 16542208, 'steps': 32308, 'loss/train': 1.3723077774047852} +03/05/2022 03:26:11 - INFO - codeparrot_training - Step 32309: {'lr': 0.000450019895906276, 'samples': 16542720, 'steps': 32309, 'loss/train': 1.920534610748291} +03/05/2022 03:26:13 - INFO - codeparrot_training - Skipping example with length 80 (seq_length=1024) +03/05/2022 03:26:16 - INFO - codeparrot_training - Step 32310: {'lr': 0.0004500167123777894, 'samples': 16543232, 'steps': 32310, 'loss/train': 1.4552727937698364} +03/05/2022 03:26:19 - INFO - codeparrot_training - Step 32311: {'lr': 0.00045001352875917824, 'samples': 16543744, 'steps': 32311, 'loss/train': 1.1241849660873413} +03/05/2022 03:26:22 - INFO - codeparrot_training - Skipping example with length 693 (seq_length=1024) +03/05/2022 03:26:24 - INFO - codeparrot_training - Step 32312: {'lr': 0.00045001034505044415, 'samples': 16544256, 'steps': 32312, 'loss/train': 1.3802741765975952} +03/05/2022 03:26:28 - INFO - codeparrot_training - Step 32313: {'lr': 0.00045000716125158846, 'samples': 16544768, 'steps': 32313, 'loss/train': 1.64714777469635} +03/05/2022 03:26:30 - INFO - codeparrot_training - Skipping example with length 657 (seq_length=1024) +03/05/2022 03:26:33 - INFO - codeparrot_training - Step 32314: {'lr': 0.0004500039773626127, 'samples': 16545280, 'steps': 32314, 'loss/train': 1.0032775402069092} +03/05/2022 03:26:36 - INFO - codeparrot_training - Step 32315: {'lr': 0.00045000079338351805, 'samples': 16545792, 'steps': 32315, 'loss/train': 1.7638407945632935} +03/05/2022 03:26:38 - INFO - codeparrot_training - Skipping example with length 410 (seq_length=1024) +03/05/2022 03:26:41 - INFO - codeparrot_training - Step 32316: {'lr': 0.0004499976093143063, 'samples': 16546304, 'steps': 32316, 'loss/train': 1.1470493078231812} +03/05/2022 03:26:44 - INFO - codeparrot_training - Step 32317: {'lr': 0.00044999442515497866, 'samples': 16546816, 'steps': 32317, 'loss/train': 0.05779756233096123} +03/05/2022 03:26:47 - INFO - codeparrot_training - Skipping example with length 477 (seq_length=1024) +03/05/2022 03:26:50 - INFO - codeparrot_training - Step 32318: {'lr': 0.0004499912409055367, 'samples': 16547328, 'steps': 32318, 'loss/train': 1.5817676782608032} +03/05/2022 03:26:53 - INFO - codeparrot_training - Step 32319: {'lr': 0.0004499880565659816, 'samples': 16547840, 'steps': 32319, 'loss/train': 1.6074827909469604} +03/05/2022 03:26:55 - INFO - codeparrot_training - Skipping example with length 436 (seq_length=1024) +03/05/2022 03:26:58 - INFO - codeparrot_training - Step 32320: {'lr': 0.0004499848721363151, 'samples': 16548352, 'steps': 32320, 'loss/train': 0.7577037811279297} +03/05/2022 03:27:01 - INFO - codeparrot_training - Step 32321: {'lr': 0.0004499816876165385, 'samples': 16548864, 'steps': 32321, 'loss/train': 1.8371872901916504} +03/05/2022 03:27:03 - INFO - codeparrot_training - Skipping example with length 190 (seq_length=1024) +03/05/2022 03:27:06 - INFO - codeparrot_training - Step 32322: {'lr': 0.0004499785030066532, 'samples': 16549376, 'steps': 32322, 'loss/train': 1.3737050294876099} +03/05/2022 03:27:10 - INFO - codeparrot_training - Step 32323: {'lr': 0.00044997531830666073, 'samples': 16549888, 'steps': 32323, 'loss/train': 1.1425515413284302} +03/05/2022 03:27:11 - INFO - codeparrot_training - Skipping example with length 942 (seq_length=1024) +03/05/2022 03:27:15 - INFO - codeparrot_training - Step 32324: {'lr': 0.00044997213351656237, 'samples': 16550400, 'steps': 32324, 'loss/train': 2.078904151916504} +03/05/2022 03:27:18 - INFO - codeparrot_training - Step 32325: {'lr': 0.00044996894863635965, 'samples': 16550912, 'steps': 32325, 'loss/train': 1.033521294593811} +03/05/2022 03:27:19 - INFO - codeparrot_training - Skipping example with length 314 (seq_length=1024) +03/05/2022 03:27:23 - INFO - codeparrot_training - Step 32326: {'lr': 0.00044996576366605415, 'samples': 16551424, 'steps': 32326, 'loss/train': 1.375506043434143} +03/05/2022 03:27:27 - INFO - codeparrot_training - Step 32327: {'lr': 0.00044996257860564705, 'samples': 16551936, 'steps': 32327, 'loss/train': 1.5657107830047607} +03/05/2022 03:27:28 - INFO - codeparrot_training - Skipping example with length 484 (seq_length=1024) +03/05/2022 03:27:32 - INFO - codeparrot_training - Step 32328: {'lr': 0.0004499593934551399, 'samples': 16552448, 'steps': 32328, 'loss/train': 0.695310652256012} +03/05/2022 03:27:35 - INFO - codeparrot_training - Step 32329: {'lr': 0.00044995620821453416, 'samples': 16552960, 'steps': 32329, 'loss/train': 2.174541711807251} +03/05/2022 03:27:37 - INFO - codeparrot_training - Skipping example with length 1005 (seq_length=1024) +03/05/2022 03:27:40 - INFO - codeparrot_training - Step 32330: {'lr': 0.00044995302288383123, 'samples': 16553472, 'steps': 32330, 'loss/train': 1.5241491794586182} +03/05/2022 03:27:44 - INFO - codeparrot_training - Step 32331: {'lr': 0.0004499498374630325, 'samples': 16553984, 'steps': 32331, 'loss/train': 0.1514754742383957} +03/05/2022 03:27:45 - INFO - codeparrot_training - Skipping example with length 57 (seq_length=1024) +03/05/2022 03:27:49 - INFO - codeparrot_training - Step 32332: {'lr': 0.0004499466519521396, 'samples': 16554496, 'steps': 32332, 'loss/train': 1.6864006519317627} +03/05/2022 03:27:52 - INFO - codeparrot_training - Step 32333: {'lr': 0.00044994346635115367, 'samples': 16555008, 'steps': 32333, 'loss/train': 2.1539382934570312} +03/05/2022 03:27:54 - INFO - codeparrot_training - Skipping example with length 45 (seq_length=1024) +03/05/2022 03:27:57 - INFO - codeparrot_training - Step 32334: {'lr': 0.00044994028066007636, 'samples': 16555520, 'steps': 32334, 'loss/train': 1.7117948532104492} +03/05/2022 03:28:00 - INFO - codeparrot_training - Step 32335: {'lr': 0.00044993709487890906, 'samples': 16556032, 'steps': 32335, 'loss/train': 1.5427757501602173} +03/05/2022 03:28:02 - INFO - codeparrot_training - Skipping example with length 438 (seq_length=1024) +03/05/2022 03:28:06 - INFO - codeparrot_training - Step 32336: {'lr': 0.0004499339090076532, 'samples': 16556544, 'steps': 32336, 'loss/train': 2.479074716567993} +03/05/2022 03:28:09 - INFO - codeparrot_training - Step 32337: {'lr': 0.0004499307230463102, 'samples': 16557056, 'steps': 32337, 'loss/train': 0.3770645558834076} +03/05/2022 03:28:10 - INFO - codeparrot_training - Skipping example with length 482 (seq_length=1024) +03/05/2022 03:28:14 - INFO - codeparrot_training - Step 32338: {'lr': 0.0004499275369948814, 'samples': 16557568, 'steps': 32338, 'loss/train': 1.9286540746688843} +03/05/2022 03:28:17 - INFO - codeparrot_training - Step 32339: {'lr': 0.0004499243508533685, 'samples': 16558080, 'steps': 32339, 'loss/train': 1.272286295890808} +03/05/2022 03:28:19 - INFO - codeparrot_training - Skipping example with length 386 (seq_length=1024) +03/05/2022 03:28:22 - INFO - codeparrot_training - Step 32340: {'lr': 0.0004499211646217727, 'samples': 16558592, 'steps': 32340, 'loss/train': 1.1806715726852417} +03/05/2022 03:28:26 - INFO - codeparrot_training - Step 32341: {'lr': 0.00044991797830009543, 'samples': 16559104, 'steps': 32341, 'loss/train': 1.5442988872528076} +03/05/2022 03:28:27 - INFO - codeparrot_training - Skipping example with length 180 (seq_length=1024) +03/05/2022 03:28:31 - INFO - codeparrot_training - Step 32342: {'lr': 0.00044991479188833826, 'samples': 16559616, 'steps': 32342, 'loss/train': 1.6451743841171265} +03/05/2022 03:28:34 - INFO - codeparrot_training - Step 32343: {'lr': 0.0004499116053865026, 'samples': 16560128, 'steps': 32343, 'loss/train': 1.5627999305725098} +03/05/2022 03:28:36 - INFO - codeparrot_training - Skipping example with length 352 (seq_length=1024) +03/05/2022 03:28:39 - INFO - codeparrot_training - Step 32344: {'lr': 0.0004499084187945899, 'samples': 16560640, 'steps': 32344, 'loss/train': 1.28183114528656} +03/05/2022 03:28:43 - INFO - codeparrot_training - Step 32345: {'lr': 0.0004499052321126015, 'samples': 16561152, 'steps': 32345, 'loss/train': 1.1448712348937988} +03/05/2022 03:28:44 - INFO - codeparrot_training - Skipping example with length 580 (seq_length=1024) +03/05/2022 03:28:48 - INFO - codeparrot_training - Step 32346: {'lr': 0.0004499020453405388, 'samples': 16561664, 'steps': 32346, 'loss/train': 1.6410918235778809} +03/05/2022 03:28:51 - INFO - codeparrot_training - Step 32347: {'lr': 0.00044989885847840344, 'samples': 16562176, 'steps': 32347, 'loss/train': 0.5534372329711914} +03/05/2022 03:28:53 - INFO - codeparrot_training - Skipping example with length 391 (seq_length=1024) +03/05/2022 03:28:56 - INFO - codeparrot_training - Step 32348: {'lr': 0.0004498956715261967, 'samples': 16562688, 'steps': 32348, 'loss/train': 1.2939332723617554} +03/05/2022 03:29:00 - INFO - codeparrot_training - Step 32349: {'lr': 0.00044989248448392007, 'samples': 16563200, 'steps': 32349, 'loss/train': 2.1184158325195312} +03/05/2022 03:29:01 - INFO - codeparrot_training - Skipping example with length 921 (seq_length=1024) +03/05/2022 03:29:05 - INFO - codeparrot_training - Step 32350: {'lr': 0.000449889297351575, 'samples': 16563712, 'steps': 32350, 'loss/train': 1.7678813934326172} +03/05/2022 03:29:08 - INFO - codeparrot_training - Step 32351: {'lr': 0.0004498861101291628, 'samples': 16564224, 'steps': 32351, 'loss/train': 1.0438998937606812} +03/05/2022 03:29:09 - INFO - codeparrot_training - Skipping example with length 934 (seq_length=1024) +03/05/2022 03:29:13 - INFO - codeparrot_training - Step 32352: {'lr': 0.0004498829228166851, 'samples': 16564736, 'steps': 32352, 'loss/train': 2.2826428413391113} +03/05/2022 03:29:16 - INFO - codeparrot_training - Step 32353: {'lr': 0.0004498797354141432, 'samples': 16565248, 'steps': 32353, 'loss/train': 1.643843650817871} +03/05/2022 03:29:18 - INFO - codeparrot_training - Skipping example with length 7 (seq_length=1024) +03/05/2022 03:29:21 - INFO - codeparrot_training - Step 32354: {'lr': 0.00044987654792153853, 'samples': 16565760, 'steps': 32354, 'loss/train': 1.048097848892212} +03/05/2022 03:29:25 - INFO - codeparrot_training - Step 32355: {'lr': 0.0004498733603388726, 'samples': 16566272, 'steps': 32355, 'loss/train': 1.6934741735458374} +03/05/2022 03:29:26 - INFO - codeparrot_training - Skipping example with length 399 (seq_length=1024) +03/05/2022 03:29:30 - INFO - codeparrot_training - Step 32356: {'lr': 0.00044987017266614684, 'samples': 16566784, 'steps': 32356, 'loss/train': 2.504734516143799} +03/05/2022 03:29:33 - INFO - codeparrot_training - Step 32357: {'lr': 0.00044986698490336263, 'samples': 16567296, 'steps': 32357, 'loss/train': 1.7436622381210327} +03/05/2022 03:29:34 - INFO - codeparrot_training - Skipping example with length 829 (seq_length=1024) +03/05/2022 03:29:38 - INFO - codeparrot_training - Step 32358: {'lr': 0.0004498637970505215, 'samples': 16567808, 'steps': 32358, 'loss/train': 1.7143983840942383} +03/05/2022 03:29:41 - INFO - codeparrot_training - Step 32359: {'lr': 0.0004498606091076248, 'samples': 16568320, 'steps': 32359, 'loss/train': 1.8568686246871948} +03/05/2022 03:29:42 - INFO - codeparrot_training - Skipping example with length 477 (seq_length=1024) +03/05/2022 03:29:47 - INFO - codeparrot_training - Step 32360: {'lr': 0.000449857421074674, 'samples': 16568832, 'steps': 32360, 'loss/train': 2.122437000274658} +03/05/2022 03:29:50 - INFO - codeparrot_training - Step 32361: {'lr': 0.0004498542329516705, 'samples': 16569344, 'steps': 32361, 'loss/train': 1.5481361150741577} +03/05/2022 03:29:52 - INFO - codeparrot_training - Skipping example with length 643 (seq_length=1024) +03/05/2022 03:29:55 - INFO - codeparrot_training - Step 32362: {'lr': 0.00044985104473861583, 'samples': 16569856, 'steps': 32362, 'loss/train': 1.305768609046936} +03/05/2022 03:29:58 - INFO - codeparrot_training - Step 32363: {'lr': 0.0004498478564355113, 'samples': 16570368, 'steps': 32363, 'loss/train': 1.6269898414611816} +03/05/2022 03:30:00 - INFO - codeparrot_training - Skipping example with length 1007 (seq_length=1024) +03/05/2022 03:30:04 - INFO - codeparrot_training - Step 32364: {'lr': 0.0004498446680423584, 'samples': 16570880, 'steps': 32364, 'loss/train': 1.9101046323776245} +03/05/2022 03:30:07 - INFO - codeparrot_training - Step 32365: {'lr': 0.0004498414795591586, 'samples': 16571392, 'steps': 32365, 'loss/train': 1.536567211151123} +03/05/2022 03:30:09 - INFO - codeparrot_training - Skipping example with length 581 (seq_length=1024) +03/05/2022 03:30:12 - INFO - codeparrot_training - Step 32366: {'lr': 0.00044983829098591336, 'samples': 16571904, 'steps': 32366, 'loss/train': 1.50094735622406} +03/05/2022 03:30:15 - INFO - codeparrot_training - Step 32367: {'lr': 0.00044983510232262405, 'samples': 16572416, 'steps': 32367, 'loss/train': 1.4778085947036743} +03/05/2022 03:30:17 - INFO - codeparrot_training - Skipping example with length 444 (seq_length=1024) +03/05/2022 03:30:21 - INFO - codeparrot_training - Step 32368: {'lr': 0.0004498319135692921, 'samples': 16572928, 'steps': 32368, 'loss/train': 2.0233843326568604} +03/05/2022 03:30:24 - INFO - codeparrot_training - Step 32369: {'lr': 0.00044982872472591897, 'samples': 16573440, 'steps': 32369, 'loss/train': 1.9142979383468628} +03/05/2022 03:30:25 - INFO - codeparrot_training - Skipping example with length 17 (seq_length=1024) +03/05/2022 03:30:29 - INFO - codeparrot_training - Step 32370: {'lr': 0.00044982553579250606, 'samples': 16573952, 'steps': 32370, 'loss/train': 2.364659547805786} +03/05/2022 03:30:32 - INFO - codeparrot_training - Step 32371: {'lr': 0.0004498223467690549, 'samples': 16574464, 'steps': 32371, 'loss/train': 1.2702393531799316} +03/05/2022 03:30:34 - INFO - codeparrot_training - Skipping example with length 849 (seq_length=1024) +03/05/2022 03:30:38 - INFO - codeparrot_training - Step 32372: {'lr': 0.0004498191576555669, 'samples': 16574976, 'steps': 32372, 'loss/train': 2.0149991512298584} +03/05/2022 03:30:41 - INFO - codeparrot_training - Step 32373: {'lr': 0.00044981596845204344, 'samples': 16575488, 'steps': 32373, 'loss/train': 1.873853325843811} +03/05/2022 03:30:43 - INFO - codeparrot_training - Skipping example with length 39 (seq_length=1024) +03/05/2022 03:30:46 - INFO - codeparrot_training - Step 32374: {'lr': 0.00044981277915848595, 'samples': 16576000, 'steps': 32374, 'loss/train': 0.9891318082809448} +03/05/2022 03:30:49 - INFO - codeparrot_training - Step 32375: {'lr': 0.00044980958977489593, 'samples': 16576512, 'steps': 32375, 'loss/train': 1.9771904945373535} +03/05/2022 03:30:51 - INFO - codeparrot_training - Skipping example with length 292 (seq_length=1024) +03/05/2022 03:30:54 - INFO - codeparrot_training - Step 32376: {'lr': 0.00044980640030127484, 'samples': 16577024, 'steps': 32376, 'loss/train': 1.327635645866394} +03/05/2022 03:30:57 - INFO - codeparrot_training - Step 32377: {'lr': 0.00044980321073762405, 'samples': 16577536, 'steps': 32377, 'loss/train': 1.2788350582122803} +03/05/2022 03:30:59 - INFO - codeparrot_training - Skipping example with length 46 (seq_length=1024) +03/05/2022 03:31:03 - INFO - codeparrot_training - Step 32378: {'lr': 0.00044980002108394496, 'samples': 16578048, 'steps': 32378, 'loss/train': 1.1805237531661987} +03/05/2022 03:31:06 - INFO - codeparrot_training - Step 32379: {'lr': 0.0004497968313402391, 'samples': 16578560, 'steps': 32379, 'loss/train': 1.724697232246399} +03/05/2022 03:31:07 - INFO - codeparrot_training - Skipping example with length 954 (seq_length=1024) +03/05/2022 03:31:11 - INFO - codeparrot_training - Step 32380: {'lr': 0.00044979364150650794, 'samples': 16579072, 'steps': 32380, 'loss/train': 2.061079978942871} +03/05/2022 03:31:14 - INFO - codeparrot_training - Step 32381: {'lr': 0.00044979045158275273, 'samples': 16579584, 'steps': 32381, 'loss/train': 1.7152940034866333} +03/05/2022 03:31:16 - INFO - codeparrot_training - Skipping example with length 861 (seq_length=1024) +03/05/2022 03:31:20 - INFO - codeparrot_training - Step 32382: {'lr': 0.0004497872615689751, 'samples': 16580096, 'steps': 32382, 'loss/train': 1.9621801376342773} +03/05/2022 03:31:23 - INFO - codeparrot_training - Step 32383: {'lr': 0.00044978407146517634, 'samples': 16580608, 'steps': 32383, 'loss/train': 0.3224453032016754} +03/05/2022 03:31:24 - INFO - codeparrot_training - Skipping example with length 648 (seq_length=1024) +03/05/2022 03:31:28 - INFO - codeparrot_training - Step 32384: {'lr': 0.0004497808812713581, 'samples': 16581120, 'steps': 32384, 'loss/train': 1.7872172594070435} +03/05/2022 03:31:31 - INFO - codeparrot_training - Step 32385: {'lr': 0.00044977769098752154, 'samples': 16581632, 'steps': 32385, 'loss/train': 0.6527504920959473} +03/05/2022 03:31:33 - INFO - codeparrot_training - Skipping example with length 107 (seq_length=1024) +03/05/2022 03:31:37 - INFO - codeparrot_training - Step 32386: {'lr': 0.0004497745006136683, 'samples': 16582144, 'steps': 32386, 'loss/train': 1.9129481315612793} +03/05/2022 03:31:40 - INFO - codeparrot_training - Step 32387: {'lr': 0.00044977131014979974, 'samples': 16582656, 'steps': 32387, 'loss/train': 1.2443722486495972} +03/05/2022 03:31:41 - INFO - codeparrot_training - Skipping example with length 304 (seq_length=1024) +03/05/2022 03:31:45 - INFO - codeparrot_training - Step 32388: {'lr': 0.0004497681195959173, 'samples': 16583168, 'steps': 32388, 'loss/train': 1.3849151134490967} +03/05/2022 03:31:48 - INFO - codeparrot_training - Step 32389: {'lr': 0.0004497649289520224, 'samples': 16583680, 'steps': 32389, 'loss/train': 0.22375613451004028} +03/05/2022 03:31:50 - INFO - codeparrot_training - Skipping example with length 510 (seq_length=1024) +03/05/2022 03:31:54 - INFO - codeparrot_training - Step 32390: {'lr': 0.00044976173821811654, 'samples': 16584192, 'steps': 32390, 'loss/train': 1.9322353601455688} +03/05/2022 03:31:57 - INFO - codeparrot_training - Step 32391: {'lr': 0.0004497585473942011, 'samples': 16584704, 'steps': 32391, 'loss/train': 2.339860439300537} +03/05/2022 03:31:59 - INFO - codeparrot_training - Skipping example with length 933 (seq_length=1024) +03/05/2022 03:32:02 - INFO - codeparrot_training - Step 32392: {'lr': 0.0004497553564802776, 'samples': 16585216, 'steps': 32392, 'loss/train': 1.9951239824295044} +03/05/2022 03:32:05 - INFO - codeparrot_training - Step 32393: {'lr': 0.0004497521654763474, 'samples': 16585728, 'steps': 32393, 'loss/train': 1.1290035247802734} +03/05/2022 03:32:07 - INFO - codeparrot_training - Skipping example with length 60 (seq_length=1024) +03/05/2022 03:32:10 - INFO - codeparrot_training - Step 32394: {'lr': 0.0004497489743824119, 'samples': 16586240, 'steps': 32394, 'loss/train': 2.451751470565796} +03/05/2022 03:32:14 - INFO - codeparrot_training - Step 32395: {'lr': 0.0004497457831984727, 'samples': 16586752, 'steps': 32395, 'loss/train': 1.840139389038086} +03/05/2022 03:32:15 - INFO - codeparrot_training - Skipping example with length 19 (seq_length=1024) +03/05/2022 03:32:19 - INFO - codeparrot_training - Step 32396: {'lr': 0.00044974259192453103, 'samples': 16587264, 'steps': 32396, 'loss/train': 3.2688207626342773} +03/05/2022 03:32:22 - INFO - codeparrot_training - Step 32397: {'lr': 0.0004497394005605885, 'samples': 16587776, 'steps': 32397, 'loss/train': 1.2105220556259155} +03/05/2022 03:32:23 - INFO - codeparrot_training - Skipping example with length 901 (seq_length=1024) +03/05/2022 03:32:27 - INFO - codeparrot_training - Step 32398: {'lr': 0.00044973620910664645, 'samples': 16588288, 'steps': 32398, 'loss/train': 1.652271032333374} +03/05/2022 03:32:30 - INFO - codeparrot_training - Step 32399: {'lr': 0.00044973301756270635, 'samples': 16588800, 'steps': 32399, 'loss/train': 1.8055057525634766} +03/05/2022 03:32:32 - INFO - codeparrot_training - Skipping example with length 376 (seq_length=1024) +03/05/2022 03:32:36 - INFO - codeparrot_training - Step 32400: {'lr': 0.0004497298259287696, 'samples': 16589312, 'steps': 32400, 'loss/train': 1.1664719581604004} +03/05/2022 03:32:39 - INFO - codeparrot_training - Step 32401: {'lr': 0.00044972663420483774, 'samples': 16589824, 'steps': 32401, 'loss/train': 1.8694703578948975} +03/05/2022 03:32:40 - INFO - codeparrot_training - Skipping example with length 788 (seq_length=1024) +03/05/2022 03:32:44 - INFO - codeparrot_training - Step 32402: {'lr': 0.00044972344239091206, 'samples': 16590336, 'steps': 32402, 'loss/train': 0.6922139525413513} +03/05/2022 03:32:47 - INFO - codeparrot_training - Step 32403: {'lr': 0.0004497202504869941, 'samples': 16590848, 'steps': 32403, 'loss/train': 2.0953924655914307} +03/05/2022 03:32:49 - INFO - codeparrot_training - Skipping example with length 992 (seq_length=1024) +03/05/2022 03:32:53 - INFO - codeparrot_training - Step 32404: {'lr': 0.0004497170584930853, 'samples': 16591360, 'steps': 32404, 'loss/train': 1.4079786539077759} +03/05/2022 03:32:56 - INFO - codeparrot_training - Step 32405: {'lr': 0.0004497138664091871, 'samples': 16591872, 'steps': 32405, 'loss/train': 1.5663923025131226} +03/05/2022 03:32:59 - INFO - codeparrot_training - Skipping example with length 660 (seq_length=1024) +03/05/2022 03:33:01 - INFO - codeparrot_training - Step 32406: {'lr': 0.00044971067423530087, 'samples': 16592384, 'steps': 32406, 'loss/train': 2.1109795570373535} +03/05/2022 03:33:05 - INFO - codeparrot_training - Step 32407: {'lr': 0.0004497074819714281, 'samples': 16592896, 'steps': 32407, 'loss/train': 1.9000605344772339} +03/05/2022 03:33:07 - INFO - codeparrot_training - Skipping example with length 264 (seq_length=1024) +03/05/2022 03:33:10 - INFO - codeparrot_training - Step 32408: {'lr': 0.00044970428961757026, 'samples': 16593408, 'steps': 32408, 'loss/train': 1.4713932275772095} +03/05/2022 03:33:13 - INFO - codeparrot_training - Step 32409: {'lr': 0.00044970109717372864, 'samples': 16593920, 'steps': 32409, 'loss/train': 2.370283603668213} +03/05/2022 03:33:15 - INFO - codeparrot_training - Skipping example with length 646 (seq_length=1024) +03/05/2022 03:33:18 - INFO - codeparrot_training - Step 32410: {'lr': 0.0004496979046399049, 'samples': 16594432, 'steps': 32410, 'loss/train': 2.0688838958740234} +03/05/2022 03:33:21 - INFO - codeparrot_training - Step 32411: {'lr': 0.00044969471201610037, 'samples': 16594944, 'steps': 32411, 'loss/train': 1.4880917072296143} +03/05/2022 03:33:24 - INFO - codeparrot_training - Skipping example with length 862 (seq_length=1024) +03/05/2022 03:33:27 - INFO - codeparrot_training - Step 32412: {'lr': 0.00044969151930231643, 'samples': 16595456, 'steps': 32412, 'loss/train': 1.0462182760238647} +03/05/2022 03:33:30 - INFO - codeparrot_training - Step 32413: {'lr': 0.00044968832649855455, 'samples': 16595968, 'steps': 32413, 'loss/train': 1.2924472093582153} +03/05/2022 03:33:32 - INFO - codeparrot_training - Skipping example with length 465 (seq_length=1024) +03/05/2022 03:33:35 - INFO - codeparrot_training - Step 32414: {'lr': 0.00044968513360481624, 'samples': 16596480, 'steps': 32414, 'loss/train': 2.191091775894165} +03/05/2022 03:33:39 - INFO - codeparrot_training - Step 32415: {'lr': 0.0004496819406211029, 'samples': 16596992, 'steps': 32415, 'loss/train': 1.7938324213027954} +03/05/2022 03:33:41 - INFO - codeparrot_training - Skipping example with length 561 (seq_length=1024) +03/05/2022 03:33:44 - INFO - codeparrot_training - Step 32416: {'lr': 0.0004496787475474159, 'samples': 16597504, 'steps': 32416, 'loss/train': 1.386800765991211} +03/05/2022 03:33:47 - INFO - codeparrot_training - Step 32417: {'lr': 0.00044967555438375675, 'samples': 16598016, 'steps': 32417, 'loss/train': 1.829301118850708} +03/05/2022 03:33:50 - INFO - codeparrot_training - Skipping example with length 127 (seq_length=1024) +03/05/2022 03:33:52 - INFO - codeparrot_training - Step 32418: {'lr': 0.0004496723611301269, 'samples': 16598528, 'steps': 32418, 'loss/train': 2.0702104568481445} +03/05/2022 03:33:55 - INFO - codeparrot_training - Step 32419: {'lr': 0.00044966916778652776, 'samples': 16599040, 'steps': 32419, 'loss/train': 1.859232783317566} +03/05/2022 03:33:58 - INFO - codeparrot_training - Skipping example with length 87 (seq_length=1024) +03/05/2022 03:34:01 - INFO - codeparrot_training - Step 32420: {'lr': 0.0004496659743529608, 'samples': 16599552, 'steps': 32420, 'loss/train': 2.0355241298675537} +03/05/2022 03:34:04 - INFO - codeparrot_training - Step 32421: {'lr': 0.00044966278082942746, 'samples': 16600064, 'steps': 32421, 'loss/train': 2.117018938064575} +03/05/2022 03:34:07 - INFO - codeparrot_training - Skipping example with length 989 (seq_length=1024) +03/05/2022 03:34:09 - INFO - codeparrot_training - Step 32422: {'lr': 0.000449659587215929, 'samples': 16600576, 'steps': 32422, 'loss/train': 1.6251906156539917} +03/05/2022 03:34:12 - INFO - codeparrot_training - Step 32423: {'lr': 0.0004496563935124672, 'samples': 16601088, 'steps': 32423, 'loss/train': 1.58332097530365} +03/05/2022 03:34:15 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 03:34:18 - INFO - codeparrot_training - Step 32424: {'lr': 0.0004496531997190432, 'samples': 16601600, 'steps': 32424, 'loss/train': 1.653906226158142} +03/05/2022 03:34:21 - INFO - codeparrot_training - Step 32425: {'lr': 0.0004496500058356586, 'samples': 16602112, 'steps': 32425, 'loss/train': 2.4441323280334473} +03/05/2022 03:34:23 - INFO - codeparrot_training - Skipping example with length 446 (seq_length=1024) +03/05/2022 03:34:26 - INFO - codeparrot_training - Step 32426: {'lr': 0.00044964681186231473, 'samples': 16602624, 'steps': 32426, 'loss/train': 2.017547607421875} +03/05/2022 03:34:29 - INFO - codeparrot_training - Step 32427: {'lr': 0.0004496436177990131, 'samples': 16603136, 'steps': 32427, 'loss/train': 1.3357704877853394} +03/05/2022 03:34:31 - INFO - codeparrot_training - Skipping example with length 719 (seq_length=1024) +03/05/2022 03:34:34 - INFO - codeparrot_training - Step 32428: {'lr': 0.0004496404236457552, 'samples': 16603648, 'steps': 32428, 'loss/train': 1.8977664709091187} +03/05/2022 03:34:37 - INFO - codeparrot_training - Step 32429: {'lr': 0.0004496372294025424, 'samples': 16604160, 'steps': 32429, 'loss/train': 1.779232382774353} +03/05/2022 03:34:40 - INFO - codeparrot_training - Skipping example with length 1014 (seq_length=1024) +03/05/2022 03:34:43 - INFO - codeparrot_training - Step 32430: {'lr': 0.00044963403506937603, 'samples': 16604672, 'steps': 32430, 'loss/train': 1.7111198902130127} +03/05/2022 03:34:46 - INFO - codeparrot_training - Step 32431: {'lr': 0.00044963084064625775, 'samples': 16605184, 'steps': 32431, 'loss/train': 2.3616256713867188} +03/05/2022 03:34:49 - INFO - codeparrot_training - Skipping example with length 560 (seq_length=1024) +03/05/2022 03:34:51 - INFO - codeparrot_training - Step 32432: {'lr': 0.00044962764613318886, 'samples': 16605696, 'steps': 32432, 'loss/train': 1.4934982061386108} +03/05/2022 03:34:54 - INFO - codeparrot_training - Step 32433: {'lr': 0.00044962445153017087, 'samples': 16606208, 'steps': 32433, 'loss/train': 1.1801294088363647} +03/05/2022 03:34:57 - INFO - codeparrot_training - Skipping example with length 145 (seq_length=1024) +03/05/2022 03:35:00 - INFO - codeparrot_training - Step 32434: {'lr': 0.00044962125683720513, 'samples': 16606720, 'steps': 32434, 'loss/train': 1.0857094526290894} +03/05/2022 03:35:03 - INFO - codeparrot_training - Step 32435: {'lr': 0.0004496180620542931, 'samples': 16607232, 'steps': 32435, 'loss/train': 2.293895721435547} +03/05/2022 03:35:05 - INFO - codeparrot_training - Skipping example with length 218 (seq_length=1024) +03/05/2022 03:35:08 - INFO - codeparrot_training - Step 32436: {'lr': 0.00044961486718143634, 'samples': 16607744, 'steps': 32436, 'loss/train': 1.5313867330551147} +03/05/2022 03:35:12 - INFO - codeparrot_training - Step 32437: {'lr': 0.0004496116722186362, 'samples': 16608256, 'steps': 32437, 'loss/train': 1.0509016513824463} +03/05/2022 03:35:14 - INFO - codeparrot_training - Skipping example with length 138 (seq_length=1024) +03/05/2022 03:35:17 - INFO - codeparrot_training - Step 32438: {'lr': 0.00044960847716589403, 'samples': 16608768, 'steps': 32438, 'loss/train': 0.3248491883277893} +03/05/2022 03:35:20 - INFO - codeparrot_training - Step 32439: {'lr': 0.00044960528202321143, 'samples': 16609280, 'steps': 32439, 'loss/train': 2.612558126449585} +03/05/2022 03:35:23 - INFO - codeparrot_training - Skipping example with length 593 (seq_length=1024) +03/05/2022 03:35:25 - INFO - codeparrot_training - Step 32440: {'lr': 0.0004496020867905898, 'samples': 16609792, 'steps': 32440, 'loss/train': 1.4358925819396973} +03/05/2022 03:35:28 - INFO - codeparrot_training - Step 32441: {'lr': 0.00044959889146803047, 'samples': 16610304, 'steps': 32441, 'loss/train': 0.838768720626831} +03/05/2022 03:35:31 - INFO - codeparrot_training - Skipping example with length 455 (seq_length=1024) +03/05/2022 03:35:34 - INFO - codeparrot_training - Step 32442: {'lr': 0.00044959569605553494, 'samples': 16610816, 'steps': 32442, 'loss/train': 1.6564538478851318} +03/05/2022 03:35:37 - INFO - codeparrot_training - Step 32443: {'lr': 0.00044959250055310473, 'samples': 16611328, 'steps': 32443, 'loss/train': 6.891471862792969} +03/05/2022 03:35:40 - INFO - codeparrot_training - Step 32444: {'lr': 0.00044958930496074125, 'samples': 16611840, 'steps': 32444, 'loss/train': 1.9294989109039307} +03/05/2022 03:35:40 - INFO - codeparrot_training - Skipping example with length 560 (seq_length=1024) +03/05/2022 03:35:45 - INFO - codeparrot_training - Step 32445: {'lr': 0.0004495861092784459, 'samples': 16612352, 'steps': 32445, 'loss/train': 2.1351335048675537} +03/05/2022 03:35:48 - INFO - codeparrot_training - Skipping example with length 188 (seq_length=1024) +03/05/2022 03:35:51 - INFO - codeparrot_training - Step 32446: {'lr': 0.00044958291350622007, 'samples': 16612864, 'steps': 32446, 'loss/train': 1.3726168870925903} +03/05/2022 03:35:54 - INFO - codeparrot_training - Step 32447: {'lr': 0.0004495797176440653, 'samples': 16613376, 'steps': 32447, 'loss/train': 0.21007169783115387} +03/05/2022 03:35:56 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 03:35:59 - INFO - codeparrot_training - Step 32448: {'lr': 0.000449576521691983, 'samples': 16613888, 'steps': 32448, 'loss/train': 0.7761363387107849} +03/05/2022 03:36:02 - INFO - codeparrot_training - Step 32449: {'lr': 0.00044957332564997453, 'samples': 16614400, 'steps': 32449, 'loss/train': 1.8157480955123901} +03/05/2022 03:36:05 - INFO - codeparrot_training - Skipping example with length 98 (seq_length=1024) +03/05/2022 03:36:08 - INFO - codeparrot_training - Step 32450: {'lr': 0.0004495701295180414, 'samples': 16614912, 'steps': 32450, 'loss/train': 0.6970478296279907} +03/05/2022 03:36:11 - INFO - codeparrot_training - Step 32451: {'lr': 0.0004495669332961852, 'samples': 16615424, 'steps': 32451, 'loss/train': 2.6068992614746094} +03/05/2022 03:36:13 - INFO - codeparrot_training - Skipping example with length 118 (seq_length=1024) +03/05/2022 03:36:16 - INFO - codeparrot_training - Step 32452: {'lr': 0.0004495637369844071, 'samples': 16615936, 'steps': 32452, 'loss/train': 1.5784298181533813} +03/05/2022 03:36:19 - INFO - codeparrot_training - Step 32453: {'lr': 0.0004495605405827087, 'samples': 16616448, 'steps': 32453, 'loss/train': 2.0984599590301514} +03/05/2022 03:36:22 - INFO - codeparrot_training - Skipping example with length 278 (seq_length=1024) +03/05/2022 03:36:25 - INFO - codeparrot_training - Step 32454: {'lr': 0.00044955734409109135, 'samples': 16616960, 'steps': 32454, 'loss/train': 1.4528424739837646} +03/05/2022 03:36:28 - INFO - codeparrot_training - Step 32455: {'lr': 0.0004495541475095566, 'samples': 16617472, 'steps': 32455, 'loss/train': 1.8714102506637573} +03/05/2022 03:36:30 - INFO - codeparrot_training - Skipping example with length 195 (seq_length=1024) +03/05/2022 03:36:33 - INFO - codeparrot_training - Step 32456: {'lr': 0.0004495509508381058, 'samples': 16617984, 'steps': 32456, 'loss/train': 1.0773853063583374} +03/05/2022 03:36:36 - INFO - codeparrot_training - Step 32457: {'lr': 0.00044954775407674035, 'samples': 16618496, 'steps': 32457, 'loss/train': 1.935227870941162} +03/05/2022 03:36:39 - INFO - codeparrot_training - Skipping example with length 114 (seq_length=1024) +03/05/2022 03:36:42 - INFO - codeparrot_training - Step 32458: {'lr': 0.00044954455722546186, 'samples': 16619008, 'steps': 32458, 'loss/train': 1.594394564628601} +03/05/2022 03:36:45 - INFO - codeparrot_training - Step 32459: {'lr': 0.0004495413602842716, 'samples': 16619520, 'steps': 32459, 'loss/train': 1.6186305284500122} +03/05/2022 03:36:47 - INFO - codeparrot_training - Skipping example with length 408 (seq_length=1024) +03/05/2022 03:36:50 - INFO - codeparrot_training - Step 32460: {'lr': 0.00044953816325317116, 'samples': 16620032, 'steps': 32460, 'loss/train': 2.327622413635254} +03/05/2022 03:36:53 - INFO - codeparrot_training - Step 32461: {'lr': 0.0004495349661321618, 'samples': 16620544, 'steps': 32461, 'loss/train': 1.9374125003814697} +03/05/2022 03:36:56 - INFO - codeparrot_training - Skipping example with length 53 (seq_length=1024) +03/05/2022 03:36:58 - INFO - codeparrot_training - Step 32462: {'lr': 0.0004495317689212452, 'samples': 16621056, 'steps': 32462, 'loss/train': 2.392763137817383} +03/05/2022 03:37:02 - INFO - codeparrot_training - Step 32463: {'lr': 0.0004495285716204226, 'samples': 16621568, 'steps': 32463, 'loss/train': 1.5358927249908447} +03/05/2022 03:37:04 - INFO - codeparrot_training - Skipping example with length 107 (seq_length=1024) +03/05/2022 03:37:07 - INFO - codeparrot_training - Step 32464: {'lr': 0.00044952537422969545, 'samples': 16622080, 'steps': 32464, 'loss/train': 1.72659170627594} +03/05/2022 03:37:10 - INFO - codeparrot_training - Step 32465: {'lr': 0.0004495221767490653, 'samples': 16622592, 'steps': 32465, 'loss/train': 1.0177475214004517} +03/05/2022 03:37:12 - INFO - codeparrot_training - Skipping example with length 271 (seq_length=1024) +03/05/2022 03:37:15 - INFO - codeparrot_training - Step 32466: {'lr': 0.00044951897917853355, 'samples': 16623104, 'steps': 32466, 'loss/train': 1.385553002357483} +03/05/2022 03:37:19 - INFO - codeparrot_training - Step 32467: {'lr': 0.0004495157815181016, 'samples': 16623616, 'steps': 32467, 'loss/train': 2.412515640258789} +03/05/2022 03:37:20 - INFO - codeparrot_training - Skipping example with length 592 (seq_length=1024) +03/05/2022 03:37:24 - INFO - codeparrot_training - Step 32468: {'lr': 0.00044951258376777094, 'samples': 16624128, 'steps': 32468, 'loss/train': 2.292073965072632} +03/05/2022 03:37:27 - INFO - codeparrot_training - Step 32469: {'lr': 0.00044950938592754297, 'samples': 16624640, 'steps': 32469, 'loss/train': 2.0912930965423584} +03/05/2022 03:37:29 - INFO - codeparrot_training - Skipping example with length 511 (seq_length=1024) +03/05/2022 03:37:32 - INFO - codeparrot_training - Step 32470: {'lr': 0.00044950618799741913, 'samples': 16625152, 'steps': 32470, 'loss/train': 1.9644982814788818} +03/05/2022 03:37:35 - INFO - codeparrot_training - Step 32471: {'lr': 0.0004495029899774009, 'samples': 16625664, 'steps': 32471, 'loss/train': 1.2476348876953125} +03/05/2022 03:37:37 - INFO - codeparrot_training - Skipping example with length 673 (seq_length=1024) +03/05/2022 03:37:41 - INFO - codeparrot_training - Step 32472: {'lr': 0.00044949979186748967, 'samples': 16626176, 'steps': 32472, 'loss/train': 1.8012356758117676} +03/05/2022 03:37:44 - INFO - codeparrot_training - Step 32473: {'lr': 0.00044949659366768697, 'samples': 16626688, 'steps': 32473, 'loss/train': 1.7679799795150757} +03/05/2022 03:37:46 - INFO - codeparrot_training - Skipping example with length 722 (seq_length=1024) +03/05/2022 03:37:49 - INFO - codeparrot_training - Step 32474: {'lr': 0.00044949339537799415, 'samples': 16627200, 'steps': 32474, 'loss/train': 1.7883752584457397} +03/05/2022 03:37:52 - INFO - codeparrot_training - Step 32475: {'lr': 0.0004494901969984127, 'samples': 16627712, 'steps': 32475, 'loss/train': 2.003964900970459} +03/05/2022 03:37:54 - INFO - codeparrot_training - Skipping example with length 252 (seq_length=1024) +03/05/2022 03:37:58 - INFO - codeparrot_training - Step 32476: {'lr': 0.000449486998528944, 'samples': 16628224, 'steps': 32476, 'loss/train': 0.9493886828422546} +03/05/2022 03:38:01 - INFO - codeparrot_training - Step 32477: {'lr': 0.00044948379996958963, 'samples': 16628736, 'steps': 32477, 'loss/train': 2.0646250247955322} +03/05/2022 03:38:02 - INFO - codeparrot_training - Skipping example with length 483 (seq_length=1024) +03/05/2022 03:38:06 - INFO - codeparrot_training - Step 32478: {'lr': 0.00044948060132035087, 'samples': 16629248, 'steps': 32478, 'loss/train': 0.6245011687278748} +03/05/2022 03:38:09 - INFO - codeparrot_training - Step 32479: {'lr': 0.00044947740258122925, 'samples': 16629760, 'steps': 32479, 'loss/train': 1.4211345911026} +03/05/2022 03:38:11 - INFO - codeparrot_training - Skipping example with length 231 (seq_length=1024) +03/05/2022 03:38:14 - INFO - codeparrot_training - Step 32480: {'lr': 0.00044947420375222614, 'samples': 16630272, 'steps': 32480, 'loss/train': 2.0545804500579834} +03/05/2022 03:38:18 - INFO - codeparrot_training - Step 32481: {'lr': 0.00044947100483334315, 'samples': 16630784, 'steps': 32481, 'loss/train': 1.4362703561782837} +03/05/2022 03:38:19 - INFO - codeparrot_training - Skipping example with length 261 (seq_length=1024) +03/05/2022 03:38:23 - INFO - codeparrot_training - Step 32482: {'lr': 0.0004494678058245815, 'samples': 16631296, 'steps': 32482, 'loss/train': 1.420967936515808} +03/05/2022 03:38:26 - INFO - codeparrot_training - Step 32483: {'lr': 0.00044946460672594277, 'samples': 16631808, 'steps': 32483, 'loss/train': 1.9648367166519165} +03/05/2022 03:38:27 - INFO - codeparrot_training - Skipping example with length 988 (seq_length=1024) +03/05/2022 03:38:31 - INFO - codeparrot_training - Step 32484: {'lr': 0.0004494614075374283, 'samples': 16632320, 'steps': 32484, 'loss/train': 1.3338794708251953} +03/05/2022 03:38:34 - INFO - codeparrot_training - Step 32485: {'lr': 0.0004494582082590397, 'samples': 16632832, 'steps': 32485, 'loss/train': 1.271061897277832} +03/05/2022 03:38:36 - INFO - codeparrot_training - Skipping example with length 322 (seq_length=1024) +03/05/2022 03:38:40 - INFO - codeparrot_training - Step 32486: {'lr': 0.0004494550088907783, 'samples': 16633344, 'steps': 32486, 'loss/train': 2.485957145690918} +03/05/2022 03:38:43 - INFO - codeparrot_training - Step 32487: {'lr': 0.00044945180943264544, 'samples': 16633856, 'steps': 32487, 'loss/train': 1.375436782836914} +03/05/2022 03:38:44 - INFO - codeparrot_training - Skipping example with length 423 (seq_length=1024) +03/05/2022 03:38:48 - INFO - codeparrot_training - Step 32488: {'lr': 0.00044944860988464276, 'samples': 16634368, 'steps': 32488, 'loss/train': 1.2037006616592407} +03/05/2022 03:38:51 - INFO - codeparrot_training - Step 32489: {'lr': 0.0004494454102467716, 'samples': 16634880, 'steps': 32489, 'loss/train': 1.753919243812561} +03/05/2022 03:38:52 - INFO - codeparrot_training - Skipping example with length 372 (seq_length=1024) +03/05/2022 03:38:56 - INFO - codeparrot_training - Step 32490: {'lr': 0.00044944221051903345, 'samples': 16635392, 'steps': 32490, 'loss/train': 1.0960522890090942} +03/05/2022 03:38:59 - INFO - codeparrot_training - Step 32491: {'lr': 0.0004494390107014297, 'samples': 16635904, 'steps': 32491, 'loss/train': 2.0408830642700195} +03/05/2022 03:39:01 - INFO - codeparrot_training - Skipping example with length 191 (seq_length=1024) +03/05/2022 03:39:05 - INFO - codeparrot_training - Step 32492: {'lr': 0.0004494358107939618, 'samples': 16636416, 'steps': 32492, 'loss/train': 1.9325721263885498} +03/05/2022 03:39:08 - INFO - codeparrot_training - Step 32493: {'lr': 0.0004494326107966311, 'samples': 16636928, 'steps': 32493, 'loss/train': 2.104515790939331} +03/05/2022 03:39:09 - INFO - codeparrot_training - Skipping example with length 74 (seq_length=1024) +03/05/2022 03:39:13 - INFO - codeparrot_training - Step 32494: {'lr': 0.0004494294107094393, 'samples': 16637440, 'steps': 32494, 'loss/train': 1.7816121578216553} +03/05/2022 03:39:16 - INFO - codeparrot_training - Step 32495: {'lr': 0.00044942621053238764, 'samples': 16637952, 'steps': 32495, 'loss/train': 2.0925283432006836} +03/05/2022 03:39:18 - INFO - codeparrot_training - Skipping example with length 693 (seq_length=1024) +03/05/2022 03:39:22 - INFO - codeparrot_training - Step 32496: {'lr': 0.00044942301026547755, 'samples': 16638464, 'steps': 32496, 'loss/train': 1.8603712320327759} +03/05/2022 03:39:25 - INFO - codeparrot_training - Step 32497: {'lr': 0.0004494198099087106, 'samples': 16638976, 'steps': 32497, 'loss/train': 2.3530497550964355} +03/05/2022 03:39:26 - INFO - codeparrot_training - Skipping example with length 847 (seq_length=1024) +03/05/2022 03:39:30 - INFO - codeparrot_training - Step 32498: {'lr': 0.00044941660946208806, 'samples': 16639488, 'steps': 32498, 'loss/train': 1.3806134462356567} +03/05/2022 03:39:33 - INFO - codeparrot_training - Step 32499: {'lr': 0.00044941340892561154, 'samples': 16640000, 'steps': 32499, 'loss/train': 1.5196136236190796} +03/05/2022 03:39:35 - INFO - codeparrot_training - Skipping example with length 22 (seq_length=1024) +03/05/2022 03:39:39 - INFO - codeparrot_training - Step 32500: {'lr': 0.00044941020829928247, 'samples': 16640512, 'steps': 32500, 'loss/train': 1.8932324647903442} +03/05/2022 03:39:42 - INFO - codeparrot_training - Step 32501: {'lr': 0.00044940700758310214, 'samples': 16641024, 'steps': 32501, 'loss/train': 0.6498285531997681} +03/05/2022 03:39:43 - INFO - codeparrot_training - Skipping example with length 220 (seq_length=1024) +03/05/2022 03:39:47 - INFO - codeparrot_training - Step 32502: {'lr': 0.00044940380677707214, 'samples': 16641536, 'steps': 32502, 'loss/train': 0.18013617396354675} +03/05/2022 03:39:51 - INFO - codeparrot_training - Step 32503: {'lr': 0.00044940060588119393, 'samples': 16642048, 'steps': 32503, 'loss/train': 2.164668560028076} +03/05/2022 03:39:53 - INFO - codeparrot_training - Skipping example with length 343 (seq_length=1024) +03/05/2022 03:39:56 - INFO - codeparrot_training - Step 32504: {'lr': 0.00044939740489546875, 'samples': 16642560, 'steps': 32504, 'loss/train': 1.910035252571106} +03/05/2022 03:39:59 - INFO - codeparrot_training - Step 32505: {'lr': 0.0004493942038198983, 'samples': 16643072, 'steps': 32505, 'loss/train': 1.783010482788086} +03/05/2022 03:40:01 - INFO - codeparrot_training - Skipping example with length 614 (seq_length=1024) +03/05/2022 03:40:04 - INFO - codeparrot_training - Step 32506: {'lr': 0.0004493910026544838, 'samples': 16643584, 'steps': 32506, 'loss/train': 1.813146710395813} +03/05/2022 03:40:07 - INFO - codeparrot_training - Step 32507: {'lr': 0.0004493878013992268, 'samples': 16644096, 'steps': 32507, 'loss/train': 1.222377061843872} +03/05/2022 03:40:09 - INFO - codeparrot_training - Skipping example with length 983 (seq_length=1024) +03/05/2022 03:40:13 - INFO - codeparrot_training - Step 32508: {'lr': 0.0004493846000541287, 'samples': 16644608, 'steps': 32508, 'loss/train': 2.4136996269226074} +03/05/2022 03:40:16 - INFO - codeparrot_training - Step 32509: {'lr': 0.00044938139861919115, 'samples': 16645120, 'steps': 32509, 'loss/train': 1.6823498010635376} +03/05/2022 03:40:18 - INFO - codeparrot_training - Skipping example with length 717 (seq_length=1024) +03/05/2022 03:40:21 - INFO - codeparrot_training - Step 32510: {'lr': 0.00044937819709441523, 'samples': 16645632, 'steps': 32510, 'loss/train': 1.9083900451660156} +03/05/2022 03:40:24 - INFO - codeparrot_training - Step 32511: {'lr': 0.00044937499547980265, 'samples': 16646144, 'steps': 32511, 'loss/train': 1.6409327983856201} +03/05/2022 03:40:26 - INFO - codeparrot_training - Skipping example with length 121 (seq_length=1024) +03/05/2022 03:40:30 - INFO - codeparrot_training - Step 32512: {'lr': 0.00044937179377535475, 'samples': 16646656, 'steps': 32512, 'loss/train': 1.6740772724151611} +03/05/2022 03:40:33 - INFO - codeparrot_training - Step 32513: {'lr': 0.00044936859198107306, 'samples': 16647168, 'steps': 32513, 'loss/train': 2.3721959590911865} +03/05/2022 03:40:34 - INFO - codeparrot_training - Skipping example with length 192 (seq_length=1024) +03/05/2022 03:40:38 - INFO - codeparrot_training - Step 32514: {'lr': 0.0004493653900969589, 'samples': 16647680, 'steps': 32514, 'loss/train': 1.899351954460144} +03/05/2022 03:40:41 - INFO - codeparrot_training - Step 32515: {'lr': 0.0004493621881230138, 'samples': 16648192, 'steps': 32515, 'loss/train': 2.058785915374756} +03/05/2022 03:40:44 - INFO - codeparrot_training - Skipping example with length 264 (seq_length=1024) +03/05/2022 03:40:46 - INFO - codeparrot_training - Step 32516: {'lr': 0.00044935898605923916, 'samples': 16648704, 'steps': 32516, 'loss/train': 1.2470084428787231} +03/05/2022 03:40:50 - INFO - codeparrot_training - Step 32517: {'lr': 0.0004493557839056364, 'samples': 16649216, 'steps': 32517, 'loss/train': 1.9156990051269531} +03/05/2022 03:40:52 - INFO - codeparrot_training - Skipping example with length 782 (seq_length=1024) +03/05/2022 03:40:55 - INFO - codeparrot_training - Step 32518: {'lr': 0.00044935258166220704, 'samples': 16649728, 'steps': 32518, 'loss/train': 1.7598196268081665} +03/05/2022 03:40:58 - INFO - codeparrot_training - Step 32519: {'lr': 0.00044934937932895246, 'samples': 16650240, 'steps': 32519, 'loss/train': 2.3987717628479004} +03/05/2022 03:41:00 - INFO - codeparrot_training - Skipping example with length 679 (seq_length=1024) +03/05/2022 03:41:03 - INFO - codeparrot_training - Step 32520: {'lr': 0.0004493461769058742, 'samples': 16650752, 'steps': 32520, 'loss/train': 1.7775099277496338} +03/05/2022 03:41:07 - INFO - codeparrot_training - Step 32521: {'lr': 0.00044934297439297357, 'samples': 16651264, 'steps': 32521, 'loss/train': 1.3451353311538696} +03/05/2022 03:41:08 - INFO - codeparrot_training - Skipping example with length 413 (seq_length=1024) +03/05/2022 03:41:12 - INFO - codeparrot_training - Step 32522: {'lr': 0.0004493397717902521, 'samples': 16651776, 'steps': 32522, 'loss/train': 0.7490481734275818} +03/05/2022 03:41:15 - INFO - codeparrot_training - Step 32523: {'lr': 0.00044933656909771117, 'samples': 16652288, 'steps': 32523, 'loss/train': 1.1000535488128662} +03/05/2022 03:41:18 - INFO - codeparrot_training - Skipping example with length 714 (seq_length=1024) +03/05/2022 03:41:20 - INFO - codeparrot_training - Step 32524: {'lr': 0.00044933336631535224, 'samples': 16652800, 'steps': 32524, 'loss/train': 1.5737924575805664} +03/05/2022 03:41:24 - INFO - codeparrot_training - Step 32525: {'lr': 0.0004493301634431768, 'samples': 16653312, 'steps': 32525, 'loss/train': 2.393526315689087} +03/05/2022 03:41:26 - INFO - codeparrot_training - Skipping example with length 465 (seq_length=1024) +03/05/2022 03:41:29 - INFO - codeparrot_training - Step 32526: {'lr': 0.0004493269604811863, 'samples': 16653824, 'steps': 32526, 'loss/train': 1.6190117597579956} +03/05/2022 03:41:32 - INFO - codeparrot_training - Step 32527: {'lr': 0.000449323757429382, 'samples': 16654336, 'steps': 32527, 'loss/train': 1.4296857118606567} +03/05/2022 03:41:34 - INFO - codeparrot_training - Skipping example with length 104 (seq_length=1024) +03/05/2022 03:41:37 - INFO - codeparrot_training - Step 32528: {'lr': 0.00044932055428776566, 'samples': 16654848, 'steps': 32528, 'loss/train': 0.22194428741931915} +03/05/2022 03:41:40 - INFO - codeparrot_training - Step 32529: {'lr': 0.00044931735105633853, 'samples': 16655360, 'steps': 32529, 'loss/train': 1.9686369895935059} +03/05/2022 03:41:42 - INFO - codeparrot_training - Skipping example with length 331 (seq_length=1024) +03/05/2022 03:41:46 - INFO - codeparrot_training - Step 32530: {'lr': 0.00044931414773510207, 'samples': 16655872, 'steps': 32530, 'loss/train': 2.4895174503326416} +03/05/2022 03:41:49 - INFO - codeparrot_training - Step 32531: {'lr': 0.00044931094432405766, 'samples': 16656384, 'steps': 32531, 'loss/train': 0.12578052282333374} +03/05/2022 03:41:51 - INFO - codeparrot_training - Skipping example with length 954 (seq_length=1024) +03/05/2022 03:41:54 - INFO - codeparrot_training - Step 32532: {'lr': 0.00044930774082320684, 'samples': 16656896, 'steps': 32532, 'loss/train': 1.8606159687042236} +03/05/2022 03:41:57 - INFO - codeparrot_training - Step 32533: {'lr': 0.00044930453723255107, 'samples': 16657408, 'steps': 32533, 'loss/train': 1.4303772449493408} +03/05/2022 03:41:59 - INFO - codeparrot_training - Skipping example with length 310 (seq_length=1024) +03/05/2022 03:42:03 - INFO - codeparrot_training - Step 32534: {'lr': 0.0004493013335520917, 'samples': 16657920, 'steps': 32534, 'loss/train': 1.8415628671646118} +03/05/2022 03:42:06 - INFO - codeparrot_training - Step 32535: {'lr': 0.00044929812978183024, 'samples': 16658432, 'steps': 32535, 'loss/train': 1.287062644958496} +03/05/2022 03:42:08 - INFO - codeparrot_training - Skipping example with length 243 (seq_length=1024) +03/05/2022 03:42:11 - INFO - codeparrot_training - Step 32536: {'lr': 0.0004492949259217681, 'samples': 16658944, 'steps': 32536, 'loss/train': 1.820600986480713} +03/05/2022 03:42:14 - INFO - codeparrot_training - Step 32537: {'lr': 0.00044929172197190684, 'samples': 16659456, 'steps': 32537, 'loss/train': 0.12635044753551483} +03/05/2022 03:42:16 - INFO - codeparrot_training - Skipping example with length 821 (seq_length=1024) +03/05/2022 03:42:20 - INFO - codeparrot_training - Step 32538: {'lr': 0.00044928851793224765, 'samples': 16659968, 'steps': 32538, 'loss/train': 1.5570791959762573} +03/05/2022 03:42:23 - INFO - codeparrot_training - Step 32539: {'lr': 0.00044928531380279224, 'samples': 16660480, 'steps': 32539, 'loss/train': 2.6861183643341064} +03/05/2022 03:42:25 - INFO - codeparrot_training - Skipping example with length 778 (seq_length=1024) +03/05/2022 03:42:28 - INFO - codeparrot_training - Step 32540: {'lr': 0.00044928210958354196, 'samples': 16660992, 'steps': 32540, 'loss/train': 1.9324324131011963} +03/05/2022 03:42:31 - INFO - codeparrot_training - Step 32541: {'lr': 0.0004492789052744982, 'samples': 16661504, 'steps': 32541, 'loss/train': 1.546565055847168} +03/05/2022 03:42:33 - INFO - codeparrot_training - Skipping example with length 64 (seq_length=1024) +03/05/2022 03:42:37 - INFO - codeparrot_training - Step 32542: {'lr': 0.0004492757008756624, 'samples': 16662016, 'steps': 32542, 'loss/train': 2.003206968307495} +03/05/2022 03:42:40 - INFO - codeparrot_training - Step 32543: {'lr': 0.0004492724963870361, 'samples': 16662528, 'steps': 32543, 'loss/train': 1.0537060499191284} +03/05/2022 03:42:42 - INFO - codeparrot_training - Skipping example with length 658 (seq_length=1024) +03/05/2022 03:42:46 - INFO - codeparrot_training - Step 32544: {'lr': 0.00044926929180862064, 'samples': 16663040, 'steps': 32544, 'loss/train': 1.7150063514709473} +03/05/2022 03:42:49 - INFO - codeparrot_training - Step 32545: {'lr': 0.00044926608714041763, 'samples': 16663552, 'steps': 32545, 'loss/train': 2.3302531242370605} +03/05/2022 03:42:52 - INFO - codeparrot_training - Step 32546: {'lr': 0.0004492628823824282, 'samples': 16664064, 'steps': 32546, 'loss/train': 1.3007757663726807} +03/05/2022 03:42:54 - INFO - codeparrot_training - Skipping example with length 457 (seq_length=1024) +03/05/2022 03:42:57 - INFO - codeparrot_training - Step 32547: {'lr': 0.0004492596775346541, 'samples': 16664576, 'steps': 32547, 'loss/train': 1.6382144689559937} +03/05/2022 03:43:01 - INFO - codeparrot_training - Step 32548: {'lr': 0.0004492564725970967, 'samples': 16665088, 'steps': 32548, 'loss/train': 1.7310819625854492} +03/05/2022 03:43:02 - INFO - codeparrot_training - Skipping example with length 29 (seq_length=1024) +03/05/2022 03:43:06 - INFO - codeparrot_training - Step 32549: {'lr': 0.00044925326756975736, 'samples': 16665600, 'steps': 32549, 'loss/train': 2.4321587085723877} +03/05/2022 03:43:09 - INFO - codeparrot_training - Step 32550: {'lr': 0.00044925006245263757, 'samples': 16666112, 'steps': 32550, 'loss/train': 0.09825701266527176} +03/05/2022 03:43:11 - INFO - codeparrot_training - Skipping example with length 96 (seq_length=1024) +03/05/2022 03:43:14 - INFO - codeparrot_training - Step 32551: {'lr': 0.0004492468572457388, 'samples': 16666624, 'steps': 32551, 'loss/train': 1.290374517440796} +03/05/2022 03:43:18 - INFO - codeparrot_training - Step 32552: {'lr': 0.0004492436519490625, 'samples': 16667136, 'steps': 32552, 'loss/train': 1.6578922271728516} +03/05/2022 03:43:19 - INFO - codeparrot_training - Skipping example with length 144 (seq_length=1024) +03/05/2022 03:43:23 - INFO - codeparrot_training - Step 32553: {'lr': 0.00044924044656260997, 'samples': 16667648, 'steps': 32553, 'loss/train': 1.7882187366485596} +03/05/2022 03:43:26 - INFO - codeparrot_training - Step 32554: {'lr': 0.00044923724108638285, 'samples': 16668160, 'steps': 32554, 'loss/train': 1.343475341796875} +03/05/2022 03:43:27 - INFO - codeparrot_training - Skipping example with length 752 (seq_length=1024) +03/05/2022 03:43:31 - INFO - codeparrot_training - Step 32555: {'lr': 0.00044923403552038255, 'samples': 16668672, 'steps': 32555, 'loss/train': 1.6840152740478516} +03/05/2022 03:43:34 - INFO - codeparrot_training - Step 32556: {'lr': 0.0004492308298646104, 'samples': 16669184, 'steps': 32556, 'loss/train': 1.643323302268982} +03/05/2022 03:43:36 - INFO - codeparrot_training - Skipping example with length 826 (seq_length=1024) +03/05/2022 03:43:40 - INFO - codeparrot_training - Step 32557: {'lr': 0.0004492276241190679, 'samples': 16669696, 'steps': 32557, 'loss/train': 2.28226375579834} +03/05/2022 03:43:43 - INFO - codeparrot_training - Step 32558: {'lr': 0.0004492244182837565, 'samples': 16670208, 'steps': 32558, 'loss/train': 1.1694397926330566} +03/05/2022 03:43:44 - INFO - codeparrot_training - Skipping example with length 486 (seq_length=1024) +03/05/2022 03:43:48 - INFO - codeparrot_training - Step 32559: {'lr': 0.00044922121235867776, 'samples': 16670720, 'steps': 32559, 'loss/train': 1.9928205013275146} +03/05/2022 03:43:51 - INFO - codeparrot_training - Step 32560: {'lr': 0.00044921800634383294, 'samples': 16671232, 'steps': 32560, 'loss/train': 1.6142312288284302} +03/05/2022 03:43:52 - INFO - codeparrot_training - Skipping example with length 798 (seq_length=1024) +03/05/2022 03:43:57 - INFO - codeparrot_training - Step 32561: {'lr': 0.0004492148002392235, 'samples': 16671744, 'steps': 32561, 'loss/train': 2.203921318054199} +03/05/2022 03:44:00 - INFO - codeparrot_training - Step 32562: {'lr': 0.000449211594044851, 'samples': 16672256, 'steps': 32562, 'loss/train': 1.9882726669311523} +03/05/2022 03:44:01 - INFO - codeparrot_training - Skipping example with length 105 (seq_length=1024) +03/05/2022 03:44:05 - INFO - codeparrot_training - Step 32563: {'lr': 0.0004492083877607168, 'samples': 16672768, 'steps': 32563, 'loss/train': 1.7191581726074219} +03/05/2022 03:44:08 - INFO - codeparrot_training - Step 32564: {'lr': 0.00044920518138682244, 'samples': 16673280, 'steps': 32564, 'loss/train': 1.5999605655670166} +03/05/2022 03:44:09 - INFO - codeparrot_training - Skipping example with length 270 (seq_length=1024) +03/05/2022 03:44:13 - INFO - codeparrot_training - Step 32565: {'lr': 0.00044920197492316925, 'samples': 16673792, 'steps': 32565, 'loss/train': 1.6284418106079102} +03/05/2022 03:44:17 - INFO - codeparrot_training - Step 32566: {'lr': 0.00044919876836975876, 'samples': 16674304, 'steps': 32566, 'loss/train': 1.8037230968475342} +03/05/2022 03:44:18 - INFO - codeparrot_training - Skipping example with length 142 (seq_length=1024) +03/05/2022 03:44:22 - INFO - codeparrot_training - Step 32567: {'lr': 0.0004491955617265924, 'samples': 16674816, 'steps': 32567, 'loss/train': 1.6405211687088013} +03/05/2022 03:44:26 - INFO - codeparrot_training - Step 32568: {'lr': 0.0004491923549936715, 'samples': 16675328, 'steps': 32568, 'loss/train': 2.170546770095825} +03/05/2022 03:44:29 - INFO - codeparrot_training - Step 32569: {'lr': 0.0004491891481709977, 'samples': 16675840, 'steps': 32569, 'loss/train': 0.10429401695728302} +03/05/2022 03:44:29 - INFO - codeparrot_training - Skipping example with length 432 (seq_length=1024) +03/05/2022 03:44:34 - INFO - codeparrot_training - Step 32570: {'lr': 0.0004491859412585723, 'samples': 16676352, 'steps': 32570, 'loss/train': 1.8292902708053589} +03/05/2022 03:44:37 - INFO - codeparrot_training - Skipping example with length 401 (seq_length=1024) +03/05/2022 03:44:39 - INFO - codeparrot_training - Step 32571: {'lr': 0.0004491827342563968, 'samples': 16676864, 'steps': 32571, 'loss/train': 1.5793107748031616} +03/05/2022 03:44:43 - INFO - codeparrot_training - Step 32572: {'lr': 0.0004491795271644726, 'samples': 16677376, 'steps': 32572, 'loss/train': 1.586366057395935} +03/05/2022 03:44:45 - INFO - codeparrot_training - Skipping example with length 457 (seq_length=1024) +03/05/2022 03:44:48 - INFO - codeparrot_training - Step 32573: {'lr': 0.0004491763199828012, 'samples': 16677888, 'steps': 32573, 'loss/train': 2.0771255493164062} +03/05/2022 03:44:51 - INFO - codeparrot_training - Step 32574: {'lr': 0.00044917311271138393, 'samples': 16678400, 'steps': 32574, 'loss/train': 1.9533355236053467} +03/05/2022 03:44:54 - INFO - codeparrot_training - Skipping example with length 872 (seq_length=1024) +03/05/2022 03:44:56 - INFO - codeparrot_training - Step 32575: {'lr': 0.00044916990535022244, 'samples': 16678912, 'steps': 32575, 'loss/train': 0.7579390406608582} +03/05/2022 03:44:59 - INFO - codeparrot_training - Step 32576: {'lr': 0.00044916669789931806, 'samples': 16679424, 'steps': 32576, 'loss/train': 1.5620167255401611} +03/05/2022 03:45:02 - INFO - codeparrot_training - Skipping example with length 291 (seq_length=1024) +03/05/2022 03:45:05 - INFO - codeparrot_training - Step 32577: {'lr': 0.0004491634903586722, 'samples': 16679936, 'steps': 32577, 'loss/train': 1.672410249710083} +03/05/2022 03:45:08 - INFO - codeparrot_training - Step 32578: {'lr': 0.00044916028272828636, 'samples': 16680448, 'steps': 32578, 'loss/train': 1.8122777938842773} +03/05/2022 03:45:10 - INFO - codeparrot_training - Skipping example with length 513 (seq_length=1024) +03/05/2022 03:45:13 - INFO - codeparrot_training - Step 32579: {'lr': 0.00044915707500816206, 'samples': 16680960, 'steps': 32579, 'loss/train': 1.3082588911056519} +03/05/2022 03:45:16 - INFO - codeparrot_training - Step 32580: {'lr': 0.0004491538671983005, 'samples': 16681472, 'steps': 32580, 'loss/train': 3.292508363723755} +03/05/2022 03:45:19 - INFO - codeparrot_training - Skipping example with length 432 (seq_length=1024) +03/05/2022 03:45:21 - INFO - codeparrot_training - Step 32581: {'lr': 0.00044915065929870335, 'samples': 16681984, 'steps': 32581, 'loss/train': 1.6692408323287964} +03/05/2022 03:45:25 - INFO - codeparrot_training - Step 32582: {'lr': 0.00044914745130937204, 'samples': 16682496, 'steps': 32582, 'loss/train': 1.2074205875396729} +03/05/2022 03:45:27 - INFO - codeparrot_training - Skipping example with length 346 (seq_length=1024) +03/05/2022 03:45:30 - INFO - codeparrot_training - Step 32583: {'lr': 0.0004491442432303079, 'samples': 16683008, 'steps': 32583, 'loss/train': 1.8213645219802856} +03/05/2022 03:45:33 - INFO - codeparrot_training - Step 32584: {'lr': 0.0004491410350615124, 'samples': 16683520, 'steps': 32584, 'loss/train': 1.433095097541809} +03/05/2022 03:45:35 - INFO - codeparrot_training - Skipping example with length 123 (seq_length=1024) +03/05/2022 03:45:38 - INFO - codeparrot_training - Step 32585: {'lr': 0.0004491378268029871, 'samples': 16684032, 'steps': 32585, 'loss/train': 1.6470701694488525} +03/05/2022 03:45:42 - INFO - codeparrot_training - Step 32586: {'lr': 0.00044913461845473335, 'samples': 16684544, 'steps': 32586, 'loss/train': 1.6011825799942017} +03/05/2022 03:45:43 - INFO - codeparrot_training - Skipping example with length 240 (seq_length=1024) +03/05/2022 03:45:47 - INFO - codeparrot_training - Step 32587: {'lr': 0.0004491314100167526, 'samples': 16685056, 'steps': 32587, 'loss/train': 1.8967292308807373} +03/05/2022 03:45:50 - INFO - codeparrot_training - Step 32588: {'lr': 0.00044912820148904634, 'samples': 16685568, 'steps': 32588, 'loss/train': 1.568588376045227} +03/05/2022 03:45:52 - INFO - codeparrot_training - Skipping example with length 89 (seq_length=1024) +03/05/2022 03:45:55 - INFO - codeparrot_training - Step 32589: {'lr': 0.0004491249928716159, 'samples': 16686080, 'steps': 32589, 'loss/train': 1.8458131551742554} +03/05/2022 03:45:58 - INFO - codeparrot_training - Step 32590: {'lr': 0.0004491217841644629, 'samples': 16686592, 'steps': 32590, 'loss/train': 1.2073935270309448} +03/05/2022 03:46:00 - INFO - codeparrot_training - Skipping example with length 70 (seq_length=1024) +03/05/2022 03:46:04 - INFO - codeparrot_training - Step 32591: {'lr': 0.0004491185753675886, 'samples': 16687104, 'steps': 32591, 'loss/train': 1.447007417678833} +03/05/2022 03:46:07 - INFO - codeparrot_training - Step 32592: {'lr': 0.0004491153664809947, 'samples': 16687616, 'steps': 32592, 'loss/train': 1.4809558391571045} +03/05/2022 03:46:09 - INFO - codeparrot_training - Skipping example with length 939 (seq_length=1024) +03/05/2022 03:46:12 - INFO - codeparrot_training - Step 32593: {'lr': 0.00044911215750468236, 'samples': 16688128, 'steps': 32593, 'loss/train': 1.675031065940857} +03/05/2022 03:46:15 - INFO - codeparrot_training - Step 32594: {'lr': 0.0004491089484386531, 'samples': 16688640, 'steps': 32594, 'loss/train': 1.9420222043991089} +03/05/2022 03:46:17 - INFO - codeparrot_training - Skipping example with length 679 (seq_length=1024) +03/05/2022 03:46:21 - INFO - codeparrot_training - Step 32595: {'lr': 0.0004491057392829086, 'samples': 16689152, 'steps': 32595, 'loss/train': 1.6752437353134155} +03/05/2022 03:46:24 - INFO - codeparrot_training - Step 32596: {'lr': 0.00044910253003745007, 'samples': 16689664, 'steps': 32596, 'loss/train': 0.919418454170227} +03/05/2022 03:46:26 - INFO - codeparrot_training - Skipping example with length 407 (seq_length=1024) +03/05/2022 03:46:29 - INFO - codeparrot_training - Step 32597: {'lr': 0.00044909932070227887, 'samples': 16690176, 'steps': 32597, 'loss/train': 1.9615058898925781} +03/05/2022 03:46:32 - INFO - codeparrot_training - Step 32598: {'lr': 0.00044909611127739676, 'samples': 16690688, 'steps': 32598, 'loss/train': 1.6287546157836914} +03/05/2022 03:46:34 - INFO - codeparrot_training - Skipping example with length 907 (seq_length=1024) +03/05/2022 03:46:38 - INFO - codeparrot_training - Step 32599: {'lr': 0.00044909290176280495, 'samples': 16691200, 'steps': 32599, 'loss/train': 2.3242855072021484} +03/05/2022 03:46:41 - INFO - codeparrot_training - Step 32600: {'lr': 0.00044908969215850495, 'samples': 16691712, 'steps': 32600, 'loss/train': 1.300263524055481} +03/05/2022 03:46:43 - INFO - codeparrot_training - Skipping example with length 25 (seq_length=1024) +03/05/2022 03:46:46 - INFO - codeparrot_training - Step 32601: {'lr': 0.0004490864824644982, 'samples': 16692224, 'steps': 32601, 'loss/train': 1.586312174797058} +03/05/2022 03:46:49 - INFO - codeparrot_training - Step 32602: {'lr': 0.0004490832726807862, 'samples': 16692736, 'steps': 32602, 'loss/train': 1.4740346670150757} +03/05/2022 03:46:51 - INFO - codeparrot_training - Skipping example with length 956 (seq_length=1024) +03/05/2022 03:46:55 - INFO - codeparrot_training - Step 32603: {'lr': 0.0004490800628073703, 'samples': 16693248, 'steps': 32603, 'loss/train': 2.284289836883545} +03/05/2022 03:46:58 - INFO - codeparrot_training - Step 32604: {'lr': 0.000449076852844252, 'samples': 16693760, 'steps': 32604, 'loss/train': 2.293776750564575} +03/05/2022 03:47:03 - INFO - codeparrot_training - Step 32605: {'lr': 0.0004490736427914327, 'samples': 16694272, 'steps': 32605, 'loss/train': 2.3977556228637695} +03/05/2022 03:47:06 - INFO - codeparrot_training - Step 32606: {'lr': 0.000449070432648914, 'samples': 16694784, 'steps': 32606, 'loss/train': 2.1151010990142822} +03/05/2022 03:47:08 - INFO - codeparrot_training - Skipping example with length 285 (seq_length=1024) +03/05/2022 03:47:11 - INFO - codeparrot_training - Step 32607: {'lr': 0.0004490672224166972, 'samples': 16695296, 'steps': 32607, 'loss/train': 2.4286179542541504} +03/05/2022 03:47:15 - INFO - codeparrot_training - Step 32608: {'lr': 0.00044906401209478367, 'samples': 16695808, 'steps': 32608, 'loss/train': 2.4963057041168213} +03/05/2022 03:47:16 - INFO - codeparrot_training - Skipping example with length 644 (seq_length=1024) +03/05/2022 03:47:20 - INFO - codeparrot_training - Step 32609: {'lr': 0.00044906080168317507, 'samples': 16696320, 'steps': 32609, 'loss/train': 1.8330910205841064} +03/05/2022 03:47:23 - INFO - codeparrot_training - Step 32610: {'lr': 0.0004490575911818727, 'samples': 16696832, 'steps': 32610, 'loss/train': 0.46499234437942505} +03/05/2022 03:47:25 - INFO - codeparrot_training - Skipping example with length 912 (seq_length=1024) +03/05/2022 03:47:28 - INFO - codeparrot_training - Step 32611: {'lr': 0.0004490543805908781, 'samples': 16697344, 'steps': 32611, 'loss/train': 0.8260604739189148} +03/05/2022 03:47:32 - INFO - codeparrot_training - Step 32612: {'lr': 0.00044905116991019264, 'samples': 16697856, 'steps': 32612, 'loss/train': 2.194272994995117} +03/05/2022 03:47:33 - INFO - codeparrot_training - Skipping example with length 847 (seq_length=1024) +03/05/2022 03:47:37 - INFO - codeparrot_training - Step 32613: {'lr': 0.00044904795913981775, 'samples': 16698368, 'steps': 32613, 'loss/train': 0.8410437703132629} +03/05/2022 03:47:40 - INFO - codeparrot_training - Step 32614: {'lr': 0.00044904474827975506, 'samples': 16698880, 'steps': 32614, 'loss/train': 2.218437433242798} +03/05/2022 03:47:42 - INFO - codeparrot_training - Skipping example with length 171 (seq_length=1024) +03/05/2022 03:47:45 - INFO - codeparrot_training - Step 32615: {'lr': 0.00044904153733000575, 'samples': 16699392, 'steps': 32615, 'loss/train': 1.7397236824035645} +03/05/2022 03:47:49 - INFO - codeparrot_training - Step 32616: {'lr': 0.0004490383262905714, 'samples': 16699904, 'steps': 32616, 'loss/train': 1.3464069366455078} +03/05/2022 03:47:50 - INFO - codeparrot_training - Skipping example with length 30 (seq_length=1024) +03/05/2022 03:47:54 - INFO - codeparrot_training - Step 32617: {'lr': 0.00044903511516145353, 'samples': 16700416, 'steps': 32617, 'loss/train': 1.8454314470291138} +03/05/2022 03:47:57 - INFO - codeparrot_training - Step 32618: {'lr': 0.0004490319039426535, 'samples': 16700928, 'steps': 32618, 'loss/train': 1.8288780450820923} +03/05/2022 03:47:59 - INFO - codeparrot_training - Skipping example with length 320 (seq_length=1024) +03/05/2022 03:48:03 - INFO - codeparrot_training - Step 32619: {'lr': 0.0004490286926341727, 'samples': 16701440, 'steps': 32619, 'loss/train': 1.689068078994751} +03/05/2022 03:48:06 - INFO - codeparrot_training - Step 32620: {'lr': 0.0004490254812360126, 'samples': 16701952, 'steps': 32620, 'loss/train': 1.2634406089782715} +03/05/2022 03:48:11 - INFO - codeparrot_training - Step 32621: {'lr': 0.0004490222697481748, 'samples': 16702464, 'steps': 32621, 'loss/train': 1.8520931005477905} +03/05/2022 03:48:14 - INFO - codeparrot_training - Step 32622: {'lr': 0.00044901905817066055, 'samples': 16702976, 'steps': 32622, 'loss/train': 1.114019751548767} +03/05/2022 03:48:16 - INFO - codeparrot_training - Skipping example with length 618 (seq_length=1024) +03/05/2022 03:48:20 - INFO - codeparrot_training - Step 32623: {'lr': 0.00044901584650347147, 'samples': 16703488, 'steps': 32623, 'loss/train': 1.8870620727539062} +03/05/2022 03:48:23 - INFO - codeparrot_training - Step 32624: {'lr': 0.00044901263474660894, 'samples': 16704000, 'steps': 32624, 'loss/train': 2.325376510620117} +03/05/2022 03:48:24 - INFO - codeparrot_training - Skipping example with length 954 (seq_length=1024) +03/05/2022 03:48:28 - INFO - codeparrot_training - Step 32625: {'lr': 0.0004490094229000743, 'samples': 16704512, 'steps': 32625, 'loss/train': 2.400545120239258} +03/05/2022 03:48:31 - INFO - codeparrot_training - Step 32626: {'lr': 0.00044900621096386904, 'samples': 16705024, 'steps': 32626, 'loss/train': 2.415570020675659} +03/05/2022 03:48:33 - INFO - codeparrot_training - Skipping example with length 27 (seq_length=1024) +03/05/2022 03:48:37 - INFO - codeparrot_training - Step 32627: {'lr': 0.00044900299893799476, 'samples': 16705536, 'steps': 32627, 'loss/train': 1.5444202423095703} +03/05/2022 03:48:40 - INFO - codeparrot_training - Step 32628: {'lr': 0.0004489997868224528, 'samples': 16706048, 'steps': 32628, 'loss/train': 1.923972725868225} +03/05/2022 03:48:41 - INFO - codeparrot_training - Skipping example with length 555 (seq_length=1024) +03/05/2022 03:48:45 - INFO - codeparrot_training - Step 32629: {'lr': 0.00044899657461724453, 'samples': 16706560, 'steps': 32629, 'loss/train': 1.7271745204925537} +03/05/2022 03:48:48 - INFO - codeparrot_training - Step 32630: {'lr': 0.00044899336232237156, 'samples': 16707072, 'steps': 32630, 'loss/train': 1.820676326751709} +03/05/2022 03:48:50 - INFO - codeparrot_training - Skipping example with length 853 (seq_length=1024) +03/05/2022 03:48:54 - INFO - codeparrot_training - Step 32631: {'lr': 0.0004489901499378352, 'samples': 16707584, 'steps': 32631, 'loss/train': 1.829119086265564} +03/05/2022 03:48:57 - INFO - codeparrot_training - Step 32632: {'lr': 0.00044898693746363695, 'samples': 16708096, 'steps': 32632, 'loss/train': 1.2774642705917358} +03/05/2022 03:48:59 - INFO - codeparrot_training - Skipping example with length 296 (seq_length=1024) +03/05/2022 03:49:02 - INFO - codeparrot_training - Step 32633: {'lr': 0.00044898372489977825, 'samples': 16708608, 'steps': 32633, 'loss/train': 1.8329066038131714} +03/05/2022 03:49:05 - INFO - codeparrot_training - Step 32634: {'lr': 0.0004489805122462606, 'samples': 16709120, 'steps': 32634, 'loss/train': 2.4088149070739746} +03/05/2022 03:49:07 - INFO - codeparrot_training - Skipping example with length 300 (seq_length=1024) +03/05/2022 03:49:11 - INFO - codeparrot_training - Step 32635: {'lr': 0.0004489772995030853, 'samples': 16709632, 'steps': 32635, 'loss/train': 2.5353541374206543} +03/05/2022 03:49:14 - INFO - codeparrot_training - Step 32636: {'lr': 0.00044897408667025397, 'samples': 16710144, 'steps': 32636, 'loss/train': 1.9096039533615112} +03/05/2022 03:49:15 - INFO - codeparrot_training - Skipping example with length 127 (seq_length=1024) +03/05/2022 03:49:19 - INFO - codeparrot_training - Step 32637: {'lr': 0.000448970873747768, 'samples': 16710656, 'steps': 32637, 'loss/train': 1.9969711303710938} +03/05/2022 03:49:22 - INFO - codeparrot_training - Step 32638: {'lr': 0.0004489676607356288, 'samples': 16711168, 'steps': 32638, 'loss/train': 1.8620306253433228} +03/05/2022 03:49:23 - INFO - codeparrot_training - Skipping example with length 61 (seq_length=1024) +03/05/2022 03:49:28 - INFO - codeparrot_training - Step 32639: {'lr': 0.00044896444763383787, 'samples': 16711680, 'steps': 32639, 'loss/train': 1.1733413934707642} +03/05/2022 03:49:31 - INFO - codeparrot_training - Step 32640: {'lr': 0.00044896123444239654, 'samples': 16712192, 'steps': 32640, 'loss/train': 1.7918188571929932} +03/05/2022 03:49:32 - INFO - codeparrot_training - Skipping example with length 111 (seq_length=1024) +03/05/2022 03:49:36 - INFO - codeparrot_training - Step 32641: {'lr': 0.00044895802116130644, 'samples': 16712704, 'steps': 32641, 'loss/train': 1.6710946559906006} +03/05/2022 03:49:39 - INFO - codeparrot_training - Step 32642: {'lr': 0.0004489548077905689, 'samples': 16713216, 'steps': 32642, 'loss/train': 0.8930895328521729} +03/05/2022 03:49:41 - INFO - codeparrot_training - Skipping example with length 68 (seq_length=1024) +03/05/2022 03:49:45 - INFO - codeparrot_training - Step 32643: {'lr': 0.0004489515943301854, 'samples': 16713728, 'steps': 32643, 'loss/train': 1.493677020072937} +03/05/2022 03:49:48 - INFO - codeparrot_training - Step 32644: {'lr': 0.0004489483807801574, 'samples': 16714240, 'steps': 32644, 'loss/train': 2.630521774291992} +03/05/2022 03:49:49 - INFO - codeparrot_training - Skipping example with length 372 (seq_length=1024) +03/05/2022 03:49:53 - INFO - codeparrot_training - Step 32645: {'lr': 0.00044894516714048626, 'samples': 16714752, 'steps': 32645, 'loss/train': 1.6930238008499146} +03/05/2022 03:49:56 - INFO - codeparrot_training - Step 32646: {'lr': 0.0004489419534111736, 'samples': 16715264, 'steps': 32646, 'loss/train': 2.1759676933288574} +03/05/2022 03:49:58 - INFO - codeparrot_training - Skipping example with length 806 (seq_length=1024) +03/05/2022 03:50:02 - INFO - codeparrot_training - Step 32647: {'lr': 0.0004489387395922207, 'samples': 16715776, 'steps': 32647, 'loss/train': 1.4858109951019287} +03/05/2022 03:50:05 - INFO - codeparrot_training - Step 32648: {'lr': 0.00044893552568362903, 'samples': 16716288, 'steps': 32648, 'loss/train': 1.5872927904129028} +03/05/2022 03:50:06 - INFO - codeparrot_training - Skipping example with length 17 (seq_length=1024) +03/05/2022 03:50:10 - INFO - codeparrot_training - Step 32649: {'lr': 0.0004489323116854002, 'samples': 16716800, 'steps': 32649, 'loss/train': 1.7567414045333862} +03/05/2022 03:50:13 - INFO - codeparrot_training - Step 32650: {'lr': 0.00044892909759753545, 'samples': 16717312, 'steps': 32650, 'loss/train': 2.0136494636535645} +03/05/2022 03:50:15 - INFO - codeparrot_training - Skipping example with length 57 (seq_length=1024) +03/05/2022 03:50:18 - INFO - codeparrot_training - Step 32651: {'lr': 0.00044892588342003637, 'samples': 16717824, 'steps': 32651, 'loss/train': 2.0238683223724365} +03/05/2022 03:50:22 - INFO - codeparrot_training - Step 32652: {'lr': 0.00044892266915290435, 'samples': 16718336, 'steps': 32652, 'loss/train': 2.0528876781463623} +03/05/2022 03:50:23 - INFO - codeparrot_training - Skipping example with length 889 (seq_length=1024) +03/05/2022 03:50:27 - INFO - codeparrot_training - Step 32653: {'lr': 0.00044891945479614084, 'samples': 16718848, 'steps': 32653, 'loss/train': 2.0141665935516357} +03/05/2022 03:50:30 - INFO - codeparrot_training - Step 32654: {'lr': 0.00044891624034974726, 'samples': 16719360, 'steps': 32654, 'loss/train': 2.152963638305664} +03/05/2022 03:50:32 - INFO - codeparrot_training - Skipping example with length 633 (seq_length=1024) +03/05/2022 03:50:35 - INFO - codeparrot_training - Step 32655: {'lr': 0.00044891302581372513, 'samples': 16719872, 'steps': 32655, 'loss/train': 1.153235673904419} +03/05/2022 03:50:39 - INFO - codeparrot_training - Step 32656: {'lr': 0.00044890981118807585, 'samples': 16720384, 'steps': 32656, 'loss/train': 1.2853738069534302} +03/05/2022 03:50:40 - INFO - codeparrot_training - Skipping example with length 853 (seq_length=1024) +03/05/2022 03:50:44 - INFO - codeparrot_training - Step 32657: {'lr': 0.00044890659647280084, 'samples': 16720896, 'steps': 32657, 'loss/train': 2.67225980758667} +03/05/2022 03:50:47 - INFO - codeparrot_training - Step 32658: {'lr': 0.0004489033816679016, 'samples': 16721408, 'steps': 32658, 'loss/train': 0.6578690409660339} +03/05/2022 03:50:49 - INFO - codeparrot_training - Skipping example with length 93 (seq_length=1024) +03/05/2022 03:50:52 - INFO - codeparrot_training - Step 32659: {'lr': 0.0004489001667733796, 'samples': 16721920, 'steps': 32659, 'loss/train': 1.5650949478149414} +03/05/2022 03:50:55 - INFO - codeparrot_training - Step 32660: {'lr': 0.0004488969517892363, 'samples': 16722432, 'steps': 32660, 'loss/train': 2.210993528366089} +03/05/2022 03:50:57 - INFO - codeparrot_training - Skipping example with length 947 (seq_length=1024) +03/05/2022 03:51:01 - INFO - codeparrot_training - Step 32661: {'lr': 0.000448893736715473, 'samples': 16722944, 'steps': 32661, 'loss/train': 1.9084727764129639} +03/05/2022 03:51:04 - INFO - codeparrot_training - Step 32662: {'lr': 0.0004488905215520913, 'samples': 16723456, 'steps': 32662, 'loss/train': 2.1088318824768066} +03/05/2022 03:51:05 - INFO - codeparrot_training - Skipping example with length 235 (seq_length=1024) +03/05/2022 03:51:09 - INFO - codeparrot_training - Step 32663: {'lr': 0.00044888730629909256, 'samples': 16723968, 'steps': 32663, 'loss/train': 1.6365065574645996} +03/05/2022 03:51:12 - INFO - codeparrot_training - Step 32664: {'lr': 0.00044888409095647833, 'samples': 16724480, 'steps': 32664, 'loss/train': 2.3002421855926514} +03/05/2022 03:51:13 - INFO - codeparrot_training - Skipping example with length 997 (seq_length=1024) +03/05/2022 03:51:18 - INFO - codeparrot_training - Step 32665: {'lr': 0.00044888087552424997, 'samples': 16724992, 'steps': 32665, 'loss/train': 3.2875540256500244} +03/05/2022 03:51:21 - INFO - codeparrot_training - Step 32666: {'lr': 0.00044887766000240893, 'samples': 16725504, 'steps': 32666, 'loss/train': 1.6707509756088257} +03/05/2022 03:51:22 - INFO - codeparrot_training - Skipping example with length 192 (seq_length=1024) +03/05/2022 03:51:26 - INFO - codeparrot_training - Step 32667: {'lr': 0.0004488744443909567, 'samples': 16726016, 'steps': 32667, 'loss/train': 1.344260573387146} +03/05/2022 03:51:29 - INFO - codeparrot_training - Step 32668: {'lr': 0.0004488712286898947, 'samples': 16726528, 'steps': 32668, 'loss/train': 0.09129302948713303} +03/05/2022 03:51:31 - INFO - codeparrot_training - Skipping example with length 197 (seq_length=1024) +03/05/2022 03:51:35 - INFO - codeparrot_training - Step 32669: {'lr': 0.0004488680128992244, 'samples': 16727040, 'steps': 32669, 'loss/train': 1.31582772731781} +03/05/2022 03:51:38 - INFO - codeparrot_training - Step 32670: {'lr': 0.00044886479701894736, 'samples': 16727552, 'steps': 32670, 'loss/train': 1.8459174633026123} +03/05/2022 03:51:40 - INFO - codeparrot_training - Skipping example with length 569 (seq_length=1024) +03/05/2022 03:51:43 - INFO - codeparrot_training - Step 32671: {'lr': 0.00044886158104906476, 'samples': 16728064, 'steps': 32671, 'loss/train': 1.97783362865448} +03/05/2022 03:51:46 - INFO - codeparrot_training - Step 32672: {'lr': 0.0004488583649895782, 'samples': 16728576, 'steps': 32672, 'loss/train': 1.5821096897125244} +03/05/2022 03:51:48 - INFO - codeparrot_training - Skipping example with length 649 (seq_length=1024) +03/05/2022 03:51:52 - INFO - codeparrot_training - Step 32673: {'lr': 0.00044885514884048926, 'samples': 16729088, 'steps': 32673, 'loss/train': 1.4637360572814941} +03/05/2022 03:51:55 - INFO - codeparrot_training - Step 32674: {'lr': 0.0004488519326017991, 'samples': 16729600, 'steps': 32674, 'loss/train': 1.3454618453979492} +03/05/2022 03:51:57 - INFO - codeparrot_training - Skipping example with length 842 (seq_length=1024) +03/05/2022 03:52:00 - INFO - codeparrot_training - Step 32675: {'lr': 0.0004488487162735094, 'samples': 16730112, 'steps': 32675, 'loss/train': 2.1471030712127686} +03/05/2022 03:52:03 - INFO - codeparrot_training - Step 32676: {'lr': 0.00044884549985562165, 'samples': 16730624, 'steps': 32676, 'loss/train': 1.0928417444229126} +03/05/2022 03:52:05 - INFO - codeparrot_training - Skipping example with length 519 (seq_length=1024) +03/05/2022 03:52:08 - INFO - codeparrot_training - Step 32677: {'lr': 0.000448842283348137, 'samples': 16731136, 'steps': 32677, 'loss/train': 2.022397518157959} +03/05/2022 03:52:12 - INFO - codeparrot_training - Step 32678: {'lr': 0.0004488390667510572, 'samples': 16731648, 'steps': 32678, 'loss/train': 1.9457756280899048} +03/05/2022 03:52:13 - INFO - codeparrot_training - Skipping example with length 902 (seq_length=1024) +03/05/2022 03:52:17 - INFO - codeparrot_training - Step 32679: {'lr': 0.00044883585006438354, 'samples': 16732160, 'steps': 32679, 'loss/train': 1.6074765920639038} +03/05/2022 03:52:20 - INFO - codeparrot_training - Step 32680: {'lr': 0.0004488326332881175, 'samples': 16732672, 'steps': 32680, 'loss/train': 1.228408694267273} +03/05/2022 03:52:23 - INFO - codeparrot_training - Skipping example with length 35 (seq_length=1024) +03/05/2022 03:52:26 - INFO - codeparrot_training - Step 32681: {'lr': 0.0004488294164222606, 'samples': 16733184, 'steps': 32681, 'loss/train': 1.343674659729004} +03/05/2022 03:52:29 - INFO - codeparrot_training - Step 32682: {'lr': 0.0004488261994668142, 'samples': 16733696, 'steps': 32682, 'loss/train': 2.043595314025879} +03/05/2022 03:52:31 - INFO - codeparrot_training - Skipping example with length 607 (seq_length=1024) +03/05/2022 03:52:34 - INFO - codeparrot_training - Step 32683: {'lr': 0.00044882298242177976, 'samples': 16734208, 'steps': 32683, 'loss/train': 1.8504143953323364} +03/05/2022 03:52:37 - INFO - codeparrot_training - Step 32684: {'lr': 0.00044881976528715877, 'samples': 16734720, 'steps': 32684, 'loss/train': 1.6843420267105103} +03/05/2022 03:52:40 - INFO - codeparrot_training - Skipping example with length 538 (seq_length=1024) +03/05/2022 03:52:42 - INFO - codeparrot_training - Step 32685: {'lr': 0.0004488165480629527, 'samples': 16735232, 'steps': 32685, 'loss/train': 2.2880945205688477} +03/05/2022 03:52:46 - INFO - codeparrot_training - Step 32686: {'lr': 0.00044881333074916287, 'samples': 16735744, 'steps': 32686, 'loss/train': 2.1325109004974365} +03/05/2022 03:52:48 - INFO - codeparrot_training - Skipping example with length 968 (seq_length=1024) +03/05/2022 03:52:51 - INFO - codeparrot_training - Step 32687: {'lr': 0.00044881011334579093, 'samples': 16736256, 'steps': 32687, 'loss/train': 1.9747942686080933} +03/05/2022 03:52:54 - INFO - codeparrot_training - Step 32688: {'lr': 0.0004488068958528382, 'samples': 16736768, 'steps': 32688, 'loss/train': 0.12265545129776001} +03/05/2022 03:52:57 - INFO - codeparrot_training - Skipping example with length 896 (seq_length=1024) +03/05/2022 03:52:59 - INFO - codeparrot_training - Step 32689: {'lr': 0.0004488036782703061, 'samples': 16737280, 'steps': 32689, 'loss/train': 2.0384621620178223} +03/05/2022 03:53:03 - INFO - codeparrot_training - Step 32690: {'lr': 0.00044880046059819615, 'samples': 16737792, 'steps': 32690, 'loss/train': 1.7089682817459106} +03/05/2022 03:53:05 - INFO - codeparrot_training - Skipping example with length 512 (seq_length=1024) +03/05/2022 03:53:08 - INFO - codeparrot_training - Step 32691: {'lr': 0.00044879724283650976, 'samples': 16738304, 'steps': 32691, 'loss/train': 1.405125379562378} +03/05/2022 03:53:11 - INFO - codeparrot_training - Step 32692: {'lr': 0.0004487940249852484, 'samples': 16738816, 'steps': 32692, 'loss/train': 1.1829493045806885} +03/05/2022 03:53:13 - INFO - codeparrot_training - Skipping example with length 710 (seq_length=1024) +03/05/2022 03:53:17 - INFO - codeparrot_training - Step 32693: {'lr': 0.0004487908070444136, 'samples': 16739328, 'steps': 32693, 'loss/train': 1.746406078338623} +03/05/2022 03:53:20 - INFO - codeparrot_training - Step 32694: {'lr': 0.00044878758901400665, 'samples': 16739840, 'steps': 32694, 'loss/train': 1.3655046224594116} +03/05/2022 03:53:22 - INFO - codeparrot_training - Skipping example with length 760 (seq_length=1024) +03/05/2022 03:53:25 - INFO - codeparrot_training - Step 32695: {'lr': 0.00044878437089402906, 'samples': 16740352, 'steps': 32695, 'loss/train': 1.2845758199691772} +03/05/2022 03:53:28 - INFO - codeparrot_training - Step 32696: {'lr': 0.0004487811526844824, 'samples': 16740864, 'steps': 32696, 'loss/train': 2.1204659938812256} +03/05/2022 03:53:30 - INFO - codeparrot_training - Skipping example with length 459 (seq_length=1024) +03/05/2022 03:53:33 - INFO - codeparrot_training - Step 32697: {'lr': 0.0004487779343853679, 'samples': 16741376, 'steps': 32697, 'loss/train': 1.5406386852264404} +03/05/2022 03:53:37 - INFO - codeparrot_training - Step 32698: {'lr': 0.00044877471599668716, 'samples': 16741888, 'steps': 32698, 'loss/train': 1.820219874382019} +03/05/2022 03:53:39 - INFO - codeparrot_training - Skipping example with length 627 (seq_length=1024) +03/05/2022 03:53:42 - INFO - codeparrot_training - Step 32699: {'lr': 0.00044877149751844164, 'samples': 16742400, 'steps': 32699, 'loss/train': 1.6553469896316528} +03/05/2022 03:53:45 - INFO - codeparrot_training - Step 32700: {'lr': 0.00044876827895063277, 'samples': 16742912, 'steps': 32700, 'loss/train': 0.047965291887521744} +03/05/2022 03:53:47 - INFO - codeparrot_training - Skipping example with length 685 (seq_length=1024) +03/05/2022 03:53:50 - INFO - codeparrot_training - Step 32701: {'lr': 0.0004487650602932619, 'samples': 16743424, 'steps': 32701, 'loss/train': 2.5701000690460205} +03/05/2022 03:53:54 - INFO - codeparrot_training - Step 32702: {'lr': 0.00044876184154633066, 'samples': 16743936, 'steps': 32702, 'loss/train': 1.9226176738739014} +03/05/2022 03:53:56 - INFO - codeparrot_training - Skipping example with length 21 (seq_length=1024) +03/05/2022 03:53:59 - INFO - codeparrot_training - Step 32703: {'lr': 0.00044875862270984035, 'samples': 16744448, 'steps': 32703, 'loss/train': 1.3878147602081299} +03/05/2022 03:54:02 - INFO - codeparrot_training - Step 32704: {'lr': 0.0004487554037837925, 'samples': 16744960, 'steps': 32704, 'loss/train': 1.6687870025634766} +03/05/2022 03:54:04 - INFO - codeparrot_training - Skipping example with length 357 (seq_length=1024) +03/05/2022 03:54:07 - INFO - codeparrot_training - Step 32705: {'lr': 0.00044875218476818845, 'samples': 16745472, 'steps': 32705, 'loss/train': 0.13286301493644714} +03/05/2022 03:54:11 - INFO - codeparrot_training - Step 32706: {'lr': 0.0004487489656630298, 'samples': 16745984, 'steps': 32706, 'loss/train': 2.061570882797241} +03/05/2022 03:54:12 - INFO - codeparrot_training - Skipping example with length 373 (seq_length=1024) +03/05/2022 03:54:16 - INFO - codeparrot_training - Step 32707: {'lr': 0.00044874574646831794, 'samples': 16746496, 'steps': 32707, 'loss/train': 1.7554301023483276} +03/05/2022 03:54:19 - INFO - codeparrot_training - Step 32708: {'lr': 0.0004487425271840543, 'samples': 16747008, 'steps': 32708, 'loss/train': 1.3654509782791138} +03/05/2022 03:54:20 - INFO - codeparrot_training - Skipping example with length 999 (seq_length=1024) +03/05/2022 03:54:24 - INFO - codeparrot_training - Step 32709: {'lr': 0.0004487393078102403, 'samples': 16747520, 'steps': 32709, 'loss/train': 1.493709921836853} +03/05/2022 03:54:27 - INFO - codeparrot_training - Step 32710: {'lr': 0.00044873608834687754, 'samples': 16748032, 'steps': 32710, 'loss/train': 2.0046284198760986} +03/05/2022 03:54:29 - INFO - codeparrot_training - Skipping example with length 767 (seq_length=1024) +03/05/2022 03:54:33 - INFO - codeparrot_training - Step 32711: {'lr': 0.00044873286879396724, 'samples': 16748544, 'steps': 32711, 'loss/train': 1.7019821405410767} +03/05/2022 03:54:36 - INFO - codeparrot_training - Step 32712: {'lr': 0.00044872964915151106, 'samples': 16749056, 'steps': 32712, 'loss/train': 1.5509377717971802} +03/05/2022 03:54:37 - INFO - codeparrot_training - Skipping example with length 256 (seq_length=1024) +03/05/2022 03:54:41 - INFO - codeparrot_training - Step 32713: {'lr': 0.00044872642941951035, 'samples': 16749568, 'steps': 32713, 'loss/train': 2.696380138397217} +03/05/2022 03:54:44 - INFO - codeparrot_training - Step 32714: {'lr': 0.0004487232095979666, 'samples': 16750080, 'steps': 32714, 'loss/train': 1.6360069513320923} +03/05/2022 03:54:46 - INFO - codeparrot_training - Skipping example with length 373 (seq_length=1024) +03/05/2022 03:54:50 - INFO - codeparrot_training - Step 32715: {'lr': 0.0004487199896868812, 'samples': 16750592, 'steps': 32715, 'loss/train': 1.5997015237808228} +03/05/2022 03:54:53 - INFO - codeparrot_training - Step 32716: {'lr': 0.00044871676968625564, 'samples': 16751104, 'steps': 32716, 'loss/train': 1.1536569595336914} +03/05/2022 03:54:54 - INFO - codeparrot_training - Skipping example with length 368 (seq_length=1024) +03/05/2022 03:54:58 - INFO - codeparrot_training - Step 32717: {'lr': 0.00044871354959609135, 'samples': 16751616, 'steps': 32717, 'loss/train': 1.2594804763793945} +03/05/2022 03:55:01 - INFO - codeparrot_training - Step 32718: {'lr': 0.00044871032941638984, 'samples': 16752128, 'steps': 32718, 'loss/train': 1.242711067199707} +03/05/2022 03:55:02 - INFO - codeparrot_training - Skipping example with length 689 (seq_length=1024) +03/05/2022 03:55:06 - INFO - codeparrot_training - Step 32719: {'lr': 0.00044870710914715254, 'samples': 16752640, 'steps': 32719, 'loss/train': 2.034914255142212} +03/05/2022 03:55:09 - INFO - codeparrot_training - Step 32720: {'lr': 0.00044870388878838084, 'samples': 16753152, 'steps': 32720, 'loss/train': 1.8568755388259888} +03/05/2022 03:55:11 - INFO - codeparrot_training - Skipping example with length 471 (seq_length=1024) +03/05/2022 03:55:15 - INFO - codeparrot_training - Step 32721: {'lr': 0.00044870066834007627, 'samples': 16753664, 'steps': 32721, 'loss/train': 1.9558056592941284} +03/05/2022 03:55:18 - INFO - codeparrot_training - Step 32722: {'lr': 0.0004486974478022402, 'samples': 16754176, 'steps': 32722, 'loss/train': 2.210042715072632} +03/05/2022 03:55:19 - INFO - codeparrot_training - Skipping example with length 310 (seq_length=1024) +03/05/2022 03:55:23 - INFO - codeparrot_training - Step 32723: {'lr': 0.0004486942271748742, 'samples': 16754688, 'steps': 32723, 'loss/train': 2.743617296218872} +03/05/2022 03:55:26 - INFO - codeparrot_training - Step 32724: {'lr': 0.0004486910064579796, 'samples': 16755200, 'steps': 32724, 'loss/train': 1.5356628894805908} +03/05/2022 03:55:27 - INFO - codeparrot_training - Skipping example with length 117 (seq_length=1024) +03/05/2022 03:55:32 - INFO - codeparrot_training - Step 32725: {'lr': 0.00044868778565155783, 'samples': 16755712, 'steps': 32725, 'loss/train': 1.792995810508728} +03/05/2022 03:55:35 - INFO - codeparrot_training - Step 32726: {'lr': 0.00044868456475561047, 'samples': 16756224, 'steps': 32726, 'loss/train': 1.8955814838409424} +03/05/2022 03:55:36 - INFO - codeparrot_training - Skipping example with length 458 (seq_length=1024) +03/05/2022 03:55:40 - INFO - codeparrot_training - Step 32727: {'lr': 0.0004486813437701389, 'samples': 16756736, 'steps': 32727, 'loss/train': 1.643625020980835} +03/05/2022 03:55:43 - INFO - codeparrot_training - Step 32728: {'lr': 0.0004486781226951446, 'samples': 16757248, 'steps': 32728, 'loss/train': 2.0542855262756348} +03/05/2022 03:55:44 - INFO - codeparrot_training - Skipping example with length 259 (seq_length=1024) +03/05/2022 03:55:48 - INFO - codeparrot_training - Step 32729: {'lr': 0.000448674901530629, 'samples': 16757760, 'steps': 32729, 'loss/train': 1.3662149906158447} +03/05/2022 03:55:52 - INFO - codeparrot_training - Step 32730: {'lr': 0.00044867168027659356, 'samples': 16758272, 'steps': 32730, 'loss/train': 1.1919394731521606} +03/05/2022 03:55:52 - INFO - codeparrot_training - Skipping example with length 308 (seq_length=1024) +03/05/2022 03:55:57 - INFO - codeparrot_training - Step 32731: {'lr': 0.00044866845893303973, 'samples': 16758784, 'steps': 32731, 'loss/train': 0.7135829925537109} +03/05/2022 03:56:00 - INFO - codeparrot_training - Step 32732: {'lr': 0.00044866523749996897, 'samples': 16759296, 'steps': 32732, 'loss/train': 1.944987177848816} +03/05/2022 03:56:02 - INFO - codeparrot_training - Skipping example with length 432 (seq_length=1024) +03/05/2022 03:56:06 - INFO - codeparrot_training - Step 32733: {'lr': 0.0004486620159773827, 'samples': 16759808, 'steps': 32733, 'loss/train': 2.688162088394165} +03/05/2022 03:56:09 - INFO - codeparrot_training - Step 32734: {'lr': 0.0004486587943652823, 'samples': 16760320, 'steps': 32734, 'loss/train': 1.6266406774520874} +03/05/2022 03:56:11 - INFO - codeparrot_training - Skipping example with length 667 (seq_length=1024) +03/05/2022 03:56:14 - INFO - codeparrot_training - Step 32735: {'lr': 0.00044865557266366953, 'samples': 16760832, 'steps': 32735, 'loss/train': 1.9560359716415405} +03/05/2022 03:56:17 - INFO - codeparrot_training - Step 32736: {'lr': 0.0004486523508725454, 'samples': 16761344, 'steps': 32736, 'loss/train': 1.807797908782959} +03/05/2022 03:56:19 - INFO - codeparrot_training - Skipping example with length 308 (seq_length=1024) +03/05/2022 03:56:23 - INFO - codeparrot_training - Step 32737: {'lr': 0.00044864912899191174, 'samples': 16761856, 'steps': 32737, 'loss/train': 3.4237112998962402} +03/05/2022 03:56:26 - INFO - codeparrot_training - Step 32738: {'lr': 0.00044864590702176977, 'samples': 16762368, 'steps': 32738, 'loss/train': 2.1485090255737305} +03/05/2022 03:56:28 - INFO - codeparrot_training - Skipping example with length 552 (seq_length=1024) +03/05/2022 03:56:31 - INFO - codeparrot_training - Step 32739: {'lr': 0.000448642684962121, 'samples': 16762880, 'steps': 32739, 'loss/train': 1.5788065195083618} +03/05/2022 03:56:34 - INFO - codeparrot_training - Step 32740: {'lr': 0.000448639462812967, 'samples': 16763392, 'steps': 32740, 'loss/train': 1.4504294395446777} +03/05/2022 03:56:36 - INFO - codeparrot_training - Skipping example with length 469 (seq_length=1024) +03/05/2022 03:56:40 - INFO - codeparrot_training - Step 32741: {'lr': 0.0004486362405743091, 'samples': 16763904, 'steps': 32741, 'loss/train': 1.064976453781128} +03/05/2022 03:56:43 - INFO - codeparrot_training - Step 32742: {'lr': 0.0004486330182461487, 'samples': 16764416, 'steps': 32742, 'loss/train': 1.6573737859725952} +03/05/2022 03:56:45 - INFO - codeparrot_training - Skipping example with length 60 (seq_length=1024) +03/05/2022 03:56:48 - INFO - codeparrot_training - Step 32743: {'lr': 0.0004486297958284874, 'samples': 16764928, 'steps': 32743, 'loss/train': 1.679376482963562} +03/05/2022 03:56:51 - INFO - codeparrot_training - Step 32744: {'lr': 0.0004486265733213265, 'samples': 16765440, 'steps': 32744, 'loss/train': 1.9473892450332642} +03/05/2022 03:56:53 - INFO - codeparrot_training - Skipping example with length 603 (seq_length=1024) +03/05/2022 03:56:56 - INFO - codeparrot_training - Step 32745: {'lr': 0.00044862335072466767, 'samples': 16765952, 'steps': 32745, 'loss/train': 1.3998804092407227} +03/05/2022 03:57:00 - INFO - codeparrot_training - Step 32746: {'lr': 0.00044862012803851203, 'samples': 16766464, 'steps': 32746, 'loss/train': 1.9323163032531738} +03/05/2022 03:57:01 - INFO - codeparrot_training - Skipping example with length 974 (seq_length=1024) +03/05/2022 03:57:05 - INFO - codeparrot_training - Step 32747: {'lr': 0.00044861690526286135, 'samples': 16766976, 'steps': 32747, 'loss/train': 1.2599306106567383} +03/05/2022 03:57:09 - INFO - codeparrot_training - Step 32748: {'lr': 0.00044861368239771694, 'samples': 16767488, 'steps': 32748, 'loss/train': 2.1158111095428467} +03/05/2022 03:57:10 - INFO - codeparrot_training - Skipping example with length 449 (seq_length=1024) +03/05/2022 03:57:14 - INFO - codeparrot_training - Step 32749: {'lr': 0.00044861045944308026, 'samples': 16768000, 'steps': 32749, 'loss/train': 1.5830293893814087} +03/05/2022 03:57:17 - INFO - codeparrot_training - Step 32750: {'lr': 0.0004486072363989528, 'samples': 16768512, 'steps': 32750, 'loss/train': 0.0596163235604763} +03/05/2022 03:57:19 - INFO - codeparrot_training - Skipping example with length 783 (seq_length=1024) +03/05/2022 03:57:22 - INFO - codeparrot_training - Step 32751: {'lr': 0.00044860401326533595, 'samples': 16769024, 'steps': 32751, 'loss/train': 1.6744040250778198} +03/05/2022 03:57:25 - INFO - codeparrot_training - Step 32752: {'lr': 0.0004486007900422312, 'samples': 16769536, 'steps': 32752, 'loss/train': 2.0595200061798096} +03/05/2022 03:57:27 - INFO - codeparrot_training - Skipping example with length 104 (seq_length=1024) +03/05/2022 03:57:31 - INFO - codeparrot_training - Step 32753: {'lr': 0.00044859756672964, 'samples': 16770048, 'steps': 32753, 'loss/train': 1.6305497884750366} +03/05/2022 03:57:34 - INFO - codeparrot_training - Step 32754: {'lr': 0.00044859434332756383, 'samples': 16770560, 'steps': 32754, 'loss/train': 2.1313297748565674} +03/05/2022 03:57:36 - INFO - codeparrot_training - Skipping example with length 542 (seq_length=1024) +03/05/2022 03:57:39 - INFO - codeparrot_training - Step 32755: {'lr': 0.0004485911198360041, 'samples': 16771072, 'steps': 32755, 'loss/train': 1.8246662616729736} +03/05/2022 03:57:42 - INFO - codeparrot_training - Step 32756: {'lr': 0.0004485878962549622, 'samples': 16771584, 'steps': 32756, 'loss/train': 1.6334152221679688} +03/05/2022 03:57:44 - INFO - codeparrot_training - Skipping example with length 410 (seq_length=1024) +03/05/2022 03:57:48 - INFO - codeparrot_training - Step 32757: {'lr': 0.0004485846725844398, 'samples': 16772096, 'steps': 32757, 'loss/train': 2.1353466510772705} +03/05/2022 03:57:51 - INFO - codeparrot_training - Step 32758: {'lr': 0.0004485814488244381, 'samples': 16772608, 'steps': 32758, 'loss/train': 1.4135867357254028} +03/05/2022 03:57:53 - INFO - codeparrot_training - Skipping example with length 298 (seq_length=1024) +03/05/2022 03:57:56 - INFO - codeparrot_training - Step 32759: {'lr': 0.0004485782249749587, 'samples': 16773120, 'steps': 32759, 'loss/train': 1.8091596364974976} +03/05/2022 03:57:59 - INFO - codeparrot_training - Step 32760: {'lr': 0.00044857500103600304, 'samples': 16773632, 'steps': 32760, 'loss/train': 2.317765235900879} +03/05/2022 03:58:01 - INFO - codeparrot_training - Skipping example with length 854 (seq_length=1024) +03/05/2022 03:58:05 - INFO - codeparrot_training - Step 32761: {'lr': 0.00044857177700757247, 'samples': 16774144, 'steps': 32761, 'loss/train': 1.1527115106582642} +03/05/2022 03:58:08 - INFO - codeparrot_training - Step 32762: {'lr': 0.00044856855288966856, 'samples': 16774656, 'steps': 32762, 'loss/train': 1.5814310312271118} +03/05/2022 03:58:09 - INFO - codeparrot_training - Skipping example with length 581 (seq_length=1024) +03/05/2022 03:58:13 - INFO - codeparrot_training - Step 32763: {'lr': 0.0004485653286822927, 'samples': 16775168, 'steps': 32763, 'loss/train': 0.9628899097442627} +03/05/2022 03:58:16 - INFO - codeparrot_training - Step 32764: {'lr': 0.0004485621043854465, 'samples': 16775680, 'steps': 32764, 'loss/train': 1.5995169878005981} +03/05/2022 03:58:17 - INFO - codeparrot_training - Skipping example with length 348 (seq_length=1024) +03/05/2022 03:58:21 - INFO - codeparrot_training - Step 32765: {'lr': 0.0004485588799991311, 'samples': 16776192, 'steps': 32765, 'loss/train': 1.2330594062805176} +03/05/2022 03:58:25 - INFO - codeparrot_training - Step 32766: {'lr': 0.0004485556555233483, 'samples': 16776704, 'steps': 32766, 'loss/train': 1.987736701965332} +03/05/2022 03:58:26 - INFO - codeparrot_training - Skipping example with length 872 (seq_length=1024) +03/05/2022 03:58:30 - INFO - codeparrot_training - Step 32767: {'lr': 0.0004485524309580993, 'samples': 16777216, 'steps': 32767, 'loss/train': 2.2815704345703125} +03/05/2022 03:58:33 - INFO - codeparrot_training - Step 32768: {'lr': 0.0004485492063033856, 'samples': 16777728, 'steps': 32768, 'loss/train': 0.10674573481082916} +03/05/2022 03:58:35 - INFO - codeparrot_training - Skipping example with length 998 (seq_length=1024) +03/05/2022 03:58:38 - INFO - codeparrot_training - Step 32769: {'lr': 0.0004485459815592087, 'samples': 16778240, 'steps': 32769, 'loss/train': 1.229867696762085} +03/05/2022 03:58:42 - INFO - codeparrot_training - Step 32770: {'lr': 0.0004485427567255701, 'samples': 16778752, 'steps': 32770, 'loss/train': 2.820906400680542} +03/05/2022 03:58:43 - INFO - codeparrot_training - Skipping example with length 913 (seq_length=1024) +03/05/2022 03:58:47 - INFO - codeparrot_training - Step 32771: {'lr': 0.0004485395318024712, 'samples': 16779264, 'steps': 32771, 'loss/train': 1.6190396547317505} +03/05/2022 03:58:50 - INFO - codeparrot_training - Step 32772: {'lr': 0.00044853630678991344, 'samples': 16779776, 'steps': 32772, 'loss/train': 1.6512805223464966} +03/05/2022 03:58:51 - INFO - codeparrot_training - Skipping example with length 929 (seq_length=1024) +03/05/2022 03:58:55 - INFO - codeparrot_training - Step 32773: {'lr': 0.00044853308168789824, 'samples': 16780288, 'steps': 32773, 'loss/train': 1.3366000652313232} +03/05/2022 03:58:58 - INFO - codeparrot_training - Step 32774: {'lr': 0.00044852985649642714, 'samples': 16780800, 'steps': 32774, 'loss/train': 1.9807907342910767} +03/05/2022 03:58:59 - INFO - codeparrot_training - Skipping example with length 978 (seq_length=1024) +03/05/2022 03:59:04 - INFO - codeparrot_training - Step 32775: {'lr': 0.0004485266312155015, 'samples': 16781312, 'steps': 32775, 'loss/train': 2.06160044670105} +03/05/2022 03:59:07 - INFO - codeparrot_training - Step 32776: {'lr': 0.00044852340584512285, 'samples': 16781824, 'steps': 32776, 'loss/train': 1.2140681743621826} +03/05/2022 03:59:08 - INFO - codeparrot_training - Skipping example with length 382 (seq_length=1024) +03/05/2022 03:59:12 - INFO - codeparrot_training - Step 32777: {'lr': 0.00044852018038529264, 'samples': 16782336, 'steps': 32777, 'loss/train': 1.6866059303283691} +03/05/2022 03:59:16 - INFO - codeparrot_training - Step 32778: {'lr': 0.00044851695483601227, 'samples': 16782848, 'steps': 32778, 'loss/train': 1.1241260766983032} +03/05/2022 03:59:16 - INFO - codeparrot_training - Skipping example with length 54 (seq_length=1024) +03/05/2022 03:59:21 - INFO - codeparrot_training - Step 32779: {'lr': 0.0004485137291972833, 'samples': 16783360, 'steps': 32779, 'loss/train': 1.7784221172332764} +03/05/2022 03:59:24 - INFO - codeparrot_training - Step 32780: {'lr': 0.00044851050346910706, 'samples': 16783872, 'steps': 32780, 'loss/train': 2.2918736934661865} +03/05/2022 03:59:25 - INFO - codeparrot_training - Skipping example with length 271 (seq_length=1024) +03/05/2022 03:59:29 - INFO - codeparrot_training - Step 32781: {'lr': 0.00044850727765148504, 'samples': 16784384, 'steps': 32781, 'loss/train': 1.7876278162002563} +03/05/2022 03:59:33 - INFO - codeparrot_training - Step 32782: {'lr': 0.00044850405174441866, 'samples': 16784896, 'steps': 32782, 'loss/train': 1.8087859153747559} +03/05/2022 03:59:34 - INFO - codeparrot_training - Skipping example with length 724 (seq_length=1024) +03/05/2022 03:59:38 - INFO - codeparrot_training - Step 32783: {'lr': 0.00044850082574790945, 'samples': 16785408, 'steps': 32783, 'loss/train': 2.3987033367156982} +03/05/2022 03:59:41 - INFO - codeparrot_training - Step 32784: {'lr': 0.0004484975996619589, 'samples': 16785920, 'steps': 32784, 'loss/train': 2.1207242012023926} +03/05/2022 03:59:42 - INFO - codeparrot_training - Skipping example with length 621 (seq_length=1024) +03/05/2022 03:59:46 - INFO - codeparrot_training - Step 32785: {'lr': 0.0004484943734865683, 'samples': 16786432, 'steps': 32785, 'loss/train': 2.3311638832092285} +03/05/2022 03:59:49 - INFO - codeparrot_training - Step 32786: {'lr': 0.0004484911472217392, 'samples': 16786944, 'steps': 32786, 'loss/train': 2.0124664306640625} +03/05/2022 03:59:50 - INFO - codeparrot_training - Skipping example with length 509 (seq_length=1024) +03/05/2022 03:59:55 - INFO - codeparrot_training - Step 32787: {'lr': 0.0004484879208674731, 'samples': 16787456, 'steps': 32787, 'loss/train': 2.211538314819336} +03/05/2022 03:59:58 - INFO - codeparrot_training - Step 32788: {'lr': 0.0004484846944237714, 'samples': 16787968, 'steps': 32788, 'loss/train': 1.4898900985717773} +03/05/2022 03:59:59 - INFO - codeparrot_training - Skipping example with length 414 (seq_length=1024) +03/05/2022 04:00:03 - INFO - codeparrot_training - Step 32789: {'lr': 0.0004484814678906355, 'samples': 16788480, 'steps': 32789, 'loss/train': 1.68108332157135} +03/05/2022 04:00:06 - INFO - codeparrot_training - Step 32790: {'lr': 0.00044847824126806703, 'samples': 16788992, 'steps': 32790, 'loss/train': 1.9250514507293701} +03/05/2022 04:00:07 - INFO - codeparrot_training - Skipping example with length 744 (seq_length=1024) +03/05/2022 04:00:12 - INFO - codeparrot_training - Step 32791: {'lr': 0.0004484750145560672, 'samples': 16789504, 'steps': 32791, 'loss/train': 5.070474624633789} +03/05/2022 04:00:15 - INFO - codeparrot_training - Step 32792: {'lr': 0.0004484717877546377, 'samples': 16790016, 'steps': 32792, 'loss/train': 2.026045322418213} +03/05/2022 04:00:17 - INFO - codeparrot_training - Skipping example with length 10 (seq_length=1024) +03/05/2022 04:00:20 - INFO - codeparrot_training - Step 32793: {'lr': 0.0004484685608637798, 'samples': 16790528, 'steps': 32793, 'loss/train': 2.200256109237671} +03/05/2022 04:00:23 - INFO - codeparrot_training - Step 32794: {'lr': 0.00044846533388349507, 'samples': 16791040, 'steps': 32794, 'loss/train': 2.316960573196411} +03/05/2022 04:00:25 - INFO - codeparrot_training - Skipping example with length 29 (seq_length=1024) +03/05/2022 04:00:29 - INFO - codeparrot_training - Step 32795: {'lr': 0.00044846210681378487, 'samples': 16791552, 'steps': 32795, 'loss/train': 3.859579086303711} +03/05/2022 04:00:32 - INFO - codeparrot_training - Step 32796: {'lr': 0.00044845887965465076, 'samples': 16792064, 'steps': 32796, 'loss/train': 1.2751544713974} +03/05/2022 04:00:34 - INFO - codeparrot_training - Skipping example with length 368 (seq_length=1024) +03/05/2022 04:00:37 - INFO - codeparrot_training - Step 32797: {'lr': 0.0004484556524060941, 'samples': 16792576, 'steps': 32797, 'loss/train': 2.0813605785369873} +03/05/2022 04:00:41 - INFO - codeparrot_training - Step 32798: {'lr': 0.00044845242506811646, 'samples': 16793088, 'steps': 32798, 'loss/train': 1.368618130683899} +03/05/2022 04:00:44 - INFO - codeparrot_training - Step 32799: {'lr': 0.0004484491976407192, 'samples': 16793600, 'steps': 32799, 'loss/train': 1.979921579360962} +03/05/2022 04:00:44 - INFO - codeparrot_training - Skipping example with length 243 (seq_length=1024) +03/05/2022 04:00:49 - INFO - codeparrot_training - Step 32800: {'lr': 0.00044844597012390374, 'samples': 16794112, 'steps': 32800, 'loss/train': 1.2909562587738037} +03/05/2022 04:00:52 - INFO - codeparrot_training - Step 32801: {'lr': 0.0004484427425176716, 'samples': 16794624, 'steps': 32801, 'loss/train': 1.80970299243927} +03/05/2022 04:00:52 - INFO - codeparrot_training - Skipping example with length 194 (seq_length=1024) +03/05/2022 04:00:57 - INFO - codeparrot_training - Step 32802: {'lr': 0.0004484395148220243, 'samples': 16795136, 'steps': 32802, 'loss/train': 1.514662504196167} +03/05/2022 04:01:01 - INFO - codeparrot_training - Step 32803: {'lr': 0.000448436287036963, 'samples': 16795648, 'steps': 32803, 'loss/train': 2.1822876930236816} +03/05/2022 04:01:01 - INFO - codeparrot_training - Skipping example with length 282 (seq_length=1024) +03/05/2022 04:01:06 - INFO - codeparrot_training - Step 32804: {'lr': 0.0004484330591624896, 'samples': 16796160, 'steps': 32804, 'loss/train': 1.836177945137024} +03/05/2022 04:01:09 - INFO - codeparrot_training - Step 32805: {'lr': 0.00044842983119860525, 'samples': 16796672, 'steps': 32805, 'loss/train': 2.757866144180298} +03/05/2022 04:01:10 - INFO - codeparrot_training - Skipping example with length 509 (seq_length=1024) +03/05/2022 04:01:14 - INFO - codeparrot_training - Step 32806: {'lr': 0.00044842660314531145, 'samples': 16797184, 'steps': 32806, 'loss/train': 2.1904819011688232} +03/05/2022 04:01:18 - INFO - codeparrot_training - Step 32807: {'lr': 0.0004484233750026098, 'samples': 16797696, 'steps': 32807, 'loss/train': 1.824310064315796} +03/05/2022 04:01:18 - INFO - codeparrot_training - Skipping example with length 13 (seq_length=1024) +03/05/2022 04:01:23 - INFO - codeparrot_training - Step 32808: {'lr': 0.00044842014677050145, 'samples': 16798208, 'steps': 32808, 'loss/train': 2.2862887382507324} +03/05/2022 04:01:26 - INFO - codeparrot_training - Step 32809: {'lr': 0.0004484169184489882, 'samples': 16798720, 'steps': 32809, 'loss/train': 2.0309438705444336} +03/05/2022 04:01:27 - INFO - codeparrot_training - Skipping example with length 452 (seq_length=1024) +03/05/2022 04:01:31 - INFO - codeparrot_training - Step 32810: {'lr': 0.0004484136900380713, 'samples': 16799232, 'steps': 32810, 'loss/train': 1.4617422819137573} +03/05/2022 04:01:35 - INFO - codeparrot_training - Step 32811: {'lr': 0.00044841046153775224, 'samples': 16799744, 'steps': 32811, 'loss/train': 0.5655346512794495} +03/05/2022 04:01:35 - INFO - codeparrot_training - Skipping example with length 107 (seq_length=1024) +03/05/2022 04:01:40 - INFO - codeparrot_training - Step 32812: {'lr': 0.0004484072329480325, 'samples': 16800256, 'steps': 32812, 'loss/train': 1.6036378145217896} +03/05/2022 04:01:43 - INFO - codeparrot_training - Step 32813: {'lr': 0.00044840400426891347, 'samples': 16800768, 'steps': 32813, 'loss/train': 1.8214073181152344} +03/05/2022 04:01:44 - INFO - codeparrot_training - Skipping example with length 455 (seq_length=1024) +03/05/2022 04:01:48 - INFO - codeparrot_training - Step 32814: {'lr': 0.00044840077550039676, 'samples': 16801280, 'steps': 32814, 'loss/train': 1.649049997329712} +03/05/2022 04:01:51 - INFO - codeparrot_training - Step 32815: {'lr': 0.0004483975466424837, 'samples': 16801792, 'steps': 32815, 'loss/train': 0.9569042921066284} +03/05/2022 04:01:52 - INFO - codeparrot_training - Skipping example with length 160 (seq_length=1024) +03/05/2022 04:01:57 - INFO - codeparrot_training - Step 32816: {'lr': 0.0004483943176951757, 'samples': 16802304, 'steps': 32816, 'loss/train': 1.8066608905792236} +03/05/2022 04:02:00 - INFO - codeparrot_training - Step 32817: {'lr': 0.0004483910886584743, 'samples': 16802816, 'steps': 32817, 'loss/train': 1.1769850254058838} +03/05/2022 04:02:00 - INFO - codeparrot_training - Skipping example with length 95 (seq_length=1024) +03/05/2022 04:02:05 - INFO - codeparrot_training - Step 32818: {'lr': 0.00044838785953238094, 'samples': 16803328, 'steps': 32818, 'loss/train': 1.6284947395324707} +03/05/2022 04:02:08 - INFO - codeparrot_training - Step 32819: {'lr': 0.0004483846303168971, 'samples': 16803840, 'steps': 32819, 'loss/train': 1.8191710710525513} +03/05/2022 04:02:09 - INFO - codeparrot_training - Skipping example with length 778 (seq_length=1024) +03/05/2022 04:02:14 - INFO - codeparrot_training - Step 32820: {'lr': 0.0004483814010120242, 'samples': 16804352, 'steps': 32820, 'loss/train': 1.59821617603302} +03/05/2022 04:02:17 - INFO - codeparrot_training - Step 32821: {'lr': 0.00044837817161776366, 'samples': 16804864, 'steps': 32821, 'loss/train': 2.291229248046875} +03/05/2022 04:02:18 - INFO - codeparrot_training - Skipping example with length 850 (seq_length=1024) +03/05/2022 04:02:22 - INFO - codeparrot_training - Step 32822: {'lr': 0.000448374942134117, 'samples': 16805376, 'steps': 32822, 'loss/train': 1.7003612518310547} +03/05/2022 04:02:25 - INFO - codeparrot_training - Step 32823: {'lr': 0.0004483717125610857, 'samples': 16805888, 'steps': 32823, 'loss/train': 1.4782660007476807} +03/05/2022 04:02:26 - INFO - codeparrot_training - Skipping example with length 159 (seq_length=1024) +03/05/2022 04:02:31 - INFO - codeparrot_training - Step 32824: {'lr': 0.0004483684828986712, 'samples': 16806400, 'steps': 32824, 'loss/train': 2.4041008949279785} +03/05/2022 04:02:34 - INFO - codeparrot_training - Step 32825: {'lr': 0.00044836525314687477, 'samples': 16806912, 'steps': 32825, 'loss/train': 1.981614589691162} +03/05/2022 04:02:35 - INFO - codeparrot_training - Skipping example with length 673 (seq_length=1024) +03/05/2022 04:02:39 - INFO - codeparrot_training - Step 32826: {'lr': 0.0004483620233056981, 'samples': 16807424, 'steps': 32826, 'loss/train': 1.7828078269958496} +03/05/2022 04:02:42 - INFO - codeparrot_training - Step 32827: {'lr': 0.00044835879337514254, 'samples': 16807936, 'steps': 32827, 'loss/train': 0.46749308705329895} +03/05/2022 04:02:43 - INFO - codeparrot_training - Skipping example with length 232 (seq_length=1024) +03/05/2022 04:02:47 - INFO - codeparrot_training - Step 32828: {'lr': 0.0004483555633552096, 'samples': 16808448, 'steps': 32828, 'loss/train': 1.4670099020004272} +03/05/2022 04:02:51 - INFO - codeparrot_training - Step 32829: {'lr': 0.00044835233324590077, 'samples': 16808960, 'steps': 32829, 'loss/train': 1.3449726104736328} +03/05/2022 04:02:51 - INFO - codeparrot_training - Skipping example with length 349 (seq_length=1024) +03/05/2022 04:02:56 - INFO - codeparrot_training - Step 32830: {'lr': 0.0004483491030472173, 'samples': 16809472, 'steps': 32830, 'loss/train': 0.9999790191650391} +03/05/2022 04:02:59 - INFO - codeparrot_training - Step 32831: {'lr': 0.00044834587275916084, 'samples': 16809984, 'steps': 32831, 'loss/train': 2.293489933013916} +03/05/2022 04:03:00 - INFO - codeparrot_training - Skipping example with length 333 (seq_length=1024) +03/05/2022 04:03:04 - INFO - codeparrot_training - Step 32832: {'lr': 0.00044834264238173283, 'samples': 16810496, 'steps': 32832, 'loss/train': 1.4310274124145508} +03/05/2022 04:03:07 - INFO - codeparrot_training - Step 32833: {'lr': 0.00044833941191493463, 'samples': 16811008, 'steps': 32833, 'loss/train': 1.4755841493606567} +03/05/2022 04:03:08 - INFO - codeparrot_training - Skipping example with length 983 (seq_length=1024) +03/05/2022 04:03:13 - INFO - codeparrot_training - Step 32834: {'lr': 0.0004483361813587678, 'samples': 16811520, 'steps': 32834, 'loss/train': 1.912050724029541} +03/05/2022 04:03:16 - INFO - codeparrot_training - Step 32835: {'lr': 0.0004483329507132337, 'samples': 16812032, 'steps': 32835, 'loss/train': 0.9388858675956726} +03/05/2022 04:03:17 - INFO - codeparrot_training - Skipping example with length 397 (seq_length=1024) +03/05/2022 04:03:21 - INFO - codeparrot_training - Step 32836: {'lr': 0.0004483297199783338, 'samples': 16812544, 'steps': 32836, 'loss/train': 3.141925096511841} +03/05/2022 04:03:24 - INFO - codeparrot_training - Step 32837: {'lr': 0.0004483264891540697, 'samples': 16813056, 'steps': 32837, 'loss/train': 1.3589732646942139} +03/05/2022 04:03:25 - INFO - codeparrot_training - Skipping example with length 679 (seq_length=1024) +03/05/2022 04:03:29 - INFO - codeparrot_training - Step 32838: {'lr': 0.00044832325824044274, 'samples': 16813568, 'steps': 32838, 'loss/train': 1.9961891174316406} +03/05/2022 04:03:33 - INFO - codeparrot_training - Step 32839: {'lr': 0.0004483200272374543, 'samples': 16814080, 'steps': 32839, 'loss/train': 2.361741304397583} +03/05/2022 04:03:33 - INFO - codeparrot_training - Skipping example with length 112 (seq_length=1024) +03/05/2022 04:03:38 - INFO - codeparrot_training - Step 32840: {'lr': 0.0004483167961451059, 'samples': 16814592, 'steps': 32840, 'loss/train': 1.9078457355499268} +03/05/2022 04:03:41 - INFO - codeparrot_training - Step 32841: {'lr': 0.00044831356496339913, 'samples': 16815104, 'steps': 32841, 'loss/train': 0.7789722681045532} +03/05/2022 04:03:42 - INFO - codeparrot_training - Skipping example with length 179 (seq_length=1024) +03/05/2022 04:03:46 - INFO - codeparrot_training - Step 32842: {'lr': 0.0004483103336923352, 'samples': 16815616, 'steps': 32842, 'loss/train': 2.1905312538146973} +03/05/2022 04:03:49 - INFO - codeparrot_training - Step 32843: {'lr': 0.00044830710233191573, 'samples': 16816128, 'steps': 32843, 'loss/train': 1.7192633152008057} +03/05/2022 04:03:50 - INFO - codeparrot_training - Skipping example with length 509 (seq_length=1024) +03/05/2022 04:03:55 - INFO - codeparrot_training - Step 32844: {'lr': 0.0004483038708821422, 'samples': 16816640, 'steps': 32844, 'loss/train': 1.3239785432815552} +03/05/2022 04:03:58 - INFO - codeparrot_training - Step 32845: {'lr': 0.00044830063934301603, 'samples': 16817152, 'steps': 32845, 'loss/train': 2.708096981048584} +03/05/2022 04:03:58 - INFO - codeparrot_training - Skipping example with length 212 (seq_length=1024) +03/05/2022 04:04:03 - INFO - codeparrot_training - Step 32846: {'lr': 0.0004482974077145385, 'samples': 16817664, 'steps': 32846, 'loss/train': 1.8473336696624756} +03/05/2022 04:04:06 - INFO - codeparrot_training - Step 32847: {'lr': 0.0004482941759967113, 'samples': 16818176, 'steps': 32847, 'loss/train': 1.0972201824188232} +03/05/2022 04:04:07 - INFO - codeparrot_training - Skipping example with length 283 (seq_length=1024) +03/05/2022 04:04:12 - INFO - codeparrot_training - Step 32848: {'lr': 0.00044829094418953586, 'samples': 16818688, 'steps': 32848, 'loss/train': 1.987696886062622} +03/05/2022 04:04:15 - INFO - codeparrot_training - Step 32849: {'lr': 0.00044828771229301354, 'samples': 16819200, 'steps': 32849, 'loss/train': 1.7891756296157837} +03/05/2022 04:04:15 - INFO - codeparrot_training - Skipping example with length 853 (seq_length=1024) +03/05/2022 04:04:20 - INFO - codeparrot_training - Step 32850: {'lr': 0.0004482844803071458, 'samples': 16819712, 'steps': 32850, 'loss/train': 1.7835396528244019} +03/05/2022 04:04:23 - INFO - codeparrot_training - Step 32851: {'lr': 0.00044828124823193417, 'samples': 16820224, 'steps': 32851, 'loss/train': 1.7560997009277344} +03/05/2022 04:04:24 - INFO - codeparrot_training - Skipping example with length 496 (seq_length=1024) +03/05/2022 04:04:29 - INFO - codeparrot_training - Step 32852: {'lr': 0.00044827801606738004, 'samples': 16820736, 'steps': 32852, 'loss/train': 5.391373634338379} +03/05/2022 04:04:32 - INFO - codeparrot_training - Step 32853: {'lr': 0.00044827478381348495, 'samples': 16821248, 'steps': 32853, 'loss/train': 2.0404882431030273} +03/05/2022 04:04:32 - INFO - codeparrot_training - Skipping example with length 591 (seq_length=1024) +03/05/2022 04:04:37 - INFO - codeparrot_training - Step 32854: {'lr': 0.00044827155147025025, 'samples': 16821760, 'steps': 32854, 'loss/train': 1.9201496839523315} +03/05/2022 04:04:40 - INFO - codeparrot_training - Step 32855: {'lr': 0.00044826831903767745, 'samples': 16822272, 'steps': 32855, 'loss/train': 1.5028250217437744} +03/05/2022 04:04:41 - INFO - codeparrot_training - Skipping example with length 56 (seq_length=1024) +03/05/2022 04:04:45 - INFO - codeparrot_training - Step 32856: {'lr': 0.000448265086515768, 'samples': 16822784, 'steps': 32856, 'loss/train': 1.9948362112045288} +03/05/2022 04:04:49 - INFO - codeparrot_training - Step 32857: {'lr': 0.0004482618539045234, 'samples': 16823296, 'steps': 32857, 'loss/train': 1.8896045684814453} +03/05/2022 04:04:49 - INFO - codeparrot_training - Skipping example with length 924 (seq_length=1024) +03/05/2022 04:04:54 - INFO - codeparrot_training - Step 32858: {'lr': 0.00044825862120394504, 'samples': 16823808, 'steps': 32858, 'loss/train': 1.2678031921386719} +03/05/2022 04:04:57 - INFO - codeparrot_training - Step 32859: {'lr': 0.00044825538841403444, 'samples': 16824320, 'steps': 32859, 'loss/train': 1.913914442062378} +03/05/2022 04:04:58 - INFO - codeparrot_training - Skipping example with length 722 (seq_length=1024) +03/05/2022 04:05:02 - INFO - codeparrot_training - Step 32860: {'lr': 0.000448252155534793, 'samples': 16824832, 'steps': 32860, 'loss/train': 1.2840266227722168} +03/05/2022 04:05:05 - INFO - codeparrot_training - Step 32861: {'lr': 0.0004482489225662222, 'samples': 16825344, 'steps': 32861, 'loss/train': 1.8806462287902832} +03/05/2022 04:05:06 - INFO - codeparrot_training - Skipping example with length 175 (seq_length=1024) +03/05/2022 04:05:11 - INFO - codeparrot_training - Step 32862: {'lr': 0.00044824568950832343, 'samples': 16825856, 'steps': 32862, 'loss/train': 0.8809359669685364} +03/05/2022 04:05:14 - INFO - codeparrot_training - Step 32863: {'lr': 0.0004482424563610983, 'samples': 16826368, 'steps': 32863, 'loss/train': 1.1482504606246948} +03/05/2022 04:05:14 - INFO - codeparrot_training - Skipping example with length 649 (seq_length=1024) +03/05/2022 04:05:19 - INFO - codeparrot_training - Step 32864: {'lr': 0.00044823922312454815, 'samples': 16826880, 'steps': 32864, 'loss/train': 1.9535433053970337} +03/05/2022 04:05:22 - INFO - codeparrot_training - Step 32865: {'lr': 0.00044823598979867445, 'samples': 16827392, 'steps': 32865, 'loss/train': 2.1363930702209473} +03/05/2022 04:05:22 - INFO - codeparrot_training - Skipping example with length 297 (seq_length=1024) +03/05/2022 04:05:27 - INFO - codeparrot_training - Step 32866: {'lr': 0.0004482327563834787, 'samples': 16827904, 'steps': 32866, 'loss/train': 0.9224907755851746} +03/05/2022 04:05:30 - INFO - codeparrot_training - Skipping example with length 698 (seq_length=1024) +03/05/2022 04:05:33 - INFO - codeparrot_training - Step 32867: {'lr': 0.00044822952287896237, 'samples': 16828416, 'steps': 32867, 'loss/train': 2.0211193561553955} +03/05/2022 04:05:36 - INFO - codeparrot_training - Step 32868: {'lr': 0.00044822628928512675, 'samples': 16828928, 'steps': 32868, 'loss/train': 0.8293685913085938} +03/05/2022 04:05:39 - INFO - codeparrot_training - Step 32869: {'lr': 0.0004482230556019735, 'samples': 16829440, 'steps': 32869, 'loss/train': 0.07612051069736481} +03/05/2022 04:05:39 - INFO - codeparrot_training - Skipping example with length 642 (seq_length=1024) +03/05/2022 04:05:45 - INFO - codeparrot_training - Step 32870: {'lr': 0.00044821982182950405, 'samples': 16829952, 'steps': 32870, 'loss/train': 1.3174169063568115} +03/05/2022 04:05:48 - INFO - codeparrot_training - Step 32871: {'lr': 0.0004482165879677197, 'samples': 16830464, 'steps': 32871, 'loss/train': 1.7359033823013306} +03/05/2022 04:05:48 - INFO - codeparrot_training - Skipping example with length 143 (seq_length=1024) +03/05/2022 04:05:53 - INFO - codeparrot_training - Step 32872: {'lr': 0.0004482133540166221, 'samples': 16830976, 'steps': 32872, 'loss/train': 1.622950792312622} +03/05/2022 04:05:56 - INFO - codeparrot_training - Skipping example with length 643 (seq_length=1024) +03/05/2022 04:05:58 - INFO - codeparrot_training - Step 32873: {'lr': 0.00044821011997621255, 'samples': 16831488, 'steps': 32873, 'loss/train': 1.4304238557815552} +03/05/2022 04:06:01 - INFO - codeparrot_training - Step 32874: {'lr': 0.0004482068858464926, 'samples': 16832000, 'steps': 32874, 'loss/train': 1.420791745185852} +03/05/2022 04:06:04 - INFO - codeparrot_training - Skipping example with length 380 (seq_length=1024) +03/05/2022 04:06:07 - INFO - codeparrot_training - Step 32875: {'lr': 0.00044820365162746373, 'samples': 16832512, 'steps': 32875, 'loss/train': 2.7937448024749756} +03/05/2022 04:06:10 - INFO - codeparrot_training - Step 32876: {'lr': 0.00044820041731912733, 'samples': 16833024, 'steps': 32876, 'loss/train': 0.967921257019043} +03/05/2022 04:06:12 - INFO - codeparrot_training - Skipping example with length 411 (seq_length=1024) +03/05/2022 04:06:15 - INFO - codeparrot_training - Step 32877: {'lr': 0.0004481971829214848, 'samples': 16833536, 'steps': 32877, 'loss/train': 1.5176584720611572} +03/05/2022 04:06:18 - INFO - codeparrot_training - Step 32878: {'lr': 0.0004481939484345378, 'samples': 16834048, 'steps': 32878, 'loss/train': 2.285003662109375} +03/05/2022 04:06:21 - INFO - codeparrot_training - Skipping example with length 34 (seq_length=1024) +03/05/2022 04:06:24 - INFO - codeparrot_training - Step 32879: {'lr': 0.0004481907138582876, 'samples': 16834560, 'steps': 32879, 'loss/train': 1.7813334465026855} +03/05/2022 04:06:27 - INFO - codeparrot_training - Step 32880: {'lr': 0.00044818747919273574, 'samples': 16835072, 'steps': 32880, 'loss/train': 1.9654215574264526} +03/05/2022 04:06:29 - INFO - codeparrot_training - Skipping example with length 483 (seq_length=1024) +03/05/2022 04:06:32 - INFO - codeparrot_training - Step 32881: {'lr': 0.0004481842444378837, 'samples': 16835584, 'steps': 32881, 'loss/train': 1.2609437704086304} +03/05/2022 04:06:35 - INFO - codeparrot_training - Step 32882: {'lr': 0.0004481810095937329, 'samples': 16836096, 'steps': 32882, 'loss/train': 0.6035986542701721} +03/05/2022 04:06:37 - INFO - codeparrot_training - Skipping example with length 373 (seq_length=1024) +03/05/2022 04:06:41 - INFO - codeparrot_training - Step 32883: {'lr': 0.00044817777466028467, 'samples': 16836608, 'steps': 32883, 'loss/train': 1.7963297367095947} +03/05/2022 04:06:44 - INFO - codeparrot_training - Step 32884: {'lr': 0.0004481745396375407, 'samples': 16837120, 'steps': 32884, 'loss/train': 1.2177305221557617} +03/05/2022 04:06:47 - INFO - codeparrot_training - Step 32885: {'lr': 0.0004481713045255023, 'samples': 16837632, 'steps': 32885, 'loss/train': 1.4318976402282715} +03/05/2022 04:06:50 - INFO - codeparrot_training - Skipping example with length 140 (seq_length=1024) +03/05/2022 04:06:52 - INFO - codeparrot_training - Step 32886: {'lr': 0.000448168069324171, 'samples': 16838144, 'steps': 32886, 'loss/train': 1.370668888092041} +03/05/2022 04:06:56 - INFO - codeparrot_training - Step 32887: {'lr': 0.0004481648340335482, 'samples': 16838656, 'steps': 32887, 'loss/train': 1.574015498161316} +03/05/2022 04:06:59 - INFO - codeparrot_training - Step 32888: {'lr': 0.0004481615986536354, 'samples': 16839168, 'steps': 32888, 'loss/train': 2.401139497756958} +03/05/2022 04:06:59 - INFO - codeparrot_training - Skipping example with length 849 (seq_length=1024) +03/05/2022 04:07:04 - INFO - codeparrot_training - Step 32889: {'lr': 0.000448158363184434, 'samples': 16839680, 'steps': 32889, 'loss/train': 2.0068302154541016} +03/05/2022 04:07:07 - INFO - codeparrot_training - Skipping example with length 874 (seq_length=1024) +03/05/2022 04:07:09 - INFO - codeparrot_training - Step 32890: {'lr': 0.00044815512762594556, 'samples': 16840192, 'steps': 32890, 'loss/train': 1.8892120122909546} +03/05/2022 04:07:13 - INFO - codeparrot_training - Step 32891: {'lr': 0.00044815189197817143, 'samples': 16840704, 'steps': 32891, 'loss/train': 1.3384286165237427} +03/05/2022 04:07:15 - INFO - codeparrot_training - Skipping example with length 890 (seq_length=1024) +03/05/2022 04:07:18 - INFO - codeparrot_training - Step 32892: {'lr': 0.0004481486562411131, 'samples': 16841216, 'steps': 32892, 'loss/train': 1.219661831855774} +03/05/2022 04:07:21 - INFO - codeparrot_training - Step 32893: {'lr': 0.0004481454204147721, 'samples': 16841728, 'steps': 32893, 'loss/train': 2.2584476470947266} +03/05/2022 04:07:24 - INFO - codeparrot_training - Step 32894: {'lr': 0.0004481421844991498, 'samples': 16842240, 'steps': 32894, 'loss/train': 2.880666494369507} +03/05/2022 04:07:24 - INFO - codeparrot_training - Skipping example with length 52 (seq_length=1024) +03/05/2022 04:07:29 - INFO - codeparrot_training - Step 32895: {'lr': 0.00044813894849424777, 'samples': 16842752, 'steps': 32895, 'loss/train': 1.37331223487854} +03/05/2022 04:07:32 - INFO - codeparrot_training - Skipping example with length 450 (seq_length=1024) +03/05/2022 04:07:35 - INFO - codeparrot_training - Step 32896: {'lr': 0.0004481357124000672, 'samples': 16843264, 'steps': 32896, 'loss/train': 2.0404725074768066} +03/05/2022 04:07:38 - INFO - codeparrot_training - Step 32897: {'lr': 0.0004481324762166099, 'samples': 16843776, 'steps': 32897, 'loss/train': 2.410694122314453} +03/05/2022 04:07:41 - INFO - codeparrot_training - Skipping example with length 640 (seq_length=1024) +03/05/2022 04:07:43 - INFO - codeparrot_training - Step 32898: {'lr': 0.0004481292399438771, 'samples': 16844288, 'steps': 32898, 'loss/train': 1.8052374124526978} +03/05/2022 04:07:46 - INFO - codeparrot_training - Step 32899: {'lr': 0.0004481260035818704, 'samples': 16844800, 'steps': 32899, 'loss/train': 1.1577407121658325} +03/05/2022 04:07:49 - INFO - codeparrot_training - Skipping example with length 686 (seq_length=1024) +03/05/2022 04:07:52 - INFO - codeparrot_training - Step 32900: {'lr': 0.00044812276713059106, 'samples': 16845312, 'steps': 32900, 'loss/train': 1.1407105922698975} +03/05/2022 04:07:55 - INFO - codeparrot_training - Step 32901: {'lr': 0.00044811953059004073, 'samples': 16845824, 'steps': 32901, 'loss/train': 3.0366439819335938} +03/05/2022 04:07:58 - INFO - codeparrot_training - Step 32902: {'lr': 0.0004481162939602208, 'samples': 16846336, 'steps': 32902, 'loss/train': 1.4314132928848267} +03/05/2022 04:07:58 - INFO - codeparrot_training - Skipping example with length 490 (seq_length=1024) +03/05/2022 04:08:03 - INFO - codeparrot_training - Step 32903: {'lr': 0.0004481130572411327, 'samples': 16846848, 'steps': 32903, 'loss/train': 1.3393806219100952} +03/05/2022 04:08:07 - INFO - codeparrot_training - Step 32904: {'lr': 0.00044810982043277795, 'samples': 16847360, 'steps': 32904, 'loss/train': 2.32403826713562} +03/05/2022 04:08:07 - INFO - codeparrot_training - Skipping example with length 271 (seq_length=1024) +03/05/2022 04:08:12 - INFO - codeparrot_training - Step 32905: {'lr': 0.0004481065835351579, 'samples': 16847872, 'steps': 32905, 'loss/train': 1.1604489088058472} +03/05/2022 04:08:15 - INFO - codeparrot_training - Skipping example with length 684 (seq_length=1024) +03/05/2022 04:08:18 - INFO - codeparrot_training - Step 32906: {'lr': 0.0004481033465482741, 'samples': 16848384, 'steps': 32906, 'loss/train': 1.3880707025527954} +03/05/2022 04:08:21 - INFO - codeparrot_training - Step 32907: {'lr': 0.00044810010947212803, 'samples': 16848896, 'steps': 32907, 'loss/train': 1.631986379623413} +03/05/2022 04:08:24 - INFO - codeparrot_training - Step 32908: {'lr': 0.00044809687230672115, 'samples': 16849408, 'steps': 32908, 'loss/train': 1.8036261796951294} +03/05/2022 04:08:24 - INFO - codeparrot_training - Skipping example with length 765 (seq_length=1024) +03/05/2022 04:08:29 - INFO - codeparrot_training - Step 32909: {'lr': 0.0004480936350520548, 'samples': 16849920, 'steps': 32909, 'loss/train': 2.1829309463500977} +03/05/2022 04:08:32 - INFO - codeparrot_training - Step 32910: {'lr': 0.0004480903977081305, 'samples': 16850432, 'steps': 32910, 'loss/train': 1.823407530784607} +03/05/2022 04:08:33 - INFO - codeparrot_training - Skipping example with length 432 (seq_length=1024) +03/05/2022 04:08:38 - INFO - codeparrot_training - Step 32911: {'lr': 0.00044808716027494973, 'samples': 16850944, 'steps': 32911, 'loss/train': 0.08967943489551544} +03/05/2022 04:08:41 - INFO - codeparrot_training - Step 32912: {'lr': 0.000448083922752514, 'samples': 16851456, 'steps': 32912, 'loss/train': 2.0421366691589355} +03/05/2022 04:08:41 - INFO - codeparrot_training - Skipping example with length 808 (seq_length=1024) +03/05/2022 04:08:46 - INFO - codeparrot_training - Step 32913: {'lr': 0.00044808068514082467, 'samples': 16851968, 'steps': 32913, 'loss/train': 1.7712178230285645} +03/05/2022 04:08:50 - INFO - codeparrot_training - Step 32914: {'lr': 0.0004480774474398832, 'samples': 16852480, 'steps': 32914, 'loss/train': 1.859857439994812} +03/05/2022 04:08:50 - INFO - codeparrot_training - Skipping example with length 475 (seq_length=1024) +03/05/2022 04:08:55 - INFO - codeparrot_training - Step 32915: {'lr': 0.00044807420964969113, 'samples': 16852992, 'steps': 32915, 'loss/train': 0.33804088830947876} +03/05/2022 04:08:58 - INFO - codeparrot_training - Step 32916: {'lr': 0.0004480709717702499, 'samples': 16853504, 'steps': 32916, 'loss/train': 2.5722317695617676} +03/05/2022 04:08:59 - INFO - codeparrot_training - Skipping example with length 169 (seq_length=1024) +03/05/2022 04:09:03 - INFO - codeparrot_training - Step 32917: {'lr': 0.000448067733801561, 'samples': 16854016, 'steps': 32917, 'loss/train': 1.5674976110458374} +03/05/2022 04:09:07 - INFO - codeparrot_training - Step 32918: {'lr': 0.00044806449574362575, 'samples': 16854528, 'steps': 32918, 'loss/train': 1.0514800548553467} +03/05/2022 04:09:08 - INFO - codeparrot_training - Skipping example with length 434 (seq_length=1024) +03/05/2022 04:09:12 - INFO - codeparrot_training - Step 32919: {'lr': 0.00044806125759644567, 'samples': 16855040, 'steps': 32919, 'loss/train': 1.8234845399856567} +03/05/2022 04:09:15 - INFO - codeparrot_training - Step 32920: {'lr': 0.00044805801936002225, 'samples': 16855552, 'steps': 32920, 'loss/train': 2.082367181777954} +03/05/2022 04:09:16 - INFO - codeparrot_training - Skipping example with length 135 (seq_length=1024) +03/05/2022 04:09:20 - INFO - codeparrot_training - Step 32921: {'lr': 0.00044805478103435707, 'samples': 16856064, 'steps': 32921, 'loss/train': 2.083266496658325} +03/05/2022 04:09:23 - INFO - codeparrot_training - Step 32922: {'lr': 0.0004480515426194513, 'samples': 16856576, 'steps': 32922, 'loss/train': 1.7718514204025269} +03/05/2022 04:09:24 - INFO - codeparrot_training - Skipping example with length 559 (seq_length=1024) +03/05/2022 04:09:29 - INFO - codeparrot_training - Step 32923: {'lr': 0.0004480483041153066, 'samples': 16857088, 'steps': 32923, 'loss/train': 1.1922067403793335} +03/05/2022 04:09:32 - INFO - codeparrot_training - Step 32924: {'lr': 0.00044804506552192447, 'samples': 16857600, 'steps': 32924, 'loss/train': 2.181920289993286} +03/05/2022 04:09:32 - INFO - codeparrot_training - Skipping example with length 392 (seq_length=1024) +03/05/2022 04:09:37 - INFO - codeparrot_training - Step 32925: {'lr': 0.0004480418268393062, 'samples': 16858112, 'steps': 32925, 'loss/train': 1.1025288105010986} +03/05/2022 04:09:40 - INFO - codeparrot_training - Step 32926: {'lr': 0.0004480385880674534, 'samples': 16858624, 'steps': 32926, 'loss/train': 0.1388394832611084} +03/05/2022 04:09:41 - INFO - codeparrot_training - Skipping example with length 973 (seq_length=1024) +03/05/2022 04:09:46 - INFO - codeparrot_training - Step 32927: {'lr': 0.00044803534920636744, 'samples': 16859136, 'steps': 32927, 'loss/train': 1.7906074523925781} +03/05/2022 04:09:49 - INFO - codeparrot_training - Step 32928: {'lr': 0.00044803211025604985, 'samples': 16859648, 'steps': 32928, 'loss/train': 5.568546295166016} +03/05/2022 04:09:49 - INFO - codeparrot_training - Skipping example with length 360 (seq_length=1024) +03/05/2022 04:09:54 - INFO - codeparrot_training - Step 32929: {'lr': 0.000448028871216502, 'samples': 16860160, 'steps': 32929, 'loss/train': 0.21931499242782593} +03/05/2022 04:09:57 - INFO - codeparrot_training - Step 32930: {'lr': 0.0004480256320877254, 'samples': 16860672, 'steps': 32930, 'loss/train': 1.9319590330123901} +03/05/2022 04:09:58 - INFO - codeparrot_training - Skipping example with length 1006 (seq_length=1024) +03/05/2022 04:10:02 - INFO - codeparrot_training - Step 32931: {'lr': 0.00044802239286972147, 'samples': 16861184, 'steps': 32931, 'loss/train': 0.9951972961425781} +03/05/2022 04:10:06 - INFO - codeparrot_training - Step 32932: {'lr': 0.0004480191535624918, 'samples': 16861696, 'steps': 32932, 'loss/train': 1.1043416261672974} +03/05/2022 04:10:06 - INFO - codeparrot_training - Skipping example with length 159 (seq_length=1024) +03/05/2022 04:10:11 - INFO - codeparrot_training - Step 32933: {'lr': 0.0004480159141660377, 'samples': 16862208, 'steps': 32933, 'loss/train': 1.8001677989959717} +03/05/2022 04:10:14 - INFO - codeparrot_training - Step 32934: {'lr': 0.00044801267468036064, 'samples': 16862720, 'steps': 32934, 'loss/train': 2.076057195663452} +03/05/2022 04:10:14 - INFO - codeparrot_training - Skipping example with length 389 (seq_length=1024) +03/05/2022 04:10:19 - INFO - codeparrot_training - Step 32935: {'lr': 0.0004480094351054622, 'samples': 16863232, 'steps': 32935, 'loss/train': 1.3910447359085083} +03/05/2022 04:10:22 - INFO - codeparrot_training - Step 32936: {'lr': 0.00044800619544134375, 'samples': 16863744, 'steps': 32936, 'loss/train': 2.0677878856658936} +03/05/2022 04:10:22 - INFO - codeparrot_training - Skipping example with length 581 (seq_length=1024) +03/05/2022 04:10:28 - INFO - codeparrot_training - Step 32937: {'lr': 0.00044800295568800673, 'samples': 16864256, 'steps': 32937, 'loss/train': 1.7169177532196045} +03/05/2022 04:10:31 - INFO - codeparrot_training - Step 32938: {'lr': 0.0004479997158454526, 'samples': 16864768, 'steps': 32938, 'loss/train': 1.739062786102295} +03/05/2022 04:10:31 - INFO - codeparrot_training - Skipping example with length 764 (seq_length=1024) +03/05/2022 04:10:36 - INFO - codeparrot_training - Step 32939: {'lr': 0.00044799647591368296, 'samples': 16865280, 'steps': 32939, 'loss/train': 1.8108279705047607} +03/05/2022 04:10:39 - INFO - codeparrot_training - Step 32940: {'lr': 0.00044799323589269914, 'samples': 16865792, 'steps': 32940, 'loss/train': 1.9718165397644043} +03/05/2022 04:10:39 - INFO - codeparrot_training - Skipping example with length 189 (seq_length=1024) +03/05/2022 04:10:45 - INFO - codeparrot_training - Step 32941: {'lr': 0.00044798999578250255, 'samples': 16866304, 'steps': 32941, 'loss/train': 1.542114019393921} +03/05/2022 04:10:48 - INFO - codeparrot_training - Step 32942: {'lr': 0.0004479867555830948, 'samples': 16866816, 'steps': 32942, 'loss/train': 1.9566525220870972} +03/05/2022 04:10:48 - INFO - codeparrot_training - Skipping example with length 680 (seq_length=1024) +03/05/2022 04:10:53 - INFO - codeparrot_training - Step 32943: {'lr': 0.0004479835152944772, 'samples': 16867328, 'steps': 32943, 'loss/train': 2.2091989517211914} +03/05/2022 04:10:56 - INFO - codeparrot_training - Step 32944: {'lr': 0.00044798027491665135, 'samples': 16867840, 'steps': 32944, 'loss/train': 2.3931496143341064} +03/05/2022 04:11:02 - INFO - codeparrot_training - Step 32945: {'lr': 0.00044797703444961857, 'samples': 16868352, 'steps': 32945, 'loss/train': 2.2849676609039307} +03/05/2022 04:11:05 - INFO - codeparrot_training - Step 32946: {'lr': 0.00044797379389338045, 'samples': 16868864, 'steps': 32946, 'loss/train': 1.1501230001449585} +03/05/2022 04:11:05 - INFO - codeparrot_training - Skipping example with length 478 (seq_length=1024) +03/05/2022 04:11:10 - INFO - codeparrot_training - Step 32947: {'lr': 0.0004479705532479384, 'samples': 16869376, 'steps': 32947, 'loss/train': 1.5604846477508545} +03/05/2022 04:11:13 - INFO - codeparrot_training - Step 32948: {'lr': 0.0004479673125132938, 'samples': 16869888, 'steps': 32948, 'loss/train': 1.7970181703567505} +03/05/2022 04:11:14 - INFO - codeparrot_training - Skipping example with length 216 (seq_length=1024) +03/05/2022 04:11:19 - INFO - codeparrot_training - Step 32949: {'lr': 0.0004479640716894483, 'samples': 16870400, 'steps': 32949, 'loss/train': 0.5720889568328857} +03/05/2022 04:11:22 - INFO - codeparrot_training - Step 32950: {'lr': 0.00044796083077640314, 'samples': 16870912, 'steps': 32950, 'loss/train': 1.4395393133163452} +03/05/2022 04:11:22 - INFO - codeparrot_training - Skipping example with length 448 (seq_length=1024) +03/05/2022 04:11:27 - INFO - codeparrot_training - Step 32951: {'lr': 0.00044795758977416, 'samples': 16871424, 'steps': 32951, 'loss/train': 1.7781352996826172} +03/05/2022 04:11:30 - INFO - codeparrot_training - Skipping example with length 985 (seq_length=1024) +03/05/2022 04:11:32 - INFO - codeparrot_training - Step 32952: {'lr': 0.0004479543486827201, 'samples': 16871936, 'steps': 32952, 'loss/train': 1.1561284065246582} +03/05/2022 04:11:35 - INFO - codeparrot_training - Step 32953: {'lr': 0.0004479511075020851, 'samples': 16872448, 'steps': 32953, 'loss/train': 1.6943188905715942} +03/05/2022 04:11:38 - INFO - codeparrot_training - Skipping example with length 541 (seq_length=1024) +03/05/2022 04:11:41 - INFO - codeparrot_training - Step 32954: {'lr': 0.00044794786623225636, 'samples': 16872960, 'steps': 32954, 'loss/train': 0.9862486720085144} +03/05/2022 04:11:44 - INFO - codeparrot_training - Step 32955: {'lr': 0.0004479446248732354, 'samples': 16873472, 'steps': 32955, 'loss/train': 1.4168609380722046} +03/05/2022 04:11:46 - INFO - codeparrot_training - Skipping example with length 899 (seq_length=1024) +03/05/2022 04:11:49 - INFO - codeparrot_training - Step 32956: {'lr': 0.00044794138342502354, 'samples': 16873984, 'steps': 32956, 'loss/train': 0.8822023272514343} +03/05/2022 04:11:52 - INFO - codeparrot_training - Step 32957: {'lr': 0.0004479381418876225, 'samples': 16874496, 'steps': 32957, 'loss/train': 1.8924466371536255} +03/05/2022 04:11:55 - INFO - codeparrot_training - Skipping example with length 712 (seq_length=1024) +03/05/2022 04:11:57 - INFO - codeparrot_training - Step 32958: {'lr': 0.00044793490026103346, 'samples': 16875008, 'steps': 32958, 'loss/train': 1.4720741510391235} +03/05/2022 04:12:01 - INFO - codeparrot_training - Step 32959: {'lr': 0.0004479316585452581, 'samples': 16875520, 'steps': 32959, 'loss/train': 1.7246819734573364} +03/05/2022 04:12:03 - INFO - codeparrot_training - Skipping example with length 939 (seq_length=1024) +03/05/2022 04:12:06 - INFO - codeparrot_training - Step 32960: {'lr': 0.0004479284167402977, 'samples': 16876032, 'steps': 32960, 'loss/train': 1.6629647016525269} +03/05/2022 04:12:09 - INFO - codeparrot_training - Step 32961: {'lr': 0.00044792517484615384, 'samples': 16876544, 'steps': 32961, 'loss/train': 1.6395092010498047} +03/05/2022 04:12:11 - INFO - codeparrot_training - Skipping example with length 664 (seq_length=1024) +03/05/2022 04:12:15 - INFO - codeparrot_training - Step 32962: {'lr': 0.000447921932862828, 'samples': 16877056, 'steps': 32962, 'loss/train': 1.8148956298828125} +03/05/2022 04:12:18 - INFO - codeparrot_training - Step 32963: {'lr': 0.00044791869079032154, 'samples': 16877568, 'steps': 32963, 'loss/train': 2.174255609512329} +03/05/2022 04:12:21 - INFO - codeparrot_training - Step 32964: {'lr': 0.000447915448628636, 'samples': 16878080, 'steps': 32964, 'loss/train': 5.452362060546875} +03/05/2022 04:12:22 - INFO - codeparrot_training - Skipping example with length 760 (seq_length=1024) +03/05/2022 04:12:26 - INFO - codeparrot_training - Step 32965: {'lr': 0.0004479122063777728, 'samples': 16878592, 'steps': 32965, 'loss/train': 2.160876989364624} +03/05/2022 04:12:29 - INFO - codeparrot_training - Step 32966: {'lr': 0.0004479089640377334, 'samples': 16879104, 'steps': 32966, 'loss/train': 1.7248125076293945} +03/05/2022 04:12:30 - INFO - codeparrot_training - Skipping example with length 473 (seq_length=1024) +03/05/2022 04:12:35 - INFO - codeparrot_training - Step 32967: {'lr': 0.00044790572160851926, 'samples': 16879616, 'steps': 32967, 'loss/train': 1.7237592935562134} +03/05/2022 04:12:38 - INFO - codeparrot_training - Step 32968: {'lr': 0.00044790247909013195, 'samples': 16880128, 'steps': 32968, 'loss/train': 1.6506916284561157} +03/05/2022 04:12:38 - INFO - codeparrot_training - Skipping example with length 483 (seq_length=1024) +03/05/2022 04:12:43 - INFO - codeparrot_training - Step 32969: {'lr': 0.0004478992364825728, 'samples': 16880640, 'steps': 32969, 'loss/train': 2.5072579383850098} +03/05/2022 04:12:46 - INFO - codeparrot_training - Step 32970: {'lr': 0.00044789599378584324, 'samples': 16881152, 'steps': 32970, 'loss/train': 0.46988773345947266} +03/05/2022 04:12:47 - INFO - codeparrot_training - Skipping example with length 513 (seq_length=1024) +03/05/2022 04:12:52 - INFO - codeparrot_training - Step 32971: {'lr': 0.0004478927509999449, 'samples': 16881664, 'steps': 32971, 'loss/train': 1.8728784322738647} +03/05/2022 04:12:55 - INFO - codeparrot_training - Step 32972: {'lr': 0.00044788950812487907, 'samples': 16882176, 'steps': 32972, 'loss/train': 1.9999496936798096} +03/05/2022 04:12:55 - INFO - codeparrot_training - Skipping example with length 899 (seq_length=1024) +03/05/2022 04:13:00 - INFO - codeparrot_training - Step 32973: {'lr': 0.0004478862651606472, 'samples': 16882688, 'steps': 32973, 'loss/train': 0.8502224683761597} +03/05/2022 04:13:03 - INFO - codeparrot_training - Step 32974: {'lr': 0.000447883022107251, 'samples': 16883200, 'steps': 32974, 'loss/train': 1.6958385705947876} +03/05/2022 04:13:04 - INFO - codeparrot_training - Skipping example with length 796 (seq_length=1024) +03/05/2022 04:13:08 - INFO - codeparrot_training - Step 32975: {'lr': 0.00044787977896469167, 'samples': 16883712, 'steps': 32975, 'loss/train': 1.6159026622772217} +03/05/2022 04:13:12 - INFO - codeparrot_training - Step 32976: {'lr': 0.0004478765357329708, 'samples': 16884224, 'steps': 32976, 'loss/train': 1.754978060722351} +03/05/2022 04:13:12 - INFO - codeparrot_training - Skipping example with length 923 (seq_length=1024) +03/05/2022 04:13:17 - INFO - codeparrot_training - Step 32977: {'lr': 0.0004478732924120897, 'samples': 16884736, 'steps': 32977, 'loss/train': 2.27590274810791} +03/05/2022 04:13:20 - INFO - codeparrot_training - Step 32978: {'lr': 0.0004478700490020501, 'samples': 16885248, 'steps': 32978, 'loss/train': 1.645606517791748} +03/05/2022 04:13:20 - INFO - codeparrot_training - Skipping example with length 406 (seq_length=1024) +03/05/2022 04:13:25 - INFO - codeparrot_training - Step 32979: {'lr': 0.0004478668055028533, 'samples': 16885760, 'steps': 32979, 'loss/train': 1.6534570455551147} +03/05/2022 04:13:28 - INFO - codeparrot_training - Step 32980: {'lr': 0.0004478635619145007, 'samples': 16886272, 'steps': 32980, 'loss/train': 1.9479100704193115} +03/05/2022 04:13:29 - INFO - codeparrot_training - Skipping example with length 908 (seq_length=1024) +03/05/2022 04:13:34 - INFO - codeparrot_training - Step 32981: {'lr': 0.00044786031823699384, 'samples': 16886784, 'steps': 32981, 'loss/train': 2.95906662940979} +03/05/2022 04:13:37 - INFO - codeparrot_training - Step 32982: {'lr': 0.0004478570744703342, 'samples': 16887296, 'steps': 32982, 'loss/train': 1.5737457275390625} +03/05/2022 04:13:37 - INFO - codeparrot_training - Skipping example with length 959 (seq_length=1024) +03/05/2022 04:13:42 - INFO - codeparrot_training - Step 32983: {'lr': 0.00044785383061452324, 'samples': 16887808, 'steps': 32983, 'loss/train': 2.577038049697876} +03/05/2022 04:13:45 - INFO - codeparrot_training - Step 32984: {'lr': 0.00044785058666956234, 'samples': 16888320, 'steps': 32984, 'loss/train': 1.4159278869628906} +03/05/2022 04:13:45 - INFO - codeparrot_training - Skipping example with length 423 (seq_length=1024) +03/05/2022 04:13:50 - INFO - codeparrot_training - Step 32985: {'lr': 0.000447847342635453, 'samples': 16888832, 'steps': 32985, 'loss/train': 1.6427963972091675} +03/05/2022 04:13:53 - INFO - codeparrot_training - Skipping example with length 18 (seq_length=1024) +03/05/2022 04:13:56 - INFO - codeparrot_training - Step 32986: {'lr': 0.00044784409851219675, 'samples': 16889344, 'steps': 32986, 'loss/train': 2.015334367752075} +03/05/2022 04:13:59 - INFO - codeparrot_training - Step 32987: {'lr': 0.00044784085429979504, 'samples': 16889856, 'steps': 32987, 'loss/train': 1.1424051523208618} +03/05/2022 04:14:02 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 04:14:04 - INFO - codeparrot_training - Step 32988: {'lr': 0.00044783760999824926, 'samples': 16890368, 'steps': 32988, 'loss/train': 1.9466280937194824} +03/05/2022 04:14:07 - INFO - codeparrot_training - Step 32989: {'lr': 0.00044783436560756086, 'samples': 16890880, 'steps': 32989, 'loss/train': 1.3393410444259644} +03/05/2022 04:14:10 - INFO - codeparrot_training - Skipping example with length 793 (seq_length=1024) +03/05/2022 04:14:12 - INFO - codeparrot_training - Step 32990: {'lr': 0.00044783112112773137, 'samples': 16891392, 'steps': 32990, 'loss/train': 1.3325341939926147} +03/05/2022 04:14:16 - INFO - codeparrot_training - Step 32991: {'lr': 0.0004478278765587623, 'samples': 16891904, 'steps': 32991, 'loss/train': 1.4183118343353271} +03/05/2022 04:14:18 - INFO - codeparrot_training - Skipping example with length 114 (seq_length=1024) +03/05/2022 04:14:21 - INFO - codeparrot_training - Step 32992: {'lr': 0.000447824631900655, 'samples': 16892416, 'steps': 32992, 'loss/train': 2.4589672088623047} +03/05/2022 04:14:24 - INFO - codeparrot_training - Step 32993: {'lr': 0.00044782138715341094, 'samples': 16892928, 'steps': 32993, 'loss/train': 1.7131288051605225} +03/05/2022 04:14:26 - INFO - codeparrot_training - Skipping example with length 810 (seq_length=1024) +03/05/2022 04:14:29 - INFO - codeparrot_training - Step 32994: {'lr': 0.00044781814231703164, 'samples': 16893440, 'steps': 32994, 'loss/train': 1.8118724822998047} +03/05/2022 04:14:32 - INFO - codeparrot_training - Step 32995: {'lr': 0.00044781489739151856, 'samples': 16893952, 'steps': 32995, 'loss/train': 1.2344074249267578} +03/05/2022 04:14:35 - INFO - codeparrot_training - Skipping example with length 79 (seq_length=1024) +03/05/2022 04:14:38 - INFO - codeparrot_training - Step 32996: {'lr': 0.00044781165237687306, 'samples': 16894464, 'steps': 32996, 'loss/train': 1.0614559650421143} +03/05/2022 04:14:41 - INFO - codeparrot_training - Step 32997: {'lr': 0.00044780840727309676, 'samples': 16894976, 'steps': 32997, 'loss/train': 1.1566686630249023} +03/05/2022 04:14:43 - INFO - codeparrot_training - Skipping example with length 453 (seq_length=1024) +03/05/2022 04:14:46 - INFO - codeparrot_training - Step 32998: {'lr': 0.000447805162080191, 'samples': 16895488, 'steps': 32998, 'loss/train': 1.7748897075653076} +03/05/2022 04:14:49 - INFO - codeparrot_training - Step 32999: {'lr': 0.0004478019167981573, 'samples': 16896000, 'steps': 32999, 'loss/train': 1.5093451738357544} +03/05/2022 04:14:51 - INFO - codeparrot_training - Skipping example with length 207 (seq_length=1024) +03/05/2022 04:14:55 - INFO - codeparrot_training - Step 33000: {'lr': 0.00044779867142699713, 'samples': 16896512, 'steps': 33000, 'loss/train': 1.4905484914779663} +03/05/2022 04:14:58 - INFO - codeparrot_training - Step 33001: {'lr': 0.0004477954259667119, 'samples': 16897024, 'steps': 33001, 'loss/train': 2.0186970233917236} +03/05/2022 04:15:00 - INFO - codeparrot_training - Skipping example with length 127 (seq_length=1024) +03/05/2022 04:15:03 - INFO - codeparrot_training - Step 33002: {'lr': 0.00044779218041730314, 'samples': 16897536, 'steps': 33002, 'loss/train': 2.1597375869750977} +03/05/2022 04:15:06 - INFO - codeparrot_training - Step 33003: {'lr': 0.00044778893477877225, 'samples': 16898048, 'steps': 33003, 'loss/train': 1.7150853872299194} +03/05/2022 04:15:09 - INFO - codeparrot_training - Skipping example with length 567 (seq_length=1024) +03/05/2022 04:15:11 - INFO - codeparrot_training - Step 33004: {'lr': 0.0004477856890511207, 'samples': 16898560, 'steps': 33004, 'loss/train': 1.1960991621017456} +03/05/2022 04:15:15 - INFO - codeparrot_training - Step 33005: {'lr': 0.00044778244323435, 'samples': 16899072, 'steps': 33005, 'loss/train': 2.00954008102417} +03/05/2022 04:15:17 - INFO - codeparrot_training - Skipping example with length 611 (seq_length=1024) +03/05/2022 04:15:20 - INFO - codeparrot_training - Step 33006: {'lr': 0.0004477791973284616, 'samples': 16899584, 'steps': 33006, 'loss/train': 2.0102460384368896} +03/05/2022 04:15:23 - INFO - codeparrot_training - Step 33007: {'lr': 0.00044777595133345686, 'samples': 16900096, 'steps': 33007, 'loss/train': 0.05891214683651924} +03/05/2022 04:15:25 - INFO - codeparrot_training - Skipping example with length 448 (seq_length=1024) +03/05/2022 04:15:28 - INFO - codeparrot_training - Step 33008: {'lr': 0.0004477727052493374, 'samples': 16900608, 'steps': 33008, 'loss/train': 1.1184289455413818} +03/05/2022 04:15:32 - INFO - codeparrot_training - Step 33009: {'lr': 0.0004477694590761046, 'samples': 16901120, 'steps': 33009, 'loss/train': 0.05224824696779251} +03/05/2022 04:15:34 - INFO - codeparrot_training - Skipping example with length 186 (seq_length=1024) +03/05/2022 04:15:37 - INFO - codeparrot_training - Step 33010: {'lr': 0.00044776621281375994, 'samples': 16901632, 'steps': 33010, 'loss/train': 1.8125286102294922} +03/05/2022 04:15:40 - INFO - codeparrot_training - Step 33011: {'lr': 0.00044776296646230487, 'samples': 16902144, 'steps': 33011, 'loss/train': 2.3796088695526123} +03/05/2022 04:15:42 - INFO - codeparrot_training - Skipping example with length 16 (seq_length=1024) +03/05/2022 04:15:45 - INFO - codeparrot_training - Step 33012: {'lr': 0.00044775972002174085, 'samples': 16902656, 'steps': 33012, 'loss/train': 1.739351749420166} +03/05/2022 04:15:48 - INFO - codeparrot_training - Step 33013: {'lr': 0.0004477564734920694, 'samples': 16903168, 'steps': 33013, 'loss/train': 0.966182291507721} +03/05/2022 04:15:50 - INFO - codeparrot_training - Skipping example with length 758 (seq_length=1024) +03/05/2022 04:15:54 - INFO - codeparrot_training - Step 33014: {'lr': 0.0004477532268732919, 'samples': 16903680, 'steps': 33014, 'loss/train': 1.606831431388855} +03/05/2022 04:15:57 - INFO - codeparrot_training - Step 33015: {'lr': 0.00044774998016540977, 'samples': 16904192, 'steps': 33015, 'loss/train': 1.6030378341674805} +03/05/2022 04:15:58 - INFO - codeparrot_training - Skipping example with length 583 (seq_length=1024) +03/05/2022 04:16:03 - INFO - codeparrot_training - Step 33016: {'lr': 0.00044774673336842464, 'samples': 16904704, 'steps': 33016, 'loss/train': 2.202526330947876} +03/05/2022 04:16:06 - INFO - codeparrot_training - Step 33017: {'lr': 0.0004477434864823379, 'samples': 16905216, 'steps': 33017, 'loss/train': 1.2800613641738892} +03/05/2022 04:16:09 - INFO - codeparrot_training - Step 33018: {'lr': 0.00044774023950715095, 'samples': 16905728, 'steps': 33018, 'loss/train': 1.3114080429077148} +03/05/2022 04:16:10 - INFO - codeparrot_training - Skipping example with length 450 (seq_length=1024) +03/05/2022 04:16:14 - INFO - codeparrot_training - Step 33019: {'lr': 0.0004477369924428653, 'samples': 16906240, 'steps': 33019, 'loss/train': 1.9431343078613281} +03/05/2022 04:16:17 - INFO - codeparrot_training - Step 33020: {'lr': 0.0004477337452894824, 'samples': 16906752, 'steps': 33020, 'loss/train': 1.983815312385559} +03/05/2022 04:16:18 - INFO - codeparrot_training - Skipping example with length 556 (seq_length=1024) +03/05/2022 04:16:23 - INFO - codeparrot_training - Step 33021: {'lr': 0.0004477304980470038, 'samples': 16907264, 'steps': 33021, 'loss/train': 0.5019639730453491} +03/05/2022 04:16:26 - INFO - codeparrot_training - Step 33022: {'lr': 0.0004477272507154308, 'samples': 16907776, 'steps': 33022, 'loss/train': 1.659754991531372} +03/05/2022 04:16:26 - INFO - codeparrot_training - Skipping example with length 1016 (seq_length=1024) +03/05/2022 04:16:31 - INFO - codeparrot_training - Step 33023: {'lr': 0.00044772400329476505, 'samples': 16908288, 'steps': 33023, 'loss/train': 1.7549325227737427} +03/05/2022 04:16:34 - INFO - codeparrot_training - Step 33024: {'lr': 0.0004477207557850078, 'samples': 16908800, 'steps': 33024, 'loss/train': 0.8928710222244263} +03/05/2022 04:16:35 - INFO - codeparrot_training - Skipping example with length 280 (seq_length=1024) +03/05/2022 04:16:39 - INFO - codeparrot_training - Step 33025: {'lr': 0.00044771750818616067, 'samples': 16909312, 'steps': 33025, 'loss/train': 1.886451244354248} +03/05/2022 04:16:43 - INFO - codeparrot_training - Step 33026: {'lr': 0.0004477142604982251, 'samples': 16909824, 'steps': 33026, 'loss/train': 1.3175508975982666} +03/05/2022 04:16:43 - INFO - codeparrot_training - Skipping example with length 832 (seq_length=1024) +03/05/2022 04:16:48 - INFO - codeparrot_training - Step 33027: {'lr': 0.0004477110127212025, 'samples': 16910336, 'steps': 33027, 'loss/train': 2.170865297317505} +03/05/2022 04:16:51 - INFO - codeparrot_training - Step 33028: {'lr': 0.00044770776485509445, 'samples': 16910848, 'steps': 33028, 'loss/train': 1.8284481763839722} +03/05/2022 04:16:51 - INFO - codeparrot_training - Skipping example with length 855 (seq_length=1024) +03/05/2022 04:16:56 - INFO - codeparrot_training - Step 33029: {'lr': 0.00044770451689990227, 'samples': 16911360, 'steps': 33029, 'loss/train': 2.1039533615112305} +03/05/2022 04:16:59 - INFO - codeparrot_training - Step 33030: {'lr': 0.0004477012688556275, 'samples': 16911872, 'steps': 33030, 'loss/train': 1.4315627813339233} +03/05/2022 04:16:59 - INFO - codeparrot_training - Skipping example with length 103 (seq_length=1024) +03/05/2022 04:17:05 - INFO - codeparrot_training - Step 33031: {'lr': 0.0004476980207222716, 'samples': 16912384, 'steps': 33031, 'loss/train': 1.7976057529449463} +03/05/2022 04:17:08 - INFO - codeparrot_training - Step 33032: {'lr': 0.00044769477249983596, 'samples': 16912896, 'steps': 33032, 'loss/train': 1.3541350364685059} +03/05/2022 04:17:08 - INFO - codeparrot_training - Skipping example with length 33 (seq_length=1024) +03/05/2022 04:17:13 - INFO - codeparrot_training - Step 33033: {'lr': 0.00044769152418832215, 'samples': 16913408, 'steps': 33033, 'loss/train': 0.954656183719635} +03/05/2022 04:17:16 - INFO - codeparrot_training - Step 33034: {'lr': 0.00044768827578773164, 'samples': 16913920, 'steps': 33034, 'loss/train': 1.6620924472808838} +03/05/2022 04:17:16 - INFO - codeparrot_training - Skipping example with length 720 (seq_length=1024) +03/05/2022 04:17:22 - INFO - codeparrot_training - Step 33035: {'lr': 0.00044768502729806574, 'samples': 16914432, 'steps': 33035, 'loss/train': 0.0657031387090683} +03/05/2022 04:17:25 - INFO - codeparrot_training - Step 33036: {'lr': 0.0004476817787193261, 'samples': 16914944, 'steps': 33036, 'loss/train': 2.6146161556243896} +03/05/2022 04:17:25 - INFO - codeparrot_training - Skipping example with length 35 (seq_length=1024) +03/05/2022 04:17:30 - INFO - codeparrot_training - Step 33037: {'lr': 0.0004476785300515141, 'samples': 16915456, 'steps': 33037, 'loss/train': 1.4477626085281372} +03/05/2022 04:17:33 - INFO - codeparrot_training - Skipping example with length 601 (seq_length=1024) +03/05/2022 04:17:35 - INFO - codeparrot_training - Step 33038: {'lr': 0.0004476752812946312, 'samples': 16915968, 'steps': 33038, 'loss/train': 1.442064642906189} +03/05/2022 04:17:38 - INFO - codeparrot_training - Step 33039: {'lr': 0.0004476720324486788, 'samples': 16916480, 'steps': 33039, 'loss/train': 0.7201438546180725} +03/05/2022 04:17:41 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 04:17:44 - INFO - codeparrot_training - Step 33040: {'lr': 0.0004476687835136585, 'samples': 16916992, 'steps': 33040, 'loss/train': 0.7878016829490662} +03/05/2022 04:17:47 - INFO - codeparrot_training - Step 33041: {'lr': 0.0004476655344895717, 'samples': 16917504, 'steps': 33041, 'loss/train': 1.5895615816116333} +03/05/2022 04:17:50 - INFO - codeparrot_training - Skipping example with length 532 (seq_length=1024) +03/05/2022 04:17:52 - INFO - codeparrot_training - Step 33042: {'lr': 0.0004476622853764198, 'samples': 16918016, 'steps': 33042, 'loss/train': 2.5252041816711426} +03/05/2022 04:17:55 - INFO - codeparrot_training - Step 33043: {'lr': 0.00044765903617420436, 'samples': 16918528, 'steps': 33043, 'loss/train': 2.5129315853118896} +03/05/2022 04:17:58 - INFO - codeparrot_training - Skipping example with length 35 (seq_length=1024) +03/05/2022 04:18:01 - INFO - codeparrot_training - Step 33044: {'lr': 0.00044765578688292686, 'samples': 16919040, 'steps': 33044, 'loss/train': 2.534588098526001} +03/05/2022 04:18:04 - INFO - codeparrot_training - Step 33045: {'lr': 0.0004476525375025886, 'samples': 16919552, 'steps': 33045, 'loss/train': 1.2728670835494995} +03/05/2022 04:18:07 - INFO - codeparrot_training - Skipping example with length 340 (seq_length=1024) +03/05/2022 04:18:09 - INFO - codeparrot_training - Step 33046: {'lr': 0.00044764928803319126, 'samples': 16920064, 'steps': 33046, 'loss/train': 1.235376238822937} +03/05/2022 04:18:12 - INFO - codeparrot_training - Step 33047: {'lr': 0.00044764603847473615, 'samples': 16920576, 'steps': 33047, 'loss/train': 1.8117481470108032} +03/05/2022 04:18:15 - INFO - codeparrot_training - Skipping example with length 194 (seq_length=1024) +03/05/2022 04:18:17 - INFO - codeparrot_training - Step 33048: {'lr': 0.0004476427888272248, 'samples': 16921088, 'steps': 33048, 'loss/train': 1.74118971824646} +03/05/2022 04:18:21 - INFO - codeparrot_training - Step 33049: {'lr': 0.0004476395390906586, 'samples': 16921600, 'steps': 33049, 'loss/train': 1.5807212591171265} +03/05/2022 04:18:23 - INFO - codeparrot_training - Skipping example with length 276 (seq_length=1024) +03/05/2022 04:18:26 - INFO - codeparrot_training - Step 33050: {'lr': 0.0004476362892650392, 'samples': 16922112, 'steps': 33050, 'loss/train': 1.9261671304702759} +03/05/2022 04:18:29 - INFO - codeparrot_training - Step 33051: {'lr': 0.0004476330393503678, 'samples': 16922624, 'steps': 33051, 'loss/train': 1.978813886642456} +03/05/2022 04:18:31 - INFO - codeparrot_training - Skipping example with length 945 (seq_length=1024) +03/05/2022 04:18:34 - INFO - codeparrot_training - Step 33052: {'lr': 0.0004476297893466461, 'samples': 16923136, 'steps': 33052, 'loss/train': 1.574313759803772} +03/05/2022 04:18:37 - INFO - codeparrot_training - Step 33053: {'lr': 0.0004476265392538754, 'samples': 16923648, 'steps': 33053, 'loss/train': 2.2591452598571777} +03/05/2022 04:18:40 - INFO - codeparrot_training - Skipping example with length 372 (seq_length=1024) +03/05/2022 04:18:43 - INFO - codeparrot_training - Step 33054: {'lr': 0.0004476232890720573, 'samples': 16924160, 'steps': 33054, 'loss/train': 0.21593250334262848} +03/05/2022 04:18:46 - INFO - codeparrot_training - Step 33055: {'lr': 0.0004476200388011932, 'samples': 16924672, 'steps': 33055, 'loss/train': 2.560988187789917} +03/05/2022 04:18:48 - INFO - codeparrot_training - Skipping example with length 688 (seq_length=1024) +03/05/2022 04:18:51 - INFO - codeparrot_training - Step 33056: {'lr': 0.0004476167884412845, 'samples': 16925184, 'steps': 33056, 'loss/train': 1.9278711080551147} +03/05/2022 04:18:54 - INFO - codeparrot_training - Step 33057: {'lr': 0.00044761353799233273, 'samples': 16925696, 'steps': 33057, 'loss/train': 0.09464825689792633} +03/05/2022 04:18:57 - INFO - codeparrot_training - Skipping example with length 24 (seq_length=1024) +03/05/2022 04:19:00 - INFO - codeparrot_training - Step 33058: {'lr': 0.00044761028745433934, 'samples': 16926208, 'steps': 33058, 'loss/train': 1.5981062650680542} +03/05/2022 04:19:03 - INFO - codeparrot_training - Step 33059: {'lr': 0.00044760703682730584, 'samples': 16926720, 'steps': 33059, 'loss/train': 0.5028110146522522} +03/05/2022 04:19:05 - INFO - codeparrot_training - Skipping example with length 387 (seq_length=1024) +03/05/2022 04:19:08 - INFO - codeparrot_training - Step 33060: {'lr': 0.00044760378611123365, 'samples': 16927232, 'steps': 33060, 'loss/train': 1.439496397972107} +03/05/2022 04:19:11 - INFO - codeparrot_training - Step 33061: {'lr': 0.0004476005353061242, 'samples': 16927744, 'steps': 33061, 'loss/train': 2.2588398456573486} +03/05/2022 04:19:14 - INFO - codeparrot_training - Skipping example with length 944 (seq_length=1024) +03/05/2022 04:19:16 - INFO - codeparrot_training - Step 33062: {'lr': 0.00044759728441197904, 'samples': 16928256, 'steps': 33062, 'loss/train': 1.6910161972045898} +03/05/2022 04:19:20 - INFO - codeparrot_training - Step 33063: {'lr': 0.0004475940334287996, 'samples': 16928768, 'steps': 33063, 'loss/train': 2.3105356693267822} +03/05/2022 04:19:22 - INFO - codeparrot_training - Skipping example with length 853 (seq_length=1024) +03/05/2022 04:19:25 - INFO - codeparrot_training - Step 33064: {'lr': 0.0004475907823565873, 'samples': 16929280, 'steps': 33064, 'loss/train': 2.732370615005493} +03/05/2022 04:19:28 - INFO - codeparrot_training - Step 33065: {'lr': 0.00044758753119534373, 'samples': 16929792, 'steps': 33065, 'loss/train': 2.0259897708892822} +03/05/2022 04:19:31 - INFO - codeparrot_training - Step 33066: {'lr': 0.0004475842799450702, 'samples': 16930304, 'steps': 33066, 'loss/train': 2.103271007537842} +03/05/2022 04:19:31 - INFO - codeparrot_training - Skipping example with length 332 (seq_length=1024) +03/05/2022 04:19:37 - INFO - codeparrot_training - Step 33067: {'lr': 0.0004475810286057682, 'samples': 16930816, 'steps': 33067, 'loss/train': 0.9005130529403687} +03/05/2022 04:19:39 - INFO - codeparrot_training - Skipping example with length 722 (seq_length=1024) +03/05/2022 04:19:42 - INFO - codeparrot_training - Step 33068: {'lr': 0.0004475777771774393, 'samples': 16931328, 'steps': 33068, 'loss/train': 1.537448525428772} +03/05/2022 04:19:45 - INFO - codeparrot_training - Step 33069: {'lr': 0.00044757452566008497, 'samples': 16931840, 'steps': 33069, 'loss/train': 1.4250881671905518} +03/05/2022 04:19:48 - INFO - codeparrot_training - Skipping example with length 918 (seq_length=1024) +03/05/2022 04:19:50 - INFO - codeparrot_training - Step 33070: {'lr': 0.00044757127405370645, 'samples': 16932352, 'steps': 33070, 'loss/train': 1.5197818279266357} +03/05/2022 04:19:53 - INFO - codeparrot_training - Step 33071: {'lr': 0.00044756802235830544, 'samples': 16932864, 'steps': 33071, 'loss/train': 1.6353663206100464} +03/05/2022 04:19:56 - INFO - codeparrot_training - Skipping example with length 852 (seq_length=1024) +03/05/2022 04:19:59 - INFO - codeparrot_training - Step 33072: {'lr': 0.00044756477057388336, 'samples': 16933376, 'steps': 33072, 'loss/train': 0.8650037050247192} +03/05/2022 04:20:02 - INFO - codeparrot_training - Step 33073: {'lr': 0.0004475615187004416, 'samples': 16933888, 'steps': 33073, 'loss/train': 1.7573469877243042} +03/05/2022 04:20:04 - INFO - codeparrot_training - Skipping example with length 633 (seq_length=1024) +03/05/2022 04:20:07 - INFO - codeparrot_training - Step 33074: {'lr': 0.0004475582667379817, 'samples': 16934400, 'steps': 33074, 'loss/train': 1.3492982387542725} +03/05/2022 04:20:10 - INFO - codeparrot_training - Step 33075: {'lr': 0.0004475550146865051, 'samples': 16934912, 'steps': 33075, 'loss/train': 1.9725797176361084} +03/05/2022 04:20:13 - INFO - codeparrot_training - Skipping example with length 507 (seq_length=1024) +03/05/2022 04:20:16 - INFO - codeparrot_training - Step 33076: {'lr': 0.00044755176254601323, 'samples': 16935424, 'steps': 33076, 'loss/train': 1.2180640697479248} +03/05/2022 04:20:19 - INFO - codeparrot_training - Step 33077: {'lr': 0.00044754851031650756, 'samples': 16935936, 'steps': 33077, 'loss/train': 1.948065996170044} +03/05/2022 04:20:21 - INFO - codeparrot_training - Skipping example with length 547 (seq_length=1024) +03/05/2022 04:20:24 - INFO - codeparrot_training - Step 33078: {'lr': 0.0004475452579979896, 'samples': 16936448, 'steps': 33078, 'loss/train': 1.8464277982711792} +03/05/2022 04:20:27 - INFO - codeparrot_training - Step 33079: {'lr': 0.00044754200559046076, 'samples': 16936960, 'steps': 33079, 'loss/train': 1.9367538690567017} +03/05/2022 04:20:29 - INFO - codeparrot_training - Skipping example with length 830 (seq_length=1024) +03/05/2022 04:20:33 - INFO - codeparrot_training - Step 33080: {'lr': 0.0004475387530939226, 'samples': 16937472, 'steps': 33080, 'loss/train': 2.307396173477173} +03/05/2022 04:20:36 - INFO - codeparrot_training - Step 33081: {'lr': 0.00044753550050837654, 'samples': 16937984, 'steps': 33081, 'loss/train': 1.8598867654800415} +03/05/2022 04:20:38 - INFO - codeparrot_training - Skipping example with length 81 (seq_length=1024) +03/05/2022 04:20:41 - INFO - codeparrot_training - Step 33082: {'lr': 0.00044753224783382394, 'samples': 16938496, 'steps': 33082, 'loss/train': 2.262383460998535} +03/05/2022 04:20:45 - INFO - codeparrot_training - Step 33083: {'lr': 0.00044752899507026646, 'samples': 16939008, 'steps': 33083, 'loss/train': 1.4210560321807861} +03/05/2022 04:20:48 - INFO - codeparrot_training - Step 33084: {'lr': 0.00044752574221770537, 'samples': 16939520, 'steps': 33084, 'loss/train': 1.2933735847473145} +03/05/2022 04:20:48 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 04:20:53 - INFO - codeparrot_training - Step 33085: {'lr': 0.0004475224892761423, 'samples': 16940032, 'steps': 33085, 'loss/train': 1.797582983970642} +03/05/2022 04:20:56 - INFO - codeparrot_training - Step 33086: {'lr': 0.00044751923624557866, 'samples': 16940544, 'steps': 33086, 'loss/train': 0.8822979927062988} +03/05/2022 04:20:57 - INFO - codeparrot_training - Skipping example with length 360 (seq_length=1024) +03/05/2022 04:21:01 - INFO - codeparrot_training - Step 33087: {'lr': 0.0004475159831260158, 'samples': 16941056, 'steps': 33087, 'loss/train': 1.564642310142517} +03/05/2022 04:21:05 - INFO - codeparrot_training - Step 33088: {'lr': 0.00044751272991745537, 'samples': 16941568, 'steps': 33088, 'loss/train': 1.5531375408172607} +03/05/2022 04:21:05 - INFO - codeparrot_training - Skipping example with length 347 (seq_length=1024) +03/05/2022 04:21:10 - INFO - codeparrot_training - Step 33089: {'lr': 0.00044750947661989873, 'samples': 16942080, 'steps': 33089, 'loss/train': 1.2890675067901611} +03/05/2022 04:21:13 - INFO - codeparrot_training - Step 33090: {'lr': 0.0004475062232333474, 'samples': 16942592, 'steps': 33090, 'loss/train': 1.044869065284729} +03/05/2022 04:21:13 - INFO - codeparrot_training - Skipping example with length 966 (seq_length=1024) +03/05/2022 04:21:18 - INFO - codeparrot_training - Step 33091: {'lr': 0.00044750296975780277, 'samples': 16943104, 'steps': 33091, 'loss/train': 1.585540771484375} +03/05/2022 04:21:22 - INFO - codeparrot_training - Step 33092: {'lr': 0.00044749971619326633, 'samples': 16943616, 'steps': 33092, 'loss/train': 2.3870625495910645} +03/05/2022 04:21:22 - INFO - codeparrot_training - Skipping example with length 49 (seq_length=1024) +03/05/2022 04:21:27 - INFO - codeparrot_training - Step 33093: {'lr': 0.0004474964625397396, 'samples': 16944128, 'steps': 33093, 'loss/train': 2.506782293319702} +03/05/2022 04:21:30 - INFO - codeparrot_training - Step 33094: {'lr': 0.000447493208797224, 'samples': 16944640, 'steps': 33094, 'loss/train': 1.5199761390686035} +03/05/2022 04:21:30 - INFO - codeparrot_training - Skipping example with length 171 (seq_length=1024) +03/05/2022 04:21:35 - INFO - codeparrot_training - Step 33095: {'lr': 0.00044748995496572105, 'samples': 16945152, 'steps': 33095, 'loss/train': 1.9823384284973145} +03/05/2022 04:21:39 - INFO - codeparrot_training - Step 33096: {'lr': 0.0004474867010452321, 'samples': 16945664, 'steps': 33096, 'loss/train': 1.3394315242767334} +03/05/2022 04:21:39 - INFO - codeparrot_training - Skipping example with length 594 (seq_length=1024) +03/05/2022 04:21:44 - INFO - codeparrot_training - Step 33097: {'lr': 0.0004474834470357587, 'samples': 16946176, 'steps': 33097, 'loss/train': 1.5819625854492188} +03/05/2022 04:21:47 - INFO - codeparrot_training - Skipping example with length 136 (seq_length=1024) +03/05/2022 04:21:49 - INFO - codeparrot_training - Step 33098: {'lr': 0.00044748019293730236, 'samples': 16946688, 'steps': 33098, 'loss/train': 0.9642543196678162} +03/05/2022 04:21:52 - INFO - codeparrot_training - Step 33099: {'lr': 0.0004474769387498645, 'samples': 16947200, 'steps': 33099, 'loss/train': 2.053542375564575} +03/05/2022 04:21:55 - INFO - codeparrot_training - Step 33100: {'lr': 0.0004474736844734465, 'samples': 16947712, 'steps': 33100, 'loss/train': 1.1247843503952026} +03/05/2022 04:21:56 - INFO - codeparrot_training - Skipping example with length 6 (seq_length=1024) +03/05/2022 04:22:01 - INFO - codeparrot_training - Step 33101: {'lr': 0.00044747043010805, 'samples': 16948224, 'steps': 33101, 'loss/train': 2.1274490356445312} +03/05/2022 04:22:04 - INFO - codeparrot_training - Step 33102: {'lr': 0.0004474671756536763, 'samples': 16948736, 'steps': 33102, 'loss/train': 2.713592290878296} +03/05/2022 04:22:04 - INFO - codeparrot_training - Skipping example with length 556 (seq_length=1024) +03/05/2022 04:22:09 - INFO - codeparrot_training - Step 33103: {'lr': 0.00044746392111032695, 'samples': 16949248, 'steps': 33103, 'loss/train': 2.0415961742401123} +03/05/2022 04:22:12 - INFO - codeparrot_training - Step 33104: {'lr': 0.00044746066647800343, 'samples': 16949760, 'steps': 33104, 'loss/train': 1.6582971811294556} +03/05/2022 04:22:12 - INFO - codeparrot_training - Skipping example with length 297 (seq_length=1024) +03/05/2022 04:22:17 - INFO - codeparrot_training - Step 33105: {'lr': 0.0004474574117567072, 'samples': 16950272, 'steps': 33105, 'loss/train': 1.3262115716934204} +03/05/2022 04:22:21 - INFO - codeparrot_training - Step 33106: {'lr': 0.00044745415694643964, 'samples': 16950784, 'steps': 33106, 'loss/train': 1.4172344207763672} +03/05/2022 04:22:21 - INFO - codeparrot_training - Skipping example with length 908 (seq_length=1024) +03/05/2022 04:22:26 - INFO - codeparrot_training - Step 33107: {'lr': 0.0004474509020472023, 'samples': 16951296, 'steps': 33107, 'loss/train': 6.424846172332764} +03/05/2022 04:22:29 - INFO - codeparrot_training - Step 33108: {'lr': 0.0004474476470589967, 'samples': 16951808, 'steps': 33108, 'loss/train': 1.4720209836959839} +03/05/2022 04:22:31 - INFO - codeparrot_training - Skipping example with length 869 (seq_length=1024) +03/05/2022 04:22:35 - INFO - codeparrot_training - Step 33109: {'lr': 0.0004474443919818241, 'samples': 16952320, 'steps': 33109, 'loss/train': 1.9591988325119019} +03/05/2022 04:22:38 - INFO - codeparrot_training - Step 33110: {'lr': 0.0004474411368156862, 'samples': 16952832, 'steps': 33110, 'loss/train': 1.7638566493988037} +03/05/2022 04:22:39 - INFO - codeparrot_training - Skipping example with length 597 (seq_length=1024) +03/05/2022 04:22:44 - INFO - codeparrot_training - Step 33111: {'lr': 0.00044743788156058437, 'samples': 16953344, 'steps': 33111, 'loss/train': 1.6902018785476685} +03/05/2022 04:22:47 - INFO - codeparrot_training - Step 33112: {'lr': 0.00044743462621652007, 'samples': 16953856, 'steps': 33112, 'loss/train': 1.8489786386489868} +03/05/2022 04:22:49 - INFO - codeparrot_training - Skipping example with length 262 (seq_length=1024) +03/05/2022 04:22:52 - INFO - codeparrot_training - Step 33113: {'lr': 0.0004474313707834947, 'samples': 16954368, 'steps': 33113, 'loss/train': 1.8566254377365112} +03/05/2022 04:22:55 - INFO - codeparrot_training - Step 33114: {'lr': 0.00044742811526150996, 'samples': 16954880, 'steps': 33114, 'loss/train': 1.3113315105438232} +03/05/2022 04:22:57 - INFO - codeparrot_training - Skipping example with length 697 (seq_length=1024) +03/05/2022 04:23:01 - INFO - codeparrot_training - Step 33115: {'lr': 0.000447424859650567, 'samples': 16955392, 'steps': 33115, 'loss/train': 1.6944289207458496} +03/05/2022 04:23:04 - INFO - codeparrot_training - Step 33116: {'lr': 0.00044742160395066756, 'samples': 16955904, 'steps': 33116, 'loss/train': 1.5802167654037476} +03/05/2022 04:23:07 - INFO - codeparrot_training - Skipping example with length 617 (seq_length=1024) +03/05/2022 04:23:09 - INFO - codeparrot_training - Step 33117: {'lr': 0.0004474183481618129, 'samples': 16956416, 'steps': 33117, 'loss/train': 1.2100180387496948} +03/05/2022 04:23:12 - INFO - codeparrot_training - Step 33118: {'lr': 0.00044741509228400465, 'samples': 16956928, 'steps': 33118, 'loss/train': 0.3639983534812927} +03/05/2022 04:23:15 - INFO - codeparrot_training - Step 33119: {'lr': 0.0004474118363172441, 'samples': 16957440, 'steps': 33119, 'loss/train': 1.4498764276504517} +03/05/2022 04:23:16 - INFO - codeparrot_training - Skipping example with length 592 (seq_length=1024) +03/05/2022 04:23:21 - INFO - codeparrot_training - Step 33120: {'lr': 0.000447408580261533, 'samples': 16957952, 'steps': 33120, 'loss/train': 1.8144738674163818} +03/05/2022 04:23:24 - INFO - codeparrot_training - Step 33121: {'lr': 0.0004474053241168725, 'samples': 16958464, 'steps': 33121, 'loss/train': 1.6722996234893799} +03/05/2022 04:23:24 - INFO - codeparrot_training - Skipping example with length 543 (seq_length=1024) +03/05/2022 04:23:29 - INFO - codeparrot_training - Step 33122: {'lr': 0.00044740206788326423, 'samples': 16958976, 'steps': 33122, 'loss/train': 1.9530354738235474} +03/05/2022 04:23:32 - INFO - codeparrot_training - Step 33123: {'lr': 0.0004473988115607097, 'samples': 16959488, 'steps': 33123, 'loss/train': 1.8632655143737793} +03/05/2022 04:23:38 - INFO - codeparrot_training - Step 33124: {'lr': 0.00044739555514921025, 'samples': 16960000, 'steps': 33124, 'loss/train': 1.59609055519104} +03/05/2022 04:23:41 - INFO - codeparrot_training - Step 33125: {'lr': 0.0004473922986487674, 'samples': 16960512, 'steps': 33125, 'loss/train': 1.8414554595947266} +03/05/2022 04:23:41 - INFO - codeparrot_training - Skipping example with length 503 (seq_length=1024) +03/05/2022 04:23:46 - INFO - codeparrot_training - Step 33126: {'lr': 0.00044738904205938264, 'samples': 16961024, 'steps': 33126, 'loss/train': 1.814988613128662} +03/05/2022 04:23:49 - INFO - codeparrot_training - Step 33127: {'lr': 0.00044738578538105746, 'samples': 16961536, 'steps': 33127, 'loss/train': 2.1402242183685303} +03/05/2022 04:23:49 - INFO - codeparrot_training - Skipping example with length 727 (seq_length=1024) +03/05/2022 04:23:55 - INFO - codeparrot_training - Step 33128: {'lr': 0.0004473825286137933, 'samples': 16962048, 'steps': 33128, 'loss/train': 1.9264236688613892} +03/05/2022 04:23:58 - INFO - codeparrot_training - Step 33129: {'lr': 0.0004473792717575915, 'samples': 16962560, 'steps': 33129, 'loss/train': 1.0212764739990234} +03/05/2022 04:23:58 - INFO - codeparrot_training - Skipping example with length 744 (seq_length=1024) +03/05/2022 04:24:03 - INFO - codeparrot_training - Step 33130: {'lr': 0.00044737601481245376, 'samples': 16963072, 'steps': 33130, 'loss/train': 1.0782076120376587} +03/05/2022 04:24:06 - INFO - codeparrot_training - Skipping example with length 184 (seq_length=1024) +03/05/2022 04:24:08 - INFO - codeparrot_training - Step 33131: {'lr': 0.00044737275777838136, 'samples': 16963584, 'steps': 33131, 'loss/train': 1.4459834098815918} +03/05/2022 04:24:12 - INFO - codeparrot_training - Step 33132: {'lr': 0.0004473695006553759, 'samples': 16964096, 'steps': 33132, 'loss/train': 2.4437780380249023} +03/05/2022 04:24:14 - INFO - codeparrot_training - Skipping example with length 365 (seq_length=1024) +03/05/2022 04:24:17 - INFO - codeparrot_training - Step 33133: {'lr': 0.0004473662434434388, 'samples': 16964608, 'steps': 33133, 'loss/train': 1.305116891860962} +03/05/2022 04:24:20 - INFO - codeparrot_training - Step 33134: {'lr': 0.00044736298614257144, 'samples': 16965120, 'steps': 33134, 'loss/train': 2.374018907546997} +03/05/2022 04:24:23 - INFO - codeparrot_training - Step 33135: {'lr': 0.0004473597287527754, 'samples': 16965632, 'steps': 33135, 'loss/train': 1.4758410453796387} +03/05/2022 04:24:24 - INFO - codeparrot_training - Skipping example with length 969 (seq_length=1024) +03/05/2022 04:24:29 - INFO - codeparrot_training - Step 33136: {'lr': 0.00044735647127405216, 'samples': 16966144, 'steps': 33136, 'loss/train': 2.0594801902770996} +03/05/2022 04:24:32 - INFO - codeparrot_training - Step 33137: {'lr': 0.00044735321370640316, 'samples': 16966656, 'steps': 33137, 'loss/train': 1.5817471742630005} +03/05/2022 04:24:32 - INFO - codeparrot_training - Skipping example with length 81 (seq_length=1024) +03/05/2022 04:24:37 - INFO - codeparrot_training - Step 33138: {'lr': 0.00044734995604982973, 'samples': 16967168, 'steps': 33138, 'loss/train': 1.5470978021621704} +03/05/2022 04:24:40 - INFO - codeparrot_training - Step 33139: {'lr': 0.0004473466983043335, 'samples': 16967680, 'steps': 33139, 'loss/train': 2.2806003093719482} +03/05/2022 04:24:40 - INFO - codeparrot_training - Skipping example with length 700 (seq_length=1024) +03/05/2022 04:24:45 - INFO - codeparrot_training - Step 33140: {'lr': 0.0004473434404699159, 'samples': 16968192, 'steps': 33140, 'loss/train': 1.482629418373108} +03/05/2022 04:24:48 - INFO - codeparrot_training - Step 33141: {'lr': 0.00044734018254657845, 'samples': 16968704, 'steps': 33141, 'loss/train': 1.1464323997497559} +03/05/2022 04:24:49 - INFO - codeparrot_training - Skipping example with length 273 (seq_length=1024) +03/05/2022 04:24:54 - INFO - codeparrot_training - Step 33142: {'lr': 0.00044733692453432253, 'samples': 16969216, 'steps': 33142, 'loss/train': 1.6330277919769287} +03/05/2022 04:24:57 - INFO - codeparrot_training - Step 33143: {'lr': 0.00044733366643314956, 'samples': 16969728, 'steps': 33143, 'loss/train': 0.7457121014595032} +03/05/2022 04:24:58 - INFO - codeparrot_training - Skipping example with length 440 (seq_length=1024) +03/05/2022 04:25:02 - INFO - codeparrot_training - Step 33144: {'lr': 0.00044733040824306117, 'samples': 16970240, 'steps': 33144, 'loss/train': 1.621644377708435} +03/05/2022 04:25:06 - INFO - codeparrot_training - Step 33145: {'lr': 0.00044732714996405866, 'samples': 16970752, 'steps': 33145, 'loss/train': 1.2490003108978271} +03/05/2022 04:25:06 - INFO - codeparrot_training - Skipping example with length 651 (seq_length=1024) +03/05/2022 04:25:11 - INFO - codeparrot_training - Step 33146: {'lr': 0.0004473238915961436, 'samples': 16971264, 'steps': 33146, 'loss/train': 1.9932024478912354} +03/05/2022 04:25:14 - INFO - codeparrot_training - Step 33147: {'lr': 0.0004473206331393175, 'samples': 16971776, 'steps': 33147, 'loss/train': 1.0518676042556763} +03/05/2022 04:25:14 - INFO - codeparrot_training - Skipping example with length 493 (seq_length=1024) +03/05/2022 04:25:19 - INFO - codeparrot_training - Step 33148: {'lr': 0.0004473173745935818, 'samples': 16972288, 'steps': 33148, 'loss/train': 2.415705919265747} +03/05/2022 04:25:23 - INFO - codeparrot_training - Step 33149: {'lr': 0.00044731411595893785, 'samples': 16972800, 'steps': 33149, 'loss/train': 1.2922922372817993} +03/05/2022 04:25:23 - INFO - codeparrot_training - Skipping example with length 807 (seq_length=1024) +03/05/2022 04:25:28 - INFO - codeparrot_training - Step 33150: {'lr': 0.00044731085723538725, 'samples': 16973312, 'steps': 33150, 'loss/train': 1.4215087890625} +03/05/2022 04:25:31 - INFO - codeparrot_training - Step 33151: {'lr': 0.00044730759842293136, 'samples': 16973824, 'steps': 33151, 'loss/train': 1.6480581760406494} +03/05/2022 04:25:31 - INFO - codeparrot_training - Skipping example with length 359 (seq_length=1024) +03/05/2022 04:25:36 - INFO - codeparrot_training - Step 33152: {'lr': 0.0004473043395215718, 'samples': 16974336, 'steps': 33152, 'loss/train': 1.6556274890899658} +03/05/2022 04:25:39 - INFO - codeparrot_training - Step 33153: {'lr': 0.00044730108053130986, 'samples': 16974848, 'steps': 33153, 'loss/train': 0.8544706702232361} +03/05/2022 04:25:39 - INFO - codeparrot_training - Skipping example with length 200 (seq_length=1024) +03/05/2022 04:25:45 - INFO - codeparrot_training - Step 33154: {'lr': 0.00044729782145214717, 'samples': 16975360, 'steps': 33154, 'loss/train': 1.3904697895050049} +03/05/2022 04:25:48 - INFO - codeparrot_training - Step 33155: {'lr': 0.00044729456228408506, 'samples': 16975872, 'steps': 33155, 'loss/train': 2.405191421508789} +03/05/2022 04:25:48 - INFO - codeparrot_training - Skipping example with length 857 (seq_length=1024) +03/05/2022 04:25:53 - INFO - codeparrot_training - Step 33156: {'lr': 0.00044729130302712504, 'samples': 16976384, 'steps': 33156, 'loss/train': 0.6117886900901794} +03/05/2022 04:25:56 - INFO - codeparrot_training - Step 33157: {'lr': 0.00044728804368126873, 'samples': 16976896, 'steps': 33157, 'loss/train': 1.6728873252868652} +03/05/2022 04:25:57 - INFO - codeparrot_training - Skipping example with length 774 (seq_length=1024) +03/05/2022 04:26:02 - INFO - codeparrot_training - Step 33158: {'lr': 0.00044728478424651744, 'samples': 16977408, 'steps': 33158, 'loss/train': 1.8064402341842651} +03/05/2022 04:26:05 - INFO - codeparrot_training - Step 33159: {'lr': 0.0004472815247228726, 'samples': 16977920, 'steps': 33159, 'loss/train': 1.4956008195877075} +03/05/2022 04:26:06 - INFO - codeparrot_training - Skipping example with length 847 (seq_length=1024) +03/05/2022 04:26:10 - INFO - codeparrot_training - Step 33160: {'lr': 0.00044727826511033577, 'samples': 16978432, 'steps': 33160, 'loss/train': 1.8971668481826782} +03/05/2022 04:26:13 - INFO - codeparrot_training - Step 33161: {'lr': 0.0004472750054089084, 'samples': 16978944, 'steps': 33161, 'loss/train': 0.687340259552002} +03/05/2022 04:26:14 - INFO - codeparrot_training - Skipping example with length 728 (seq_length=1024) +03/05/2022 04:26:19 - INFO - codeparrot_training - Step 33162: {'lr': 0.00044727174561859194, 'samples': 16979456, 'steps': 33162, 'loss/train': 1.8402913808822632} +03/05/2022 04:26:22 - INFO - codeparrot_training - Step 33163: {'lr': 0.00044726848573938796, 'samples': 16979968, 'steps': 33163, 'loss/train': 3.331056833267212} +03/05/2022 04:26:22 - INFO - codeparrot_training - Skipping example with length 228 (seq_length=1024) +03/05/2022 04:26:27 - INFO - codeparrot_training - Step 33164: {'lr': 0.0004472652257712978, 'samples': 16980480, 'steps': 33164, 'loss/train': 2.099949836730957} +03/05/2022 04:26:30 - INFO - codeparrot_training - Step 33165: {'lr': 0.0004472619657143229, 'samples': 16980992, 'steps': 33165, 'loss/train': 1.7522810697555542} +03/05/2022 04:26:30 - INFO - codeparrot_training - Skipping example with length 951 (seq_length=1024) +03/05/2022 04:26:36 - INFO - codeparrot_training - Step 33166: {'lr': 0.00044725870556846495, 'samples': 16981504, 'steps': 33166, 'loss/train': 0.6204085350036621} +03/05/2022 04:26:38 - INFO - codeparrot_training - Skipping example with length 725 (seq_length=1024) +03/05/2022 04:26:41 - INFO - codeparrot_training - Step 33167: {'lr': 0.00044725544533372516, 'samples': 16982016, 'steps': 33167, 'loss/train': 1.8202327489852905} +03/05/2022 04:26:44 - INFO - codeparrot_training - Step 33168: {'lr': 0.00044725218501010514, 'samples': 16982528, 'steps': 33168, 'loss/train': 2.160159111022949} +03/05/2022 04:26:47 - INFO - codeparrot_training - Step 33169: {'lr': 0.0004472489245976063, 'samples': 16983040, 'steps': 33169, 'loss/train': 1.1060634851455688} +03/05/2022 04:26:47 - INFO - codeparrot_training - Skipping example with length 641 (seq_length=1024) +03/05/2022 04:26:53 - INFO - codeparrot_training - Step 33170: {'lr': 0.00044724566409623013, 'samples': 16983552, 'steps': 33170, 'loss/train': 1.4933899641036987} +03/05/2022 04:26:56 - INFO - codeparrot_training - Step 33171: {'lr': 0.0004472424035059782, 'samples': 16984064, 'steps': 33171, 'loss/train': 1.1600592136383057} +03/05/2022 04:26:56 - INFO - codeparrot_training - Skipping example with length 448 (seq_length=1024) +03/05/2022 04:27:01 - INFO - codeparrot_training - Step 33172: {'lr': 0.0004472391428268518, 'samples': 16984576, 'steps': 33172, 'loss/train': 0.935180127620697} +03/05/2022 04:27:04 - INFO - codeparrot_training - Step 33173: {'lr': 0.00044723588205885254, 'samples': 16985088, 'steps': 33173, 'loss/train': 1.3908851146697998} +03/05/2022 04:27:04 - INFO - codeparrot_training - Skipping example with length 748 (seq_length=1024) +03/05/2022 04:27:09 - INFO - codeparrot_training - Step 33174: {'lr': 0.00044723262120198177, 'samples': 16985600, 'steps': 33174, 'loss/train': 2.400458335876465} +03/05/2022 04:27:13 - INFO - codeparrot_training - Step 33175: {'lr': 0.00044722936025624107, 'samples': 16986112, 'steps': 33175, 'loss/train': 1.163452386856079} +03/05/2022 04:27:13 - INFO - codeparrot_training - Skipping example with length 355 (seq_length=1024) +03/05/2022 04:27:18 - INFO - codeparrot_training - Step 33176: {'lr': 0.00044722609922163184, 'samples': 16986624, 'steps': 33176, 'loss/train': 1.6472268104553223} +03/05/2022 04:27:21 - INFO - codeparrot_training - Step 33177: {'lr': 0.0004472228380981556, 'samples': 16987136, 'steps': 33177, 'loss/train': 1.6158864498138428} +03/05/2022 04:27:21 - INFO - codeparrot_training - Skipping example with length 535 (seq_length=1024) +03/05/2022 04:27:26 - INFO - codeparrot_training - Step 33178: {'lr': 0.0004472195768858138, 'samples': 16987648, 'steps': 33178, 'loss/train': 1.4883235692977905} +03/05/2022 04:27:29 - INFO - codeparrot_training - Skipping example with length 88 (seq_length=1024) +03/05/2022 04:27:32 - INFO - codeparrot_training - Step 33179: {'lr': 0.0004472163155846078, 'samples': 16988160, 'steps': 33179, 'loss/train': 1.5981900691986084} +03/05/2022 04:27:35 - INFO - codeparrot_training - Step 33180: {'lr': 0.0004472130541945393, 'samples': 16988672, 'steps': 33180, 'loss/train': 1.588862419128418} +03/05/2022 04:27:38 - INFO - codeparrot_training - Skipping example with length 371 (seq_length=1024) +03/05/2022 04:27:40 - INFO - codeparrot_training - Step 33181: {'lr': 0.00044720979271560963, 'samples': 16989184, 'steps': 33181, 'loss/train': 1.939510464668274} +03/05/2022 04:27:43 - INFO - codeparrot_training - Step 33182: {'lr': 0.00044720653114782024, 'samples': 16989696, 'steps': 33182, 'loss/train': 1.5683015584945679} +03/05/2022 04:27:46 - INFO - codeparrot_training - Skipping example with length 40 (seq_length=1024) +03/05/2022 04:27:49 - INFO - codeparrot_training - Step 33183: {'lr': 0.0004472032694911726, 'samples': 16990208, 'steps': 33183, 'loss/train': 1.6475050449371338} +03/05/2022 04:27:52 - INFO - codeparrot_training - Step 33184: {'lr': 0.0004472000077456683, 'samples': 16990720, 'steps': 33184, 'loss/train': 2.097450017929077} +03/05/2022 04:27:54 - INFO - codeparrot_training - Skipping example with length 511 (seq_length=1024) +03/05/2022 04:27:57 - INFO - codeparrot_training - Step 33185: {'lr': 0.0004471967459113086, 'samples': 16991232, 'steps': 33185, 'loss/train': 1.6029285192489624} +03/05/2022 04:28:00 - INFO - codeparrot_training - Step 33186: {'lr': 0.0004471934839880951, 'samples': 16991744, 'steps': 33186, 'loss/train': 3.058795690536499} +03/05/2022 04:28:03 - INFO - codeparrot_training - Skipping example with length 671 (seq_length=1024) +03/05/2022 04:28:05 - INFO - codeparrot_training - Step 33187: {'lr': 0.00044719022197602933, 'samples': 16992256, 'steps': 33187, 'loss/train': 2.059544086456299} +03/05/2022 04:28:08 - INFO - codeparrot_training - Step 33188: {'lr': 0.0004471869598751127, 'samples': 16992768, 'steps': 33188, 'loss/train': 2.651294231414795} +03/05/2022 04:28:11 - INFO - codeparrot_training - Skipping example with length 819 (seq_length=1024) +03/05/2022 04:28:14 - INFO - codeparrot_training - Step 33189: {'lr': 0.0004471836976853466, 'samples': 16993280, 'steps': 33189, 'loss/train': 2.556591510772705} +03/05/2022 04:28:17 - INFO - codeparrot_training - Step 33190: {'lr': 0.00044718043540673257, 'samples': 16993792, 'steps': 33190, 'loss/train': 1.1929570436477661} +03/05/2022 04:28:20 - INFO - codeparrot_training - Skipping example with length 165 (seq_length=1024) +03/05/2022 04:28:22 - INFO - codeparrot_training - Step 33191: {'lr': 0.0004471771730392722, 'samples': 16994304, 'steps': 33191, 'loss/train': 1.7729196548461914} +03/05/2022 04:28:25 - INFO - codeparrot_training - Step 33192: {'lr': 0.0004471739105829667, 'samples': 16994816, 'steps': 33192, 'loss/train': 1.9572309255599976} +03/05/2022 04:28:28 - INFO - codeparrot_training - Skipping example with length 604 (seq_length=1024) +03/05/2022 04:28:30 - INFO - codeparrot_training - Step 33193: {'lr': 0.00044717064803781773, 'samples': 16995328, 'steps': 33193, 'loss/train': 1.5869766473770142} +03/05/2022 04:28:34 - INFO - codeparrot_training - Step 33194: {'lr': 0.00044716738540382674, 'samples': 16995840, 'steps': 33194, 'loss/train': 2.144937753677368} +03/05/2022 04:28:36 - INFO - codeparrot_training - Skipping example with length 288 (seq_length=1024) +03/05/2022 04:28:39 - INFO - codeparrot_training - Step 33195: {'lr': 0.0004471641226809951, 'samples': 16996352, 'steps': 33195, 'loss/train': 0.8947886228561401} +03/05/2022 04:28:42 - INFO - codeparrot_training - Step 33196: {'lr': 0.0004471608598693244, 'samples': 16996864, 'steps': 33196, 'loss/train': 2.214202642440796} +03/05/2022 04:28:45 - INFO - codeparrot_training - Skipping example with length 303 (seq_length=1024) +03/05/2022 04:28:47 - INFO - codeparrot_training - Step 33197: {'lr': 0.000447157596968816, 'samples': 16997376, 'steps': 33197, 'loss/train': 1.1589488983154297} +03/05/2022 04:28:50 - INFO - codeparrot_training - Step 33198: {'lr': 0.0004471543339794715, 'samples': 16997888, 'steps': 33198, 'loss/train': 1.6613566875457764} +03/05/2022 04:28:53 - INFO - codeparrot_training - Skipping example with length 362 (seq_length=1024) +03/05/2022 04:28:56 - INFO - codeparrot_training - Step 33199: {'lr': 0.00044715107090129223, 'samples': 16998400, 'steps': 33199, 'loss/train': 1.3289883136749268} +03/05/2022 04:28:59 - INFO - codeparrot_training - Step 33200: {'lr': 0.00044714780773427975, 'samples': 16998912, 'steps': 33200, 'loss/train': 1.175379753112793} +03/05/2022 04:29:02 - INFO - codeparrot_training - Skipping example with length 651 (seq_length=1024) +03/05/2022 04:29:04 - INFO - codeparrot_training - Step 33201: {'lr': 0.00044714454447843555, 'samples': 16999424, 'steps': 33201, 'loss/train': 1.8422783613204956} +03/05/2022 04:29:07 - INFO - codeparrot_training - Step 33202: {'lr': 0.0004471412811337611, 'samples': 16999936, 'steps': 33202, 'loss/train': 2.581817150115967} +03/05/2022 04:29:10 - INFO - codeparrot_training - Skipping example with length 155 (seq_length=1024) +03/05/2022 04:29:13 - INFO - codeparrot_training - Step 33203: {'lr': 0.00044713801770025774, 'samples': 17000448, 'steps': 33203, 'loss/train': 1.3269267082214355} +03/05/2022 04:29:16 - INFO - codeparrot_training - Step 33204: {'lr': 0.00044713475417792705, 'samples': 17000960, 'steps': 33204, 'loss/train': 1.0786504745483398} +03/05/2022 04:29:18 - INFO - codeparrot_training - Skipping example with length 41 (seq_length=1024) +03/05/2022 04:29:21 - INFO - codeparrot_training - Step 33205: {'lr': 0.0004471314905667705, 'samples': 17001472, 'steps': 33205, 'loss/train': 2.004253625869751} +03/05/2022 04:29:24 - INFO - codeparrot_training - Step 33206: {'lr': 0.00044712822686678955, 'samples': 17001984, 'steps': 33206, 'loss/train': 1.311555027961731} +03/05/2022 04:29:27 - INFO - codeparrot_training - Skipping example with length 103 (seq_length=1024) +03/05/2022 04:29:29 - INFO - codeparrot_training - Step 33207: {'lr': 0.00044712496307798566, 'samples': 17002496, 'steps': 33207, 'loss/train': 1.9221293926239014} +03/05/2022 04:29:32 - INFO - codeparrot_training - Step 33208: {'lr': 0.0004471216992003603, 'samples': 17003008, 'steps': 33208, 'loss/train': 2.0810890197753906} +03/05/2022 04:29:35 - INFO - codeparrot_training - Skipping example with length 774 (seq_length=1024) +03/05/2022 04:29:38 - INFO - codeparrot_training - Step 33209: {'lr': 0.0004471184352339149, 'samples': 17003520, 'steps': 33209, 'loss/train': 1.4921197891235352} +03/05/2022 04:29:41 - INFO - codeparrot_training - Step 33210: {'lr': 0.00044711517117865105, 'samples': 17004032, 'steps': 33210, 'loss/train': 1.4429517984390259} +03/05/2022 04:29:43 - INFO - codeparrot_training - Skipping example with length 117 (seq_length=1024) +03/05/2022 04:29:47 - INFO - codeparrot_training - Step 33211: {'lr': 0.00044711190703457005, 'samples': 17004544, 'steps': 33211, 'loss/train': 2.0883426666259766} +03/05/2022 04:29:50 - INFO - codeparrot_training - Step 33212: {'lr': 0.00044710864280167353, 'samples': 17005056, 'steps': 33212, 'loss/train': 1.9144353866577148} +03/05/2022 04:29:52 - INFO - codeparrot_training - Skipping example with length 44 (seq_length=1024) +03/05/2022 04:29:55 - INFO - codeparrot_training - Step 33213: {'lr': 0.0004471053784799629, 'samples': 17005568, 'steps': 33213, 'loss/train': 1.1978492736816406} +03/05/2022 04:29:58 - INFO - codeparrot_training - Step 33214: {'lr': 0.0004471021140694396, 'samples': 17006080, 'steps': 33214, 'loss/train': 1.7336554527282715} +03/05/2022 04:30:00 - INFO - codeparrot_training - Skipping example with length 793 (seq_length=1024) +03/05/2022 04:30:03 - INFO - codeparrot_training - Step 33215: {'lr': 0.0004470988495701052, 'samples': 17006592, 'steps': 33215, 'loss/train': 2.7905797958374023} +03/05/2022 04:30:07 - INFO - codeparrot_training - Step 33216: {'lr': 0.00044709558498196104, 'samples': 17007104, 'steps': 33216, 'loss/train': 2.2112233638763428} +03/05/2022 04:30:08 - INFO - codeparrot_training - Skipping example with length 341 (seq_length=1024) +03/05/2022 04:30:12 - INFO - codeparrot_training - Step 33217: {'lr': 0.00044709232030500865, 'samples': 17007616, 'steps': 33217, 'loss/train': 0.7260366082191467} +03/05/2022 04:30:15 - INFO - codeparrot_training - Step 33218: {'lr': 0.0004470890555392495, 'samples': 17008128, 'steps': 33218, 'loss/train': 1.4261099100112915} +03/05/2022 04:30:17 - INFO - codeparrot_training - Skipping example with length 1002 (seq_length=1024) +03/05/2022 04:30:21 - INFO - codeparrot_training - Step 33219: {'lr': 0.00044708579068468505, 'samples': 17008640, 'steps': 33219, 'loss/train': 1.6846941709518433} +03/05/2022 04:30:24 - INFO - codeparrot_training - Step 33220: {'lr': 0.0004470825257413168, 'samples': 17009152, 'steps': 33220, 'loss/train': 1.5941340923309326} +03/05/2022 04:30:25 - INFO - codeparrot_training - Skipping example with length 358 (seq_length=1024) +03/05/2022 04:30:29 - INFO - codeparrot_training - Step 33221: {'lr': 0.00044707926070914624, 'samples': 17009664, 'steps': 33221, 'loss/train': 1.6662383079528809} +03/05/2022 04:30:32 - INFO - codeparrot_training - Step 33222: {'lr': 0.0004470759955881748, 'samples': 17010176, 'steps': 33222, 'loss/train': 1.9865210056304932} +03/05/2022 04:30:34 - INFO - codeparrot_training - Skipping example with length 752 (seq_length=1024) +03/05/2022 04:30:37 - INFO - codeparrot_training - Step 33223: {'lr': 0.0004470727303784039, 'samples': 17010688, 'steps': 33223, 'loss/train': 1.568503737449646} +03/05/2022 04:30:41 - INFO - codeparrot_training - Step 33224: {'lr': 0.00044706946507983513, 'samples': 17011200, 'steps': 33224, 'loss/train': 1.9292640686035156} +03/05/2022 04:30:42 - INFO - codeparrot_training - Skipping example with length 769 (seq_length=1024) +03/05/2022 04:30:46 - INFO - codeparrot_training - Step 33225: {'lr': 0.00044706619969246984, 'samples': 17011712, 'steps': 33225, 'loss/train': 1.674340844154358} +03/05/2022 04:30:49 - INFO - codeparrot_training - Step 33226: {'lr': 0.0004470629342163096, 'samples': 17012224, 'steps': 33226, 'loss/train': 1.9835761785507202} +03/05/2022 04:30:50 - INFO - codeparrot_training - Skipping example with length 32 (seq_length=1024) +03/05/2022 04:30:54 - INFO - codeparrot_training - Step 33227: {'lr': 0.00044705966865135583, 'samples': 17012736, 'steps': 33227, 'loss/train': 1.2123897075653076} +03/05/2022 04:30:57 - INFO - codeparrot_training - Step 33228: {'lr': 0.00044705640299761004, 'samples': 17013248, 'steps': 33228, 'loss/train': 2.29453182220459} +03/05/2022 04:30:59 - INFO - codeparrot_training - Skipping example with length 714 (seq_length=1024) +03/05/2022 04:31:03 - INFO - codeparrot_training - Step 33229: {'lr': 0.0004470531372550736, 'samples': 17013760, 'steps': 33229, 'loss/train': 2.295593738555908} +03/05/2022 04:31:06 - INFO - codeparrot_training - Step 33230: {'lr': 0.00044704987142374814, 'samples': 17014272, 'steps': 33230, 'loss/train': 1.7721439599990845} +03/05/2022 04:31:07 - INFO - codeparrot_training - Skipping example with length 9 (seq_length=1024) +03/05/2022 04:31:11 - INFO - codeparrot_training - Step 33231: {'lr': 0.00044704660550363507, 'samples': 17014784, 'steps': 33231, 'loss/train': 1.7082793712615967} +03/05/2022 04:31:14 - INFO - codeparrot_training - Step 33232: {'lr': 0.00044704333949473576, 'samples': 17015296, 'steps': 33232, 'loss/train': 1.4916679859161377} +03/05/2022 04:31:15 - INFO - codeparrot_training - Skipping example with length 506 (seq_length=1024) +03/05/2022 04:31:19 - INFO - codeparrot_training - Step 33233: {'lr': 0.0004470400733970518, 'samples': 17015808, 'steps': 33233, 'loss/train': 2.416391134262085} +03/05/2022 04:31:23 - INFO - codeparrot_training - Step 33234: {'lr': 0.0004470368072105846, 'samples': 17016320, 'steps': 33234, 'loss/train': 2.341555595397949} +03/05/2022 04:31:23 - INFO - codeparrot_training - Skipping example with length 682 (seq_length=1024) +03/05/2022 04:31:28 - INFO - codeparrot_training - Step 33235: {'lr': 0.00044703354093533564, 'samples': 17016832, 'steps': 33235, 'loss/train': 0.9006397724151611} +03/05/2022 04:31:31 - INFO - codeparrot_training - Step 33236: {'lr': 0.0004470302745713065, 'samples': 17017344, 'steps': 33236, 'loss/train': 1.2152900695800781} +03/05/2022 04:31:32 - INFO - codeparrot_training - Skipping example with length 554 (seq_length=1024) +03/05/2022 04:31:36 - INFO - codeparrot_training - Step 33237: {'lr': 0.0004470270081184985, 'samples': 17017856, 'steps': 33237, 'loss/train': 0.8020053505897522} +03/05/2022 04:31:40 - INFO - codeparrot_training - Step 33238: {'lr': 0.00044702374157691316, 'samples': 17018368, 'steps': 33238, 'loss/train': 2.1624271869659424} +03/05/2022 04:31:41 - INFO - codeparrot_training - Skipping example with length 358 (seq_length=1024) +03/05/2022 04:31:45 - INFO - codeparrot_training - Step 33239: {'lr': 0.00044702047494655194, 'samples': 17018880, 'steps': 33239, 'loss/train': 1.036012887954712} +03/05/2022 04:31:48 - INFO - codeparrot_training - Step 33240: {'lr': 0.0004470172082274164, 'samples': 17019392, 'steps': 33240, 'loss/train': 1.9231829643249512} +03/05/2022 04:31:50 - INFO - codeparrot_training - Skipping example with length 472 (seq_length=1024) +03/05/2022 04:31:53 - INFO - codeparrot_training - Step 33241: {'lr': 0.0004470139414195079, 'samples': 17019904, 'steps': 33241, 'loss/train': 1.0617188215255737} +03/05/2022 04:31:57 - INFO - codeparrot_training - Step 33242: {'lr': 0.00044701067452282796, 'samples': 17020416, 'steps': 33242, 'loss/train': 2.1453857421875} +03/05/2022 04:31:59 - INFO - codeparrot_training - Skipping example with length 323 (seq_length=1024) +03/05/2022 04:32:02 - INFO - codeparrot_training - Step 33243: {'lr': 0.00044700740753737806, 'samples': 17020928, 'steps': 33243, 'loss/train': 1.3970568180084229} +03/05/2022 04:32:05 - INFO - codeparrot_training - Step 33244: {'lr': 0.0004470041404631597, 'samples': 17021440, 'steps': 33244, 'loss/train': 1.851447343826294} +03/05/2022 04:32:08 - INFO - codeparrot_training - Skipping example with length 339 (seq_length=1024) +03/05/2022 04:32:10 - INFO - codeparrot_training - Step 33245: {'lr': 0.0004470008733001742, 'samples': 17021952, 'steps': 33245, 'loss/train': 0.7055865526199341} +03/05/2022 04:32:14 - INFO - codeparrot_training - Step 33246: {'lr': 0.0004469976060484233, 'samples': 17022464, 'steps': 33246, 'loss/train': 1.4836117029190063} +03/05/2022 04:32:16 - INFO - codeparrot_training - Skipping example with length 650 (seq_length=1024) +03/05/2022 04:32:19 - INFO - codeparrot_training - Step 33247: {'lr': 0.00044699433870790817, 'samples': 17022976, 'steps': 33247, 'loss/train': 1.7269686460494995} +03/05/2022 04:32:22 - INFO - codeparrot_training - Step 33248: {'lr': 0.00044699107127863056, 'samples': 17023488, 'steps': 33248, 'loss/train': 2.044891595840454} +03/05/2022 04:32:25 - INFO - codeparrot_training - Skipping example with length 232 (seq_length=1024) +03/05/2022 04:32:27 - INFO - codeparrot_training - Step 33249: {'lr': 0.0004469878037605917, 'samples': 17024000, 'steps': 33249, 'loss/train': 1.8798165321350098} +03/05/2022 04:32:31 - INFO - codeparrot_training - Step 33250: {'lr': 0.0004469845361537933, 'samples': 17024512, 'steps': 33250, 'loss/train': 0.14328764379024506} +03/05/2022 04:32:33 - INFO - codeparrot_training - Skipping example with length 171 (seq_length=1024) +03/05/2022 04:32:36 - INFO - codeparrot_training - Step 33251: {'lr': 0.0004469812684582366, 'samples': 17025024, 'steps': 33251, 'loss/train': 1.9625693559646606} +03/05/2022 04:32:39 - INFO - codeparrot_training - Step 33252: {'lr': 0.00044697800067392327, 'samples': 17025536, 'steps': 33252, 'loss/train': 1.0423429012298584} +03/05/2022 04:32:42 - INFO - codeparrot_training - Skipping example with length 668 (seq_length=1024) +03/05/2022 04:32:44 - INFO - codeparrot_training - Step 33253: {'lr': 0.00044697473280085455, 'samples': 17026048, 'steps': 33253, 'loss/train': 1.9206043481826782} +03/05/2022 04:32:47 - INFO - codeparrot_training - Step 33254: {'lr': 0.0004469714648390322, 'samples': 17026560, 'steps': 33254, 'loss/train': 1.9566144943237305} +03/05/2022 04:32:50 - INFO - codeparrot_training - Skipping example with length 173 (seq_length=1024) +03/05/2022 04:32:53 - INFO - codeparrot_training - Step 33255: {'lr': 0.00044696819678845744, 'samples': 17027072, 'steps': 33255, 'loss/train': 1.5201117992401123} +03/05/2022 04:32:56 - INFO - codeparrot_training - Step 33256: {'lr': 0.000446964928649132, 'samples': 17027584, 'steps': 33256, 'loss/train': 0.567852258682251} +03/05/2022 04:32:58 - INFO - codeparrot_training - Skipping example with length 11 (seq_length=1024) +03/05/2022 04:33:01 - INFO - codeparrot_training - Step 33257: {'lr': 0.00044696166042105704, 'samples': 17028096, 'steps': 33257, 'loss/train': 1.8542073965072632} +03/05/2022 04:33:04 - INFO - codeparrot_training - Step 33258: {'lr': 0.0004469583921042343, 'samples': 17028608, 'steps': 33258, 'loss/train': 1.3847225904464722} +03/05/2022 04:33:07 - INFO - codeparrot_training - Skipping example with length 189 (seq_length=1024) +03/05/2022 04:33:10 - INFO - codeparrot_training - Step 33259: {'lr': 0.0004469551236986651, 'samples': 17029120, 'steps': 33259, 'loss/train': 1.7156076431274414} +03/05/2022 04:33:13 - INFO - codeparrot_training - Step 33260: {'lr': 0.00044695185520435087, 'samples': 17029632, 'steps': 33260, 'loss/train': 2.145132064819336} +03/05/2022 04:33:15 - INFO - codeparrot_training - Skipping example with length 623 (seq_length=1024) +03/05/2022 04:33:18 - INFO - codeparrot_training - Step 33261: {'lr': 0.00044694858662129333, 'samples': 17030144, 'steps': 33261, 'loss/train': 1.4747002124786377} +03/05/2022 04:33:21 - INFO - codeparrot_training - Step 33262: {'lr': 0.0004469453179494938, 'samples': 17030656, 'steps': 33262, 'loss/train': 1.712813138961792} +03/05/2022 04:33:24 - INFO - codeparrot_training - Skipping example with length 431 (seq_length=1024) +03/05/2022 04:33:27 - INFO - codeparrot_training - Step 33263: {'lr': 0.00044694204918895367, 'samples': 17031168, 'steps': 33263, 'loss/train': 1.0600396394729614} +03/05/2022 04:33:30 - INFO - codeparrot_training - Step 33264: {'lr': 0.0004469387803396745, 'samples': 17031680, 'steps': 33264, 'loss/train': 1.320888876914978} +03/05/2022 04:33:32 - INFO - codeparrot_training - Skipping example with length 228 (seq_length=1024) +03/05/2022 04:33:35 - INFO - codeparrot_training - Step 33265: {'lr': 0.0004469355114016577, 'samples': 17032192, 'steps': 33265, 'loss/train': 1.923216462135315} +03/05/2022 04:33:38 - INFO - codeparrot_training - Step 33266: {'lr': 0.00044693224237490485, 'samples': 17032704, 'steps': 33266, 'loss/train': 1.7750978469848633} +03/05/2022 04:33:41 - INFO - codeparrot_training - Skipping example with length 367 (seq_length=1024) +03/05/2022 04:33:43 - INFO - codeparrot_training - Step 33267: {'lr': 0.00044692897325941737, 'samples': 17033216, 'steps': 33267, 'loss/train': 1.8400615453720093} +03/05/2022 04:33:47 - INFO - codeparrot_training - Step 33268: {'lr': 0.00044692570405519683, 'samples': 17033728, 'steps': 33268, 'loss/train': 2.481304407119751} +03/05/2022 04:33:49 - INFO - codeparrot_training - Skipping example with length 1008 (seq_length=1024) +03/05/2022 04:33:52 - INFO - codeparrot_training - Step 33269: {'lr': 0.0004469224347622445, 'samples': 17034240, 'steps': 33269, 'loss/train': 0.9251644611358643} +03/05/2022 04:33:55 - INFO - codeparrot_training - Step 33270: {'lr': 0.000446919165380562, 'samples': 17034752, 'steps': 33270, 'loss/train': 2.0589897632598877} +03/05/2022 04:33:59 - INFO - codeparrot_training - Step 33271: {'lr': 0.0004469158959101507, 'samples': 17035264, 'steps': 33271, 'loss/train': 1.8704736232757568} +03/05/2022 04:33:59 - INFO - codeparrot_training - Skipping example with length 856 (seq_length=1024) +03/05/2022 04:34:04 - INFO - codeparrot_training - Step 33272: {'lr': 0.00044691262635101223, 'samples': 17035776, 'steps': 33272, 'loss/train': 0.5479095578193665} +03/05/2022 04:34:07 - INFO - codeparrot_training - Step 33273: {'lr': 0.0004469093567031479, 'samples': 17036288, 'steps': 33273, 'loss/train': 1.7991565465927124} +03/05/2022 04:34:07 - INFO - codeparrot_training - Skipping example with length 705 (seq_length=1024) +03/05/2022 04:34:12 - INFO - codeparrot_training - Step 33274: {'lr': 0.00044690608696655923, 'samples': 17036800, 'steps': 33274, 'loss/train': 1.4176887273788452} +03/05/2022 04:34:15 - INFO - codeparrot_training - Step 33275: {'lr': 0.0004469028171412478, 'samples': 17037312, 'steps': 33275, 'loss/train': 1.7971992492675781} +03/05/2022 04:34:15 - INFO - codeparrot_training - Skipping example with length 121 (seq_length=1024) +03/05/2022 04:34:21 - INFO - codeparrot_training - Step 33276: {'lr': 0.00044689954722721494, 'samples': 17037824, 'steps': 33276, 'loss/train': 1.417471170425415} +03/05/2022 04:34:23 - INFO - codeparrot_training - Skipping example with length 364 (seq_length=1024) +03/05/2022 04:34:26 - INFO - codeparrot_training - Step 33277: {'lr': 0.0004468962772244622, 'samples': 17038336, 'steps': 33277, 'loss/train': 3.3851616382598877} +03/05/2022 04:34:29 - INFO - codeparrot_training - Step 33278: {'lr': 0.00044689300713299105, 'samples': 17038848, 'steps': 33278, 'loss/train': 1.1838024854660034} +03/05/2022 04:34:32 - INFO - codeparrot_training - Skipping example with length 574 (seq_length=1024) +03/05/2022 04:34:34 - INFO - codeparrot_training - Step 33279: {'lr': 0.0004468897369528029, 'samples': 17039360, 'steps': 33279, 'loss/train': 2.1633739471435547} +03/05/2022 04:34:37 - INFO - codeparrot_training - Step 33280: {'lr': 0.00044688646668389933, 'samples': 17039872, 'steps': 33280, 'loss/train': 1.347037672996521} +03/05/2022 04:34:40 - INFO - codeparrot_training - Skipping example with length 401 (seq_length=1024) +03/05/2022 04:34:43 - INFO - codeparrot_training - Step 33281: {'lr': 0.0004468831963262817, 'samples': 17040384, 'steps': 33281, 'loss/train': 2.2109601497650146} +03/05/2022 04:34:46 - INFO - codeparrot_training - Step 33282: {'lr': 0.00044687992587995155, 'samples': 17040896, 'steps': 33282, 'loss/train': 1.8926875591278076} +03/05/2022 04:34:48 - INFO - codeparrot_training - Skipping example with length 570 (seq_length=1024) +03/05/2022 04:34:51 - INFO - codeparrot_training - Step 33283: {'lr': 0.0004468766553449104, 'samples': 17041408, 'steps': 33283, 'loss/train': 1.2865020036697388} +03/05/2022 04:34:54 - INFO - codeparrot_training - Step 33284: {'lr': 0.00044687338472115964, 'samples': 17041920, 'steps': 33284, 'loss/train': 1.406243920326233} +03/05/2022 04:34:57 - INFO - codeparrot_training - Skipping example with length 269 (seq_length=1024) +03/05/2022 04:35:00 - INFO - codeparrot_training - Step 33285: {'lr': 0.00044687011400870074, 'samples': 17042432, 'steps': 33285, 'loss/train': 1.6059579849243164} +03/05/2022 04:35:03 - INFO - codeparrot_training - Step 33286: {'lr': 0.00044686684320753524, 'samples': 17042944, 'steps': 33286, 'loss/train': 1.5593130588531494} +03/05/2022 04:35:05 - INFO - codeparrot_training - Skipping example with length 985 (seq_length=1024) +03/05/2022 04:35:08 - INFO - codeparrot_training - Step 33287: {'lr': 0.00044686357231766454, 'samples': 17043456, 'steps': 33287, 'loss/train': 1.787016749382019} +03/05/2022 04:35:11 - INFO - codeparrot_training - Step 33288: {'lr': 0.00044686030133909017, 'samples': 17043968, 'steps': 33288, 'loss/train': 1.9975470304489136} +03/05/2022 04:35:14 - INFO - codeparrot_training - Skipping example with length 37 (seq_length=1024) +03/05/2022 04:35:17 - INFO - codeparrot_training - Step 33289: {'lr': 0.00044685703027181364, 'samples': 17044480, 'steps': 33289, 'loss/train': 1.8950200080871582} +03/05/2022 04:35:20 - INFO - codeparrot_training - Step 33290: {'lr': 0.0004468537591158363, 'samples': 17044992, 'steps': 33290, 'loss/train': 1.9059292078018188} +03/05/2022 04:35:22 - INFO - codeparrot_training - Skipping example with length 860 (seq_length=1024) +03/05/2022 04:35:25 - INFO - codeparrot_training - Step 33291: {'lr': 0.0004468504878711597, 'samples': 17045504, 'steps': 33291, 'loss/train': 1.7182505130767822} +03/05/2022 04:35:28 - INFO - codeparrot_training - Step 33292: {'lr': 0.00044684721653778537, 'samples': 17046016, 'steps': 33292, 'loss/train': 1.0436699390411377} +03/05/2022 04:35:31 - INFO - codeparrot_training - Skipping example with length 191 (seq_length=1024) +03/05/2022 04:35:33 - INFO - codeparrot_training - Step 33293: {'lr': 0.00044684394511571463, 'samples': 17046528, 'steps': 33293, 'loss/train': 1.7925264835357666} +03/05/2022 04:35:37 - INFO - codeparrot_training - Step 33294: {'lr': 0.00044684067360494905, 'samples': 17047040, 'steps': 33294, 'loss/train': 1.5657933950424194} +03/05/2022 04:35:39 - INFO - codeparrot_training - Skipping example with length 980 (seq_length=1024) +03/05/2022 04:35:42 - INFO - codeparrot_training - Step 33295: {'lr': 0.00044683740200549015, 'samples': 17047552, 'steps': 33295, 'loss/train': 1.1063350439071655} +03/05/2022 04:35:45 - INFO - codeparrot_training - Step 33296: {'lr': 0.00044683413031733945, 'samples': 17048064, 'steps': 33296, 'loss/train': 1.6962965726852417} +03/05/2022 04:35:48 - INFO - codeparrot_training - Skipping example with length 889 (seq_length=1024) +03/05/2022 04:35:50 - INFO - codeparrot_training - Step 33297: {'lr': 0.00044683085854049814, 'samples': 17048576, 'steps': 33297, 'loss/train': 2.3267552852630615} +03/05/2022 04:35:54 - INFO - codeparrot_training - Step 33298: {'lr': 0.00044682758667496806, 'samples': 17049088, 'steps': 33298, 'loss/train': 2.485488176345825} +03/05/2022 04:35:56 - INFO - codeparrot_training - Skipping example with length 623 (seq_length=1024) +03/05/2022 04:35:59 - INFO - codeparrot_training - Step 33299: {'lr': 0.00044682431472075035, 'samples': 17049600, 'steps': 33299, 'loss/train': 2.0528550148010254} +03/05/2022 04:36:02 - INFO - codeparrot_training - Step 33300: {'lr': 0.00044682104267784674, 'samples': 17050112, 'steps': 33300, 'loss/train': 1.6780948638916016} +03/05/2022 04:36:04 - INFO - codeparrot_training - Skipping example with length 708 (seq_length=1024) +03/05/2022 04:36:07 - INFO - codeparrot_training - Step 33301: {'lr': 0.0004468177705462585, 'samples': 17050624, 'steps': 33301, 'loss/train': 2.031189203262329} +03/05/2022 04:36:10 - INFO - codeparrot_training - Step 33302: {'lr': 0.0004468144983259873, 'samples': 17051136, 'steps': 33302, 'loss/train': 2.366976022720337} +03/05/2022 04:36:13 - INFO - codeparrot_training - Skipping example with length 607 (seq_length=1024) +03/05/2022 04:36:16 - INFO - codeparrot_training - Step 33303: {'lr': 0.0004468112260170345, 'samples': 17051648, 'steps': 33303, 'loss/train': 2.0559298992156982} +03/05/2022 04:36:19 - INFO - codeparrot_training - Step 33304: {'lr': 0.0004468079536194016, 'samples': 17052160, 'steps': 33304, 'loss/train': 1.322758674621582} +03/05/2022 04:36:21 - INFO - codeparrot_training - Skipping example with length 796 (seq_length=1024) +03/05/2022 04:36:24 - INFO - codeparrot_training - Step 33305: {'lr': 0.00044680468113309006, 'samples': 17052672, 'steps': 33305, 'loss/train': 1.6497762203216553} +03/05/2022 04:36:27 - INFO - codeparrot_training - Step 33306: {'lr': 0.0004468014085581014, 'samples': 17053184, 'steps': 33306, 'loss/train': 1.5704318284988403} +03/05/2022 04:36:30 - INFO - codeparrot_training - Skipping example with length 37 (seq_length=1024) +03/05/2022 04:36:33 - INFO - codeparrot_training - Step 33307: {'lr': 0.0004467981358944371, 'samples': 17053696, 'steps': 33307, 'loss/train': 2.2079720497131348} +03/05/2022 04:36:36 - INFO - codeparrot_training - Step 33308: {'lr': 0.0004467948631420985, 'samples': 17054208, 'steps': 33308, 'loss/train': 2.0205180644989014} +03/05/2022 04:36:38 - INFO - codeparrot_training - Skipping example with length 31 (seq_length=1024) +03/05/2022 04:36:41 - INFO - codeparrot_training - Step 33309: {'lr': 0.0004467915903010872, 'samples': 17054720, 'steps': 33309, 'loss/train': 1.8146395683288574} +03/05/2022 04:36:44 - INFO - codeparrot_training - Step 33310: {'lr': 0.0004467883173714047, 'samples': 17055232, 'steps': 33310, 'loss/train': 1.1737422943115234} +03/05/2022 04:36:46 - INFO - codeparrot_training - Skipping example with length 593 (seq_length=1024) +03/05/2022 04:36:49 - INFO - codeparrot_training - Step 33311: {'lr': 0.0004467850443530523, 'samples': 17055744, 'steps': 33311, 'loss/train': 1.9512014389038086} +03/05/2022 04:36:53 - INFO - codeparrot_training - Step 33312: {'lr': 0.0004467817712460317, 'samples': 17056256, 'steps': 33312, 'loss/train': 1.3705593347549438} +03/05/2022 04:36:55 - INFO - codeparrot_training - Skipping example with length 557 (seq_length=1024) +03/05/2022 04:36:58 - INFO - codeparrot_training - Step 33313: {'lr': 0.00044677849805034424, 'samples': 17056768, 'steps': 33313, 'loss/train': 1.1737432479858398} +03/05/2022 04:37:01 - INFO - codeparrot_training - Step 33314: {'lr': 0.0004467752247659914, 'samples': 17057280, 'steps': 33314, 'loss/train': 1.5484893321990967} +03/05/2022 04:37:03 - INFO - codeparrot_training - Skipping example with length 267 (seq_length=1024) +03/05/2022 04:37:06 - INFO - codeparrot_training - Step 33315: {'lr': 0.00044677195139297476, 'samples': 17057792, 'steps': 33315, 'loss/train': 0.7366610765457153} +03/05/2022 04:37:09 - INFO - codeparrot_training - Step 33316: {'lr': 0.00044676867793129574, 'samples': 17058304, 'steps': 33316, 'loss/train': 1.3753629922866821} +03/05/2022 04:37:12 - INFO - codeparrot_training - Skipping example with length 518 (seq_length=1024) +03/05/2022 04:37:15 - INFO - codeparrot_training - Step 33317: {'lr': 0.00044676540438095565, 'samples': 17058816, 'steps': 33317, 'loss/train': 1.3672655820846558} +03/05/2022 04:37:18 - INFO - codeparrot_training - Step 33318: {'lr': 0.0004467621307419562, 'samples': 17059328, 'steps': 33318, 'loss/train': 1.6080365180969238} +03/05/2022 04:37:20 - INFO - codeparrot_training - Skipping example with length 778 (seq_length=1024) +03/05/2022 04:37:23 - INFO - codeparrot_training - Step 33319: {'lr': 0.00044675885701429873, 'samples': 17059840, 'steps': 33319, 'loss/train': 1.674177646636963} +03/05/2022 04:37:26 - INFO - codeparrot_training - Step 33320: {'lr': 0.00044675558319798477, 'samples': 17060352, 'steps': 33320, 'loss/train': 1.8963091373443604} +03/05/2022 04:37:28 - INFO - codeparrot_training - Skipping example with length 767 (seq_length=1024) +03/05/2022 04:37:31 - INFO - codeparrot_training - Step 33321: {'lr': 0.00044675230929301575, 'samples': 17060864, 'steps': 33321, 'loss/train': 1.3053467273712158} +03/05/2022 04:37:34 - INFO - codeparrot_training - Step 33322: {'lr': 0.0004467490352993932, 'samples': 17061376, 'steps': 33322, 'loss/train': 1.0580475330352783} +03/05/2022 04:37:36 - INFO - codeparrot_training - Skipping example with length 317 (seq_length=1024) +03/05/2022 04:37:40 - INFO - codeparrot_training - Step 33323: {'lr': 0.00044674576121711855, 'samples': 17061888, 'steps': 33323, 'loss/train': 0.9874007105827332} +03/05/2022 04:37:43 - INFO - codeparrot_training - Step 33324: {'lr': 0.00044674248704619333, 'samples': 17062400, 'steps': 33324, 'loss/train': 0.4970065653324127} +03/05/2022 04:37:45 - INFO - codeparrot_training - Skipping example with length 398 (seq_length=1024) +03/05/2022 04:37:49 - INFO - codeparrot_training - Step 33325: {'lr': 0.000446739212786619, 'samples': 17062912, 'steps': 33325, 'loss/train': 1.5615367889404297} +03/05/2022 04:37:52 - INFO - codeparrot_training - Step 33326: {'lr': 0.000446735938438397, 'samples': 17063424, 'steps': 33326, 'loss/train': 0.8223859667778015} +03/05/2022 04:37:55 - INFO - codeparrot_training - Step 33327: {'lr': 0.0004467326640015288, 'samples': 17063936, 'steps': 33327, 'loss/train': 6.371712684631348} +03/05/2022 04:37:57 - INFO - codeparrot_training - Skipping example with length 987 (seq_length=1024) +03/05/2022 04:38:01 - INFO - codeparrot_training - Step 33328: {'lr': 0.00044672938947601593, 'samples': 17064448, 'steps': 33328, 'loss/train': 1.2918379306793213} +03/05/2022 04:38:04 - INFO - codeparrot_training - Step 33329: {'lr': 0.00044672611486185976, 'samples': 17064960, 'steps': 33329, 'loss/train': 1.909144401550293} +03/05/2022 04:38:05 - INFO - codeparrot_training - Skipping example with length 178 (seq_length=1024) +03/05/2022 04:38:09 - INFO - codeparrot_training - Step 33330: {'lr': 0.0004467228401590619, 'samples': 17065472, 'steps': 33330, 'loss/train': 0.6293220520019531} +03/05/2022 04:38:12 - INFO - codeparrot_training - Step 33331: {'lr': 0.00044671956536762375, 'samples': 17065984, 'steps': 33331, 'loss/train': 1.6965147256851196} +03/05/2022 04:38:14 - INFO - codeparrot_training - Skipping example with length 785 (seq_length=1024) +03/05/2022 04:38:18 - INFO - codeparrot_training - Step 33332: {'lr': 0.00044671629048754683, 'samples': 17066496, 'steps': 33332, 'loss/train': 1.2985069751739502} +03/05/2022 04:38:21 - INFO - codeparrot_training - Step 33333: {'lr': 0.00044671301551883253, 'samples': 17067008, 'steps': 33333, 'loss/train': 1.6386150121688843} +03/05/2022 04:38:23 - INFO - codeparrot_training - Skipping example with length 870 (seq_length=1024) +03/05/2022 04:38:26 - INFO - codeparrot_training - Step 33334: {'lr': 0.0004467097404614824, 'samples': 17067520, 'steps': 33334, 'loss/train': 1.2853312492370605} +03/05/2022 04:38:29 - INFO - codeparrot_training - Step 33335: {'lr': 0.0004467064653154979, 'samples': 17068032, 'steps': 33335, 'loss/train': 1.718184232711792} +03/05/2022 04:38:31 - INFO - codeparrot_training - Skipping example with length 590 (seq_length=1024) +03/05/2022 04:38:35 - INFO - codeparrot_training - Step 33336: {'lr': 0.0004467031900808805, 'samples': 17068544, 'steps': 33336, 'loss/train': 1.5432883501052856} +03/05/2022 04:38:38 - INFO - codeparrot_training - Step 33337: {'lr': 0.00044669991475763173, 'samples': 17069056, 'steps': 33337, 'loss/train': 1.5116682052612305} +03/05/2022 04:38:41 - INFO - codeparrot_training - Skipping example with length 136 (seq_length=1024) +03/05/2022 04:38:43 - INFO - codeparrot_training - Step 33338: {'lr': 0.00044669663934575294, 'samples': 17069568, 'steps': 33338, 'loss/train': 1.0382428169250488} +03/05/2022 04:38:46 - INFO - codeparrot_training - Step 33339: {'lr': 0.0004466933638452457, 'samples': 17070080, 'steps': 33339, 'loss/train': 1.6291375160217285} +03/05/2022 04:38:49 - INFO - codeparrot_training - Skipping example with length 188 (seq_length=1024) +03/05/2022 04:38:52 - INFO - codeparrot_training - Step 33340: {'lr': 0.0004466900882561115, 'samples': 17070592, 'steps': 33340, 'loss/train': 1.359604835510254} +03/05/2022 04:38:55 - INFO - codeparrot_training - Step 33341: {'lr': 0.00044668681257835173, 'samples': 17071104, 'steps': 33341, 'loss/train': 1.8115434646606445} +03/05/2022 04:38:57 - INFO - codeparrot_training - Skipping example with length 344 (seq_length=1024) +03/05/2022 04:39:00 - INFO - codeparrot_training - Step 33342: {'lr': 0.00044668353681196794, 'samples': 17071616, 'steps': 33342, 'loss/train': 1.2806613445281982} +03/05/2022 04:39:03 - INFO - codeparrot_training - Step 33343: {'lr': 0.0004466802609569616, 'samples': 17072128, 'steps': 33343, 'loss/train': 1.1015074253082275} +03/05/2022 04:39:06 - INFO - codeparrot_training - Skipping example with length 317 (seq_length=1024) +03/05/2022 04:39:09 - INFO - codeparrot_training - Step 33344: {'lr': 0.00044667698501333415, 'samples': 17072640, 'steps': 33344, 'loss/train': 1.0961458683013916} +03/05/2022 04:39:12 - INFO - codeparrot_training - Step 33345: {'lr': 0.0004466737089810871, 'samples': 17073152, 'steps': 33345, 'loss/train': 1.7168333530426025} +03/05/2022 04:39:15 - INFO - codeparrot_training - Skipping example with length 327 (seq_length=1024) +03/05/2022 04:39:17 - INFO - codeparrot_training - Step 33346: {'lr': 0.00044667043286022193, 'samples': 17073664, 'steps': 33346, 'loss/train': 2.0690042972564697} +03/05/2022 04:39:20 - INFO - codeparrot_training - Step 33347: {'lr': 0.00044666715665074, 'samples': 17074176, 'steps': 33347, 'loss/train': 0.11862774938344955} +03/05/2022 04:39:23 - INFO - codeparrot_training - Skipping example with length 913 (seq_length=1024) +03/05/2022 04:39:26 - INFO - codeparrot_training - Step 33348: {'lr': 0.0004466638803526429, 'samples': 17074688, 'steps': 33348, 'loss/train': 1.5842550992965698} +03/05/2022 04:39:29 - INFO - codeparrot_training - Step 33349: {'lr': 0.0004466606039659322, 'samples': 17075200, 'steps': 33349, 'loss/train': 1.3628886938095093} +03/05/2022 04:39:32 - INFO - codeparrot_training - Step 33350: {'lr': 0.0004466573274906092, 'samples': 17075712, 'steps': 33350, 'loss/train': 0.8586089015007019} +03/05/2022 04:39:32 - INFO - codeparrot_training - Skipping example with length 160 (seq_length=1024) +03/05/2022 04:39:37 - INFO - codeparrot_training - Step 33351: {'lr': 0.0004466540509266754, 'samples': 17076224, 'steps': 33351, 'loss/train': 2.026029586791992} +03/05/2022 04:39:41 - INFO - codeparrot_training - Step 33352: {'lr': 0.0004466507742741325, 'samples': 17076736, 'steps': 33352, 'loss/train': 1.7219226360321045} +03/05/2022 04:39:41 - INFO - codeparrot_training - Skipping example with length 9 (seq_length=1024) +03/05/2022 04:39:46 - INFO - codeparrot_training - Step 33353: {'lr': 0.0004466474975329816, 'samples': 17077248, 'steps': 33353, 'loss/train': 1.8644887208938599} +03/05/2022 04:39:49 - INFO - codeparrot_training - Step 33354: {'lr': 0.0004466442207032244, 'samples': 17077760, 'steps': 33354, 'loss/train': 2.2709760665893555} +03/05/2022 04:39:49 - INFO - codeparrot_training - Skipping example with length 732 (seq_length=1024) +03/05/2022 04:39:54 - INFO - codeparrot_training - Step 33355: {'lr': 0.00044664094378486243, 'samples': 17078272, 'steps': 33355, 'loss/train': 1.9272695779800415} +03/05/2022 04:39:57 - INFO - codeparrot_training - Step 33356: {'lr': 0.00044663766677789706, 'samples': 17078784, 'steps': 33356, 'loss/train': 1.887320876121521} +03/05/2022 04:39:57 - INFO - codeparrot_training - Skipping example with length 967 (seq_length=1024) +03/05/2022 04:40:03 - INFO - codeparrot_training - Step 33357: {'lr': 0.0004466343896823297, 'samples': 17079296, 'steps': 33357, 'loss/train': 1.4393413066864014} +03/05/2022 04:40:06 - INFO - codeparrot_training - Step 33358: {'lr': 0.000446631112498162, 'samples': 17079808, 'steps': 33358, 'loss/train': 1.8494728803634644} +03/05/2022 04:40:06 - INFO - codeparrot_training - Skipping example with length 963 (seq_length=1024) +03/05/2022 04:40:11 - INFO - codeparrot_training - Step 33359: {'lr': 0.0004466278352253954, 'samples': 17080320, 'steps': 33359, 'loss/train': 1.3775429725646973} +03/05/2022 04:40:14 - INFO - codeparrot_training - Step 33360: {'lr': 0.00044662455786403124, 'samples': 17080832, 'steps': 33360, 'loss/train': 1.511925220489502} +03/05/2022 04:40:14 - INFO - codeparrot_training - Skipping example with length 987 (seq_length=1024) +03/05/2022 04:40:20 - INFO - codeparrot_training - Step 33361: {'lr': 0.0004466212804140711, 'samples': 17081344, 'steps': 33361, 'loss/train': 1.0644581317901611} +03/05/2022 04:40:23 - INFO - codeparrot_training - Skipping example with length 734 (seq_length=1024) +03/05/2022 04:40:25 - INFO - codeparrot_training - Step 33362: {'lr': 0.00044661800287551653, 'samples': 17081856, 'steps': 33362, 'loss/train': 2.0496010780334473} +03/05/2022 04:40:28 - INFO - codeparrot_training - Step 33363: {'lr': 0.00044661472524836886, 'samples': 17082368, 'steps': 33363, 'loss/train': 2.2401201725006104} +03/05/2022 04:40:31 - INFO - codeparrot_training - Skipping example with length 675 (seq_length=1024) +03/05/2022 04:40:34 - INFO - codeparrot_training - Step 33364: {'lr': 0.00044661144753262963, 'samples': 17082880, 'steps': 33364, 'loss/train': 1.7566076517105103} +03/05/2022 04:40:37 - INFO - codeparrot_training - Step 33365: {'lr': 0.0004466081697283003, 'samples': 17083392, 'steps': 33365, 'loss/train': 2.299621105194092} +03/05/2022 04:40:40 - INFO - codeparrot_training - Step 33366: {'lr': 0.00044660489183538237, 'samples': 17083904, 'steps': 33366, 'loss/train': 1.6577858924865723} +03/05/2022 04:40:40 - INFO - codeparrot_training - Skipping example with length 31 (seq_length=1024) +03/05/2022 04:40:45 - INFO - codeparrot_training - Step 33367: {'lr': 0.0004466016138538773, 'samples': 17084416, 'steps': 33367, 'loss/train': 2.9881908893585205} +03/05/2022 04:40:49 - INFO - codeparrot_training - Step 33368: {'lr': 0.0004465983357837866, 'samples': 17084928, 'steps': 33368, 'loss/train': 1.9357060194015503} +03/05/2022 04:40:49 - INFO - codeparrot_training - Skipping example with length 57 (seq_length=1024) +03/05/2022 04:40:54 - INFO - codeparrot_training - Step 33369: {'lr': 0.00044659505762511176, 'samples': 17085440, 'steps': 33369, 'loss/train': 1.5760473012924194} +03/05/2022 04:40:57 - INFO - codeparrot_training - Step 33370: {'lr': 0.00044659177937785417, 'samples': 17085952, 'steps': 33370, 'loss/train': 1.2440972328186035} +03/05/2022 04:40:57 - INFO - codeparrot_training - Skipping example with length 852 (seq_length=1024) +03/05/2022 04:41:03 - INFO - codeparrot_training - Step 33371: {'lr': 0.0004465885010420154, 'samples': 17086464, 'steps': 33371, 'loss/train': 1.8743789196014404} +03/05/2022 04:41:06 - INFO - codeparrot_training - Step 33372: {'lr': 0.0004465852226175968, 'samples': 17086976, 'steps': 33372, 'loss/train': 0.9144407510757446} +03/05/2022 04:41:07 - INFO - codeparrot_training - Skipping example with length 936 (seq_length=1024) +03/05/2022 04:41:11 - INFO - codeparrot_training - Step 33373: {'lr': 0.00044658194410460004, 'samples': 17087488, 'steps': 33373, 'loss/train': 1.1332484483718872} +03/05/2022 04:41:14 - INFO - codeparrot_training - Step 33374: {'lr': 0.0004465786655030264, 'samples': 17088000, 'steps': 33374, 'loss/train': 1.340173602104187} +03/05/2022 04:41:15 - INFO - codeparrot_training - Skipping example with length 851 (seq_length=1024) +03/05/2022 04:41:19 - INFO - codeparrot_training - Step 33375: {'lr': 0.00044657538681287746, 'samples': 17088512, 'steps': 33375, 'loss/train': 2.267954111099243} +03/05/2022 04:41:23 - INFO - codeparrot_training - Step 33376: {'lr': 0.0004465721080341547, 'samples': 17089024, 'steps': 33376, 'loss/train': 1.4547932147979736} +03/05/2022 04:41:23 - INFO - codeparrot_training - Skipping example with length 359 (seq_length=1024) +03/05/2022 04:41:28 - INFO - codeparrot_training - Step 33377: {'lr': 0.0004465688291668596, 'samples': 17089536, 'steps': 33377, 'loss/train': 1.074089527130127} +03/05/2022 04:41:31 - INFO - codeparrot_training - Step 33378: {'lr': 0.00044656555021099363, 'samples': 17090048, 'steps': 33378, 'loss/train': 1.950627326965332} +03/05/2022 04:41:31 - INFO - codeparrot_training - Skipping example with length 579 (seq_length=1024) +03/05/2022 04:41:36 - INFO - codeparrot_training - Step 33379: {'lr': 0.00044656227116655824, 'samples': 17090560, 'steps': 33379, 'loss/train': 2.3485255241394043} +03/05/2022 04:41:39 - INFO - codeparrot_training - Step 33380: {'lr': 0.00044655899203355486, 'samples': 17091072, 'steps': 33380, 'loss/train': 1.6018450260162354} +03/05/2022 04:41:40 - INFO - codeparrot_training - Skipping example with length 782 (seq_length=1024) +03/05/2022 04:41:45 - INFO - codeparrot_training - Step 33381: {'lr': 0.0004465557128119852, 'samples': 17091584, 'steps': 33381, 'loss/train': 0.8849830031394958} +03/05/2022 04:41:48 - INFO - codeparrot_training - Step 33382: {'lr': 0.00044655243350185037, 'samples': 17092096, 'steps': 33382, 'loss/train': 1.4541374444961548} +03/05/2022 04:41:49 - INFO - codeparrot_training - Skipping example with length 193 (seq_length=1024) +03/05/2022 04:41:54 - INFO - codeparrot_training - Step 33383: {'lr': 0.0004465491541031522, 'samples': 17092608, 'steps': 33383, 'loss/train': 1.1984227895736694} +03/05/2022 04:41:57 - INFO - codeparrot_training - Step 33384: {'lr': 0.00044654587461589193, 'samples': 17093120, 'steps': 33384, 'loss/train': 1.6082019805908203} +03/05/2022 04:42:00 - INFO - codeparrot_training - Step 33385: {'lr': 0.0004465425950400711, 'samples': 17093632, 'steps': 33385, 'loss/train': 2.2624125480651855} +03/05/2022 04:42:00 - INFO - codeparrot_training - Skipping example with length 281 (seq_length=1024) +03/05/2022 04:42:05 - INFO - codeparrot_training - Step 33386: {'lr': 0.00044653931537569125, 'samples': 17094144, 'steps': 33386, 'loss/train': 1.5172392129898071} +03/05/2022 04:42:08 - INFO - codeparrot_training - Step 33387: {'lr': 0.0004465360356227538, 'samples': 17094656, 'steps': 33387, 'loss/train': 1.4819080829620361} +03/05/2022 04:42:08 - INFO - codeparrot_training - Skipping example with length 1012 (seq_length=1024) +03/05/2022 04:42:14 - INFO - codeparrot_training - Step 33388: {'lr': 0.0004465327557812603, 'samples': 17095168, 'steps': 33388, 'loss/train': 2.3148624897003174} +03/05/2022 04:42:17 - INFO - codeparrot_training - Step 33389: {'lr': 0.0004465294758512121, 'samples': 17095680, 'steps': 33389, 'loss/train': 2.1063382625579834} +03/05/2022 04:42:17 - INFO - codeparrot_training - Skipping example with length 272 (seq_length=1024) +03/05/2022 04:42:22 - INFO - codeparrot_training - Step 33390: {'lr': 0.0004465261958326108, 'samples': 17096192, 'steps': 33390, 'loss/train': 1.6761436462402344} +03/05/2022 04:42:25 - INFO - codeparrot_training - Skipping example with length 921 (seq_length=1024) +03/05/2022 04:42:28 - INFO - codeparrot_training - Step 33391: {'lr': 0.0004465229157254578, 'samples': 17096704, 'steps': 33391, 'loss/train': 2.060272216796875} +03/05/2022 04:42:31 - INFO - codeparrot_training - Step 33392: {'lr': 0.0004465196355297546, 'samples': 17097216, 'steps': 33392, 'loss/train': 1.938143253326416} +03/05/2022 04:42:34 - INFO - codeparrot_training - Step 33393: {'lr': 0.0004465163552455027, 'samples': 17097728, 'steps': 33393, 'loss/train': 1.614751935005188} +03/05/2022 04:42:34 - INFO - codeparrot_training - Skipping example with length 640 (seq_length=1024) +03/05/2022 04:42:39 - INFO - codeparrot_training - Step 33394: {'lr': 0.0004465130748727036, 'samples': 17098240, 'steps': 33394, 'loss/train': 1.8033032417297363} +03/05/2022 04:42:42 - INFO - codeparrot_training - Step 33395: {'lr': 0.0004465097944113587, 'samples': 17098752, 'steps': 33395, 'loss/train': 1.4509755373001099} +03/05/2022 04:42:43 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 04:42:48 - INFO - codeparrot_training - Step 33396: {'lr': 0.00044650651386146954, 'samples': 17099264, 'steps': 33396, 'loss/train': 1.9044692516326904} +03/05/2022 04:42:51 - INFO - codeparrot_training - Step 33397: {'lr': 0.00044650323322303757, 'samples': 17099776, 'steps': 33397, 'loss/train': 1.2850303649902344} +03/05/2022 04:42:51 - INFO - codeparrot_training - Skipping example with length 250 (seq_length=1024) +03/05/2022 04:42:56 - INFO - codeparrot_training - Step 33398: {'lr': 0.0004464999524960642, 'samples': 17100288, 'steps': 33398, 'loss/train': 1.4102160930633545} +03/05/2022 04:42:59 - INFO - codeparrot_training - Step 33399: {'lr': 0.0004464966716805511, 'samples': 17100800, 'steps': 33399, 'loss/train': 1.8585915565490723} +03/05/2022 04:42:59 - INFO - codeparrot_training - Skipping example with length 595 (seq_length=1024) +03/05/2022 04:43:05 - INFO - codeparrot_training - Step 33400: {'lr': 0.0004464933907764996, 'samples': 17101312, 'steps': 33400, 'loss/train': 2.7101783752441406} +03/05/2022 04:43:07 - INFO - codeparrot_training - Skipping example with length 83 (seq_length=1024) +03/05/2022 04:43:10 - INFO - codeparrot_training - Step 33401: {'lr': 0.0004464901097839112, 'samples': 17101824, 'steps': 33401, 'loss/train': 1.620274543762207} +03/05/2022 04:43:13 - INFO - codeparrot_training - Step 33402: {'lr': 0.00044648682870278733, 'samples': 17102336, 'steps': 33402, 'loss/train': 1.240896224975586} +03/05/2022 04:43:18 - INFO - codeparrot_training - Step 33403: {'lr': 0.0004464835475331296, 'samples': 17102848, 'steps': 33403, 'loss/train': 1.7425428628921509} +03/05/2022 04:43:21 - INFO - codeparrot_training - Step 33404: {'lr': 0.0004464802662749394, 'samples': 17103360, 'steps': 33404, 'loss/train': 0.7599107623100281} +03/05/2022 04:43:24 - INFO - codeparrot_training - Skipping example with length 312 (seq_length=1024) +03/05/2022 04:43:27 - INFO - codeparrot_training - Step 33405: {'lr': 0.00044647698492821826, 'samples': 17103872, 'steps': 33405, 'loss/train': 1.1987831592559814} +03/05/2022 04:43:30 - INFO - codeparrot_training - Step 33406: {'lr': 0.00044647370349296757, 'samples': 17104384, 'steps': 33406, 'loss/train': 1.1481199264526367} +03/05/2022 04:43:32 - INFO - codeparrot_training - Skipping example with length 794 (seq_length=1024) +03/05/2022 04:43:35 - INFO - codeparrot_training - Step 33407: {'lr': 0.00044647042196918884, 'samples': 17104896, 'steps': 33407, 'loss/train': 1.1245368719100952} +03/05/2022 04:43:38 - INFO - codeparrot_training - Step 33408: {'lr': 0.00044646714035688365, 'samples': 17105408, 'steps': 33408, 'loss/train': 1.613560438156128} +03/05/2022 04:43:41 - INFO - codeparrot_training - Skipping example with length 487 (seq_length=1024) +03/05/2022 04:43:44 - INFO - codeparrot_training - Step 33409: {'lr': 0.00044646385865605335, 'samples': 17105920, 'steps': 33409, 'loss/train': 0.648435115814209} +03/05/2022 04:43:47 - INFO - codeparrot_training - Step 33410: {'lr': 0.0004464605768666995, 'samples': 17106432, 'steps': 33410, 'loss/train': 2.1573431491851807} +03/05/2022 04:43:49 - INFO - codeparrot_training - Skipping example with length 907 (seq_length=1024) +03/05/2022 04:43:52 - INFO - codeparrot_training - Step 33411: {'lr': 0.0004464572949888235, 'samples': 17106944, 'steps': 33411, 'loss/train': 1.7899521589279175} +03/05/2022 04:43:55 - INFO - codeparrot_training - Step 33412: {'lr': 0.0004464540130224268, 'samples': 17107456, 'steps': 33412, 'loss/train': 1.4265230894088745} +03/05/2022 04:43:57 - INFO - codeparrot_training - Skipping example with length 153 (seq_length=1024) +03/05/2022 04:44:00 - INFO - codeparrot_training - Step 33413: {'lr': 0.0004464507309675111, 'samples': 17107968, 'steps': 33413, 'loss/train': 0.9691981673240662} +03/05/2022 04:44:04 - INFO - codeparrot_training - Step 33414: {'lr': 0.00044644744882407767, 'samples': 17108480, 'steps': 33414, 'loss/train': 1.7132285833358765} +03/05/2022 04:44:06 - INFO - codeparrot_training - Skipping example with length 830 (seq_length=1024) +03/05/2022 04:44:09 - INFO - codeparrot_training - Step 33415: {'lr': 0.00044644416659212806, 'samples': 17108992, 'steps': 33415, 'loss/train': 1.0552632808685303} +03/05/2022 04:44:12 - INFO - codeparrot_training - Step 33416: {'lr': 0.00044644088427166375, 'samples': 17109504, 'steps': 33416, 'loss/train': 2.1172711849212646} +03/05/2022 04:44:14 - INFO - codeparrot_training - Skipping example with length 138 (seq_length=1024) +03/05/2022 04:44:17 - INFO - codeparrot_training - Step 33417: {'lr': 0.00044643760186268615, 'samples': 17110016, 'steps': 33417, 'loss/train': 2.0257163047790527} +03/05/2022 04:44:20 - INFO - codeparrot_training - Step 33418: {'lr': 0.00044643431936519683, 'samples': 17110528, 'steps': 33418, 'loss/train': 1.0607872009277344} +03/05/2022 04:44:23 - INFO - codeparrot_training - Skipping example with length 707 (seq_length=1024) +03/05/2022 04:44:26 - INFO - codeparrot_training - Step 33419: {'lr': 0.00044643103677919726, 'samples': 17111040, 'steps': 33419, 'loss/train': 1.671301245689392} +03/05/2022 04:44:29 - INFO - codeparrot_training - Step 33420: {'lr': 0.00044642775410468896, 'samples': 17111552, 'steps': 33420, 'loss/train': 0.9080524444580078} +03/05/2022 04:44:31 - INFO - codeparrot_training - Skipping example with length 759 (seq_length=1024) +03/05/2022 04:44:34 - INFO - codeparrot_training - Step 33421: {'lr': 0.00044642447134167316, 'samples': 17112064, 'steps': 33421, 'loss/train': 1.5299229621887207} +03/05/2022 04:44:37 - INFO - codeparrot_training - Step 33422: {'lr': 0.00044642118849015167, 'samples': 17112576, 'steps': 33422, 'loss/train': 1.1376054286956787} +03/05/2022 04:44:40 - INFO - codeparrot_training - Skipping example with length 604 (seq_length=1024) +03/05/2022 04:44:43 - INFO - codeparrot_training - Step 33423: {'lr': 0.0004464179055501258, 'samples': 17113088, 'steps': 33423, 'loss/train': 2.105508327484131} +03/05/2022 04:44:46 - INFO - codeparrot_training - Step 33424: {'lr': 0.00044641462252159705, 'samples': 17113600, 'steps': 33424, 'loss/train': 1.3555563688278198} +03/05/2022 04:44:51 - INFO - codeparrot_training - Step 33425: {'lr': 0.0004464113394045669, 'samples': 17114112, 'steps': 33425, 'loss/train': 1.564305067062378} +03/05/2022 04:44:54 - INFO - codeparrot_training - Step 33426: {'lr': 0.00044640805619903677, 'samples': 17114624, 'steps': 33426, 'loss/train': 1.4706215858459473} +03/05/2022 04:44:56 - INFO - codeparrot_training - Skipping example with length 489 (seq_length=1024) +03/05/2022 04:45:00 - INFO - codeparrot_training - Step 33427: {'lr': 0.00044640477290500824, 'samples': 17115136, 'steps': 33427, 'loss/train': 1.8843681812286377} +03/05/2022 04:45:03 - INFO - codeparrot_training - Step 33428: {'lr': 0.00044640148952248285, 'samples': 17115648, 'steps': 33428, 'loss/train': 1.6479525566101074} +03/05/2022 04:45:05 - INFO - codeparrot_training - Skipping example with length 359 (seq_length=1024) +03/05/2022 04:45:08 - INFO - codeparrot_training - Step 33429: {'lr': 0.00044639820605146184, 'samples': 17116160, 'steps': 33429, 'loss/train': 2.1154611110687256} +03/05/2022 04:45:11 - INFO - codeparrot_training - Step 33430: {'lr': 0.0004463949224919469, 'samples': 17116672, 'steps': 33430, 'loss/train': 1.2566444873809814} +03/05/2022 04:45:13 - INFO - codeparrot_training - Skipping example with length 341 (seq_length=1024) +03/05/2022 04:45:16 - INFO - codeparrot_training - Step 33431: {'lr': 0.0004463916388439394, 'samples': 17117184, 'steps': 33431, 'loss/train': 1.4414485692977905} +03/05/2022 04:45:20 - INFO - codeparrot_training - Step 33432: {'lr': 0.00044638835510744094, 'samples': 17117696, 'steps': 33432, 'loss/train': 1.686241626739502} +03/05/2022 04:45:21 - INFO - codeparrot_training - Skipping example with length 686 (seq_length=1024) +03/05/2022 04:45:25 - INFO - codeparrot_training - Step 33433: {'lr': 0.0004463850712824528, 'samples': 17118208, 'steps': 33433, 'loss/train': 2.1638596057891846} +03/05/2022 04:45:28 - INFO - codeparrot_training - Step 33434: {'lr': 0.0004463817873689766, 'samples': 17118720, 'steps': 33434, 'loss/train': 1.3323029279708862} +03/05/2022 04:45:30 - INFO - codeparrot_training - Skipping example with length 275 (seq_length=1024) +03/05/2022 04:45:33 - INFO - codeparrot_training - Step 33435: {'lr': 0.00044637850336701386, 'samples': 17119232, 'steps': 33435, 'loss/train': 1.509308099746704} +03/05/2022 04:45:37 - INFO - codeparrot_training - Step 33436: {'lr': 0.000446375219276566, 'samples': 17119744, 'steps': 33436, 'loss/train': 1.8432215452194214} +03/05/2022 04:45:38 - INFO - codeparrot_training - Skipping example with length 744 (seq_length=1024) +03/05/2022 04:45:42 - INFO - codeparrot_training - Step 33437: {'lr': 0.0004463719350976344, 'samples': 17120256, 'steps': 33437, 'loss/train': 1.8857122659683228} +03/05/2022 04:45:45 - INFO - codeparrot_training - Step 33438: {'lr': 0.0004463686508302207, 'samples': 17120768, 'steps': 33438, 'loss/train': 0.5965262651443481} +03/05/2022 04:45:47 - INFO - codeparrot_training - Skipping example with length 679 (seq_length=1024) +03/05/2022 04:45:50 - INFO - codeparrot_training - Step 33439: {'lr': 0.00044636536647432636, 'samples': 17121280, 'steps': 33439, 'loss/train': 1.1440011262893677} +03/05/2022 04:45:53 - INFO - codeparrot_training - Step 33440: {'lr': 0.00044636208202995277, 'samples': 17121792, 'steps': 33440, 'loss/train': 1.6265612840652466} +03/05/2022 04:45:55 - INFO - codeparrot_training - Skipping example with length 309 (seq_length=1024) +03/05/2022 04:45:59 - INFO - codeparrot_training - Step 33441: {'lr': 0.0004463587974971014, 'samples': 17122304, 'steps': 33441, 'loss/train': 1.9647272825241089} +03/05/2022 04:46:02 - INFO - codeparrot_training - Step 33442: {'lr': 0.0004463555128757739, 'samples': 17122816, 'steps': 33442, 'loss/train': 1.262209415435791} +03/05/2022 04:46:03 - INFO - codeparrot_training - Skipping example with length 121 (seq_length=1024) +03/05/2022 04:46:07 - INFO - codeparrot_training - Step 33443: {'lr': 0.00044635222816597153, 'samples': 17123328, 'steps': 33443, 'loss/train': 1.3243591785430908} +03/05/2022 04:46:10 - INFO - codeparrot_training - Step 33444: {'lr': 0.0004463489433676959, 'samples': 17123840, 'steps': 33444, 'loss/train': 1.7063919305801392} +03/05/2022 04:46:12 - INFO - codeparrot_training - Skipping example with length 684 (seq_length=1024) +03/05/2022 04:46:16 - INFO - codeparrot_training - Step 33445: {'lr': 0.00044634565848094854, 'samples': 17124352, 'steps': 33445, 'loss/train': 0.9963560104370117} +03/05/2022 04:46:19 - INFO - codeparrot_training - Step 33446: {'lr': 0.0004463423735057308, 'samples': 17124864, 'steps': 33446, 'loss/train': 1.8027663230895996} +03/05/2022 04:46:21 - INFO - codeparrot_training - Skipping example with length 957 (seq_length=1024) +03/05/2022 04:46:24 - INFO - codeparrot_training - Step 33447: {'lr': 0.00044633908844204424, 'samples': 17125376, 'steps': 33447, 'loss/train': 1.5296945571899414} +03/05/2022 04:46:27 - INFO - codeparrot_training - Step 33448: {'lr': 0.0004463358032898903, 'samples': 17125888, 'steps': 33448, 'loss/train': 2.0157408714294434} +03/05/2022 04:46:29 - INFO - codeparrot_training - Skipping example with length 788 (seq_length=1024) +03/05/2022 04:46:32 - INFO - codeparrot_training - Step 33449: {'lr': 0.00044633251804927044, 'samples': 17126400, 'steps': 33449, 'loss/train': 3.288628578186035} +03/05/2022 04:46:36 - INFO - codeparrot_training - Step 33450: {'lr': 0.0004463292327201862, 'samples': 17126912, 'steps': 33450, 'loss/train': 2.045158863067627} +03/05/2022 04:46:37 - INFO - codeparrot_training - Skipping example with length 447 (seq_length=1024) +03/05/2022 04:46:41 - INFO - codeparrot_training - Step 33451: {'lr': 0.0004463259473026391, 'samples': 17127424, 'steps': 33451, 'loss/train': 2.069981098175049} +03/05/2022 04:46:44 - INFO - codeparrot_training - Step 33452: {'lr': 0.0004463226617966305, 'samples': 17127936, 'steps': 33452, 'loss/train': 1.3332791328430176} +03/05/2022 04:46:46 - INFO - codeparrot_training - Skipping example with length 693 (seq_length=1024) +03/05/2022 04:46:49 - INFO - codeparrot_training - Step 33453: {'lr': 0.00044631937620216196, 'samples': 17128448, 'steps': 33453, 'loss/train': 1.7970229387283325} +03/05/2022 04:46:53 - INFO - codeparrot_training - Step 33454: {'lr': 0.00044631609051923494, 'samples': 17128960, 'steps': 33454, 'loss/train': 1.7123819589614868} +03/05/2022 04:46:54 - INFO - codeparrot_training - Skipping example with length 865 (seq_length=1024) +03/05/2022 04:46:58 - INFO - codeparrot_training - Step 33455: {'lr': 0.00044631280474785086, 'samples': 17129472, 'steps': 33455, 'loss/train': 1.5462727546691895} +03/05/2022 04:47:01 - INFO - codeparrot_training - Step 33456: {'lr': 0.0004463095188880113, 'samples': 17129984, 'steps': 33456, 'loss/train': 1.3446537256240845} +03/05/2022 04:47:02 - INFO - codeparrot_training - Skipping example with length 188 (seq_length=1024) +03/05/2022 04:47:06 - INFO - codeparrot_training - Step 33457: {'lr': 0.00044630623293971775, 'samples': 17130496, 'steps': 33457, 'loss/train': 1.1698766946792603} +03/05/2022 04:47:09 - INFO - codeparrot_training - Step 33458: {'lr': 0.0004463029469029716, 'samples': 17131008, 'steps': 33458, 'loss/train': 1.8038116693496704} +03/05/2022 04:47:11 - INFO - codeparrot_training - Skipping example with length 34 (seq_length=1024) +03/05/2022 04:47:14 - INFO - codeparrot_training - Step 33459: {'lr': 0.0004462996607777743, 'samples': 17131520, 'steps': 33459, 'loss/train': 1.4883025884628296} +03/05/2022 04:47:18 - INFO - codeparrot_training - Step 33460: {'lr': 0.00044629637456412754, 'samples': 17132032, 'steps': 33460, 'loss/train': 1.9204295873641968} +03/05/2022 04:47:19 - INFO - codeparrot_training - Skipping example with length 624 (seq_length=1024) +03/05/2022 04:47:23 - INFO - codeparrot_training - Step 33461: {'lr': 0.0004462930882620325, 'samples': 17132544, 'steps': 33461, 'loss/train': 1.6651878356933594} +03/05/2022 04:47:26 - INFO - codeparrot_training - Step 33462: {'lr': 0.0004462898018714909, 'samples': 17133056, 'steps': 33462, 'loss/train': 1.9412455558776855} +03/05/2022 04:47:27 - INFO - codeparrot_training - Skipping example with length 889 (seq_length=1024) +03/05/2022 04:47:32 - INFO - codeparrot_training - Step 33463: {'lr': 0.0004462865153925042, 'samples': 17133568, 'steps': 33463, 'loss/train': 1.9131163358688354} +03/05/2022 04:47:35 - INFO - codeparrot_training - Step 33464: {'lr': 0.00044628322882507375, 'samples': 17134080, 'steps': 33464, 'loss/train': 6.435811519622803} +03/05/2022 04:47:36 - INFO - codeparrot_training - Skipping example with length 870 (seq_length=1024) +03/05/2022 04:47:40 - INFO - codeparrot_training - Step 33465: {'lr': 0.0004462799421692012, 'samples': 17134592, 'steps': 33465, 'loss/train': 2.3551957607269287} +03/05/2022 04:47:43 - INFO - codeparrot_training - Step 33466: {'lr': 0.0004462766554248878, 'samples': 17135104, 'steps': 33466, 'loss/train': 1.803325891494751} +03/05/2022 04:47:45 - INFO - codeparrot_training - Skipping example with length 215 (seq_length=1024) +03/05/2022 04:47:48 - INFO - codeparrot_training - Step 33467: {'lr': 0.0004462733685921353, 'samples': 17135616, 'steps': 33467, 'loss/train': 1.8293875455856323} +03/05/2022 04:47:51 - INFO - codeparrot_training - Step 33468: {'lr': 0.000446270081670945, 'samples': 17136128, 'steps': 33468, 'loss/train': 2.119594097137451} +03/05/2022 04:47:53 - INFO - codeparrot_training - Skipping example with length 621 (seq_length=1024) +03/05/2022 04:47:57 - INFO - codeparrot_training - Step 33469: {'lr': 0.0004462667946613184, 'samples': 17136640, 'steps': 33469, 'loss/train': 2.3080646991729736} +03/05/2022 04:48:00 - INFO - codeparrot_training - Step 33470: {'lr': 0.00044626350756325707, 'samples': 17137152, 'steps': 33470, 'loss/train': 2.174365520477295} +03/05/2022 04:48:01 - INFO - codeparrot_training - Skipping example with length 408 (seq_length=1024) +03/05/2022 04:48:05 - INFO - codeparrot_training - Step 33471: {'lr': 0.0004462602203767624, 'samples': 17137664, 'steps': 33471, 'loss/train': 1.5706700086593628} +03/05/2022 04:48:08 - INFO - codeparrot_training - Step 33472: {'lr': 0.0004462569331018359, 'samples': 17138176, 'steps': 33472, 'loss/train': 2.118823528289795} +03/05/2022 04:48:10 - INFO - codeparrot_training - Skipping example with length 509 (seq_length=1024) +03/05/2022 04:48:14 - INFO - codeparrot_training - Step 33473: {'lr': 0.00044625364573847904, 'samples': 17138688, 'steps': 33473, 'loss/train': 3.0985913276672363} +03/05/2022 04:48:17 - INFO - codeparrot_training - Step 33474: {'lr': 0.0004462503582866933, 'samples': 17139200, 'steps': 33474, 'loss/train': 1.7558958530426025} +03/05/2022 04:48:19 - INFO - codeparrot_training - Skipping example with length 177 (seq_length=1024) +03/05/2022 04:48:22 - INFO - codeparrot_training - Step 33475: {'lr': 0.00044624707074648017, 'samples': 17139712, 'steps': 33475, 'loss/train': 4.688785076141357} +03/05/2022 04:48:25 - INFO - codeparrot_training - Step 33476: {'lr': 0.0004462437831178412, 'samples': 17140224, 'steps': 33476, 'loss/train': 1.8062219619750977} +03/05/2022 04:48:27 - INFO - codeparrot_training - Skipping example with length 761 (seq_length=1024) +03/05/2022 04:48:31 - INFO - codeparrot_training - Step 33477: {'lr': 0.00044624049540077784, 'samples': 17140736, 'steps': 33477, 'loss/train': 1.7763456106185913} +03/05/2022 04:48:34 - INFO - codeparrot_training - Step 33478: {'lr': 0.0004462372075952914, 'samples': 17141248, 'steps': 33478, 'loss/train': 1.7571529150009155} +03/05/2022 04:48:36 - INFO - codeparrot_training - Skipping example with length 703 (seq_length=1024) +03/05/2022 04:48:39 - INFO - codeparrot_training - Step 33479: {'lr': 0.0004462339197013836, 'samples': 17141760, 'steps': 33479, 'loss/train': 1.3733891248703003} +03/05/2022 04:48:42 - INFO - codeparrot_training - Step 33480: {'lr': 0.00044623063171905585, 'samples': 17142272, 'steps': 33480, 'loss/train': 1.0368611812591553} +03/05/2022 04:48:44 - INFO - codeparrot_training - Skipping example with length 215 (seq_length=1024) +03/05/2022 04:48:47 - INFO - codeparrot_training - Step 33481: {'lr': 0.0004462273436483095, 'samples': 17142784, 'steps': 33481, 'loss/train': 1.9818273782730103} +03/05/2022 04:48:51 - INFO - codeparrot_training - Step 33482: {'lr': 0.00044622405548914627, 'samples': 17143296, 'steps': 33482, 'loss/train': 4.651758670806885} +03/05/2022 04:48:53 - INFO - codeparrot_training - Skipping example with length 981 (seq_length=1024) +03/05/2022 04:48:56 - INFO - codeparrot_training - Step 33483: {'lr': 0.00044622076724156747, 'samples': 17143808, 'steps': 33483, 'loss/train': 1.781371831893921} +03/05/2022 04:48:59 - INFO - codeparrot_training - Step 33484: {'lr': 0.00044621747890557454, 'samples': 17144320, 'steps': 33484, 'loss/train': 2.4993910789489746} +03/05/2022 04:49:01 - INFO - codeparrot_training - Skipping example with length 11 (seq_length=1024) +03/05/2022 04:49:04 - INFO - codeparrot_training - Step 33485: {'lr': 0.0004462141904811691, 'samples': 17144832, 'steps': 33485, 'loss/train': 1.9342212677001953} +03/05/2022 04:49:08 - INFO - codeparrot_training - Step 33486: {'lr': 0.00044621090196835254, 'samples': 17145344, 'steps': 33486, 'loss/train': 0.09061639755964279} +03/05/2022 04:49:09 - INFO - codeparrot_training - Skipping example with length 193 (seq_length=1024) +03/05/2022 04:49:13 - INFO - codeparrot_training - Step 33487: {'lr': 0.00044620761336712646, 'samples': 17145856, 'steps': 33487, 'loss/train': 2.005896806716919} +03/05/2022 04:49:16 - INFO - codeparrot_training - Step 33488: {'lr': 0.00044620432467749215, 'samples': 17146368, 'steps': 33488, 'loss/train': 1.2757248878479004} +03/05/2022 04:49:18 - INFO - codeparrot_training - Skipping example with length 318 (seq_length=1024) +03/05/2022 04:49:22 - INFO - codeparrot_training - Step 33489: {'lr': 0.0004462010358994513, 'samples': 17146880, 'steps': 33489, 'loss/train': 1.0555795431137085} +03/05/2022 04:49:25 - INFO - codeparrot_training - Step 33490: {'lr': 0.0004461977470330052, 'samples': 17147392, 'steps': 33490, 'loss/train': 1.8667715787887573} +03/05/2022 04:49:28 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 04:49:30 - INFO - codeparrot_training - Step 33491: {'lr': 0.00044619445807815545, 'samples': 17147904, 'steps': 33491, 'loss/train': 0.5039077997207642} +03/05/2022 04:49:33 - INFO - codeparrot_training - Step 33492: {'lr': 0.00044619116903490356, 'samples': 17148416, 'steps': 33492, 'loss/train': 1.5600253343582153} +03/05/2022 04:49:36 - INFO - codeparrot_training - Skipping example with length 618 (seq_length=1024) +03/05/2022 04:49:39 - INFO - codeparrot_training - Step 33493: {'lr': 0.00044618787990325086, 'samples': 17148928, 'steps': 33493, 'loss/train': 1.9713783264160156} +03/05/2022 04:49:42 - INFO - codeparrot_training - Step 33494: {'lr': 0.000446184590683199, 'samples': 17149440, 'steps': 33494, 'loss/train': 1.550588607788086} +03/05/2022 04:49:44 - INFO - codeparrot_training - Skipping example with length 504 (seq_length=1024) +03/05/2022 04:49:47 - INFO - codeparrot_training - Step 33495: {'lr': 0.00044618130137474935, 'samples': 17149952, 'steps': 33495, 'loss/train': 1.7003018856048584} +03/05/2022 04:49:50 - INFO - codeparrot_training - Step 33496: {'lr': 0.0004461780119779034, 'samples': 17150464, 'steps': 33496, 'loss/train': 1.414426326751709} +03/05/2022 04:49:53 - INFO - codeparrot_training - Skipping example with length 499 (seq_length=1024) +03/05/2022 04:49:55 - INFO - codeparrot_training - Step 33497: {'lr': 0.0004461747224926628, 'samples': 17150976, 'steps': 33497, 'loss/train': 1.8659199476242065} +03/05/2022 04:49:59 - INFO - codeparrot_training - Step 33498: {'lr': 0.0004461714329190288, 'samples': 17151488, 'steps': 33498, 'loss/train': 2.3922362327575684} +03/05/2022 04:50:01 - INFO - codeparrot_training - Skipping example with length 476 (seq_length=1024) +03/05/2022 04:50:04 - INFO - codeparrot_training - Step 33499: {'lr': 0.00044616814325700293, 'samples': 17152000, 'steps': 33499, 'loss/train': 1.8888484239578247} +03/05/2022 04:50:07 - INFO - codeparrot_training - Step 33500: {'lr': 0.0004461648535065869, 'samples': 17152512, 'steps': 33500, 'loss/train': 2.139421224594116} +03/05/2022 04:50:10 - INFO - codeparrot_training - Skipping example with length 587 (seq_length=1024) +03/05/2022 04:50:13 - INFO - codeparrot_training - Step 33501: {'lr': 0.0004461615636677818, 'samples': 17153024, 'steps': 33501, 'loss/train': 1.6973953247070312} +03/05/2022 04:50:16 - INFO - codeparrot_training - Step 33502: {'lr': 0.0004461582737405895, 'samples': 17153536, 'steps': 33502, 'loss/train': 1.3614157438278198} +03/05/2022 04:50:18 - INFO - codeparrot_training - Skipping example with length 127 (seq_length=1024) +03/05/2022 04:50:21 - INFO - codeparrot_training - Step 33503: {'lr': 0.00044615498372501116, 'samples': 17154048, 'steps': 33503, 'loss/train': 1.9766550064086914} +03/05/2022 04:50:24 - INFO - codeparrot_training - Step 33504: {'lr': 0.00044615169362104856, 'samples': 17154560, 'steps': 33504, 'loss/train': 2.0890936851501465} +03/05/2022 04:50:27 - INFO - codeparrot_training - Skipping example with length 1016 (seq_length=1024) +03/05/2022 04:50:30 - INFO - codeparrot_training - Step 33505: {'lr': 0.00044614840342870293, 'samples': 17155072, 'steps': 33505, 'loss/train': 1.7183324098587036} +03/05/2022 04:50:33 - INFO - codeparrot_training - Step 33506: {'lr': 0.0004461451131479759, 'samples': 17155584, 'steps': 33506, 'loss/train': 1.9086568355560303} +03/05/2022 04:50:35 - INFO - codeparrot_training - Skipping example with length 833 (seq_length=1024) +03/05/2022 04:50:38 - INFO - codeparrot_training - Step 33507: {'lr': 0.0004461418227788689, 'samples': 17156096, 'steps': 33507, 'loss/train': 2.0103378295898438} +03/05/2022 04:50:41 - INFO - codeparrot_training - Step 33508: {'lr': 0.00044613853232138343, 'samples': 17156608, 'steps': 33508, 'loss/train': 1.9204638004302979} +03/05/2022 04:50:43 - INFO - codeparrot_training - Skipping example with length 224 (seq_length=1024) +03/05/2022 04:50:47 - INFO - codeparrot_training - Step 33509: {'lr': 0.0004461352417755209, 'samples': 17157120, 'steps': 33509, 'loss/train': 2.0305142402648926} +03/05/2022 04:50:50 - INFO - codeparrot_training - Step 33510: {'lr': 0.0004461319511412829, 'samples': 17157632, 'steps': 33510, 'loss/train': 1.619326114654541} +03/05/2022 04:50:52 - INFO - codeparrot_training - Skipping example with length 149 (seq_length=1024) +03/05/2022 04:50:55 - INFO - codeparrot_training - Step 33511: {'lr': 0.00044612866041867093, 'samples': 17158144, 'steps': 33511, 'loss/train': 2.0225210189819336} +03/05/2022 04:50:58 - INFO - codeparrot_training - Step 33512: {'lr': 0.0004461253696076863, 'samples': 17158656, 'steps': 33512, 'loss/train': 1.3889366388320923} +03/05/2022 04:51:00 - INFO - codeparrot_training - Skipping example with length 457 (seq_length=1024) +03/05/2022 04:51:04 - INFO - codeparrot_training - Step 33513: {'lr': 0.00044612207870833073, 'samples': 17159168, 'steps': 33513, 'loss/train': 1.4979047775268555} +03/05/2022 04:51:07 - INFO - codeparrot_training - Step 33514: {'lr': 0.0004461187877206055, 'samples': 17159680, 'steps': 33514, 'loss/train': 1.6080878973007202} +03/05/2022 04:51:09 - INFO - codeparrot_training - Skipping example with length 210 (seq_length=1024) +03/05/2022 04:51:12 - INFO - codeparrot_training - Step 33515: {'lr': 0.00044611549664451216, 'samples': 17160192, 'steps': 33515, 'loss/train': 1.774382472038269} +03/05/2022 04:51:15 - INFO - codeparrot_training - Step 33516: {'lr': 0.0004461122054800522, 'samples': 17160704, 'steps': 33516, 'loss/train': 1.6848671436309814} +03/05/2022 04:51:17 - INFO - codeparrot_training - Skipping example with length 257 (seq_length=1024) +03/05/2022 04:51:20 - INFO - codeparrot_training - Step 33517: {'lr': 0.00044610891422722714, 'samples': 17161216, 'steps': 33517, 'loss/train': 1.154137134552002} +03/05/2022 04:51:24 - INFO - codeparrot_training - Step 33518: {'lr': 0.00044610562288603846, 'samples': 17161728, 'steps': 33518, 'loss/train': 1.846269130706787} +03/05/2022 04:51:26 - INFO - codeparrot_training - Skipping example with length 566 (seq_length=1024) +03/05/2022 04:51:29 - INFO - codeparrot_training - Step 33519: {'lr': 0.00044610233145648756, 'samples': 17162240, 'steps': 33519, 'loss/train': 1.8281073570251465} +03/05/2022 04:51:32 - INFO - codeparrot_training - Step 33520: {'lr': 0.00044609903993857603, 'samples': 17162752, 'steps': 33520, 'loss/train': 1.4997453689575195} +03/05/2022 04:51:34 - INFO - codeparrot_training - Skipping example with length 812 (seq_length=1024) +03/05/2022 04:51:37 - INFO - codeparrot_training - Step 33521: {'lr': 0.0004460957483323052, 'samples': 17163264, 'steps': 33521, 'loss/train': 2.154050827026367} +03/05/2022 04:51:40 - INFO - codeparrot_training - Step 33522: {'lr': 0.0004460924566376767, 'samples': 17163776, 'steps': 33522, 'loss/train': 1.5889368057250977} +03/05/2022 04:51:43 - INFO - codeparrot_training - Skipping example with length 507 (seq_length=1024) +03/05/2022 04:51:46 - INFO - codeparrot_training - Step 33523: {'lr': 0.00044608916485469195, 'samples': 17164288, 'steps': 33523, 'loss/train': 1.9227056503295898} +03/05/2022 04:51:49 - INFO - codeparrot_training - Step 33524: {'lr': 0.0004460858729833525, 'samples': 17164800, 'steps': 33524, 'loss/train': 1.7285442352294922} +03/05/2022 04:51:51 - INFO - codeparrot_training - Skipping example with length 187 (seq_length=1024) +03/05/2022 04:51:54 - INFO - codeparrot_training - Step 33525: {'lr': 0.0004460825810236598, 'samples': 17165312, 'steps': 33525, 'loss/train': 1.899969458580017} +03/05/2022 04:51:57 - INFO - codeparrot_training - Step 33526: {'lr': 0.00044607928897561524, 'samples': 17165824, 'steps': 33526, 'loss/train': 2.687861204147339} +03/05/2022 04:52:03 - INFO - codeparrot_training - Step 33527: {'lr': 0.0004460759968392204, 'samples': 17166336, 'steps': 33527, 'loss/train': 1.2853384017944336} +03/05/2022 04:52:06 - INFO - codeparrot_training - Step 33528: {'lr': 0.0004460727046144768, 'samples': 17166848, 'steps': 33528, 'loss/train': 2.344062089920044} +03/05/2022 04:52:09 - INFO - codeparrot_training - Step 33529: {'lr': 0.00044606941230138574, 'samples': 17167360, 'steps': 33529, 'loss/train': 1.0734360218048096} +03/05/2022 04:52:09 - INFO - codeparrot_training - Skipping example with length 228 (seq_length=1024) +03/05/2022 04:52:14 - INFO - codeparrot_training - Step 33530: {'lr': 0.0004460661198999489, 'samples': 17167872, 'steps': 33530, 'loss/train': 1.2307394742965698} +03/05/2022 04:52:18 - INFO - codeparrot_training - Step 33531: {'lr': 0.0004460628274101677, 'samples': 17168384, 'steps': 33531, 'loss/train': 1.8025763034820557} +03/05/2022 04:52:18 - INFO - codeparrot_training - Skipping example with length 645 (seq_length=1024) +03/05/2022 04:52:23 - INFO - codeparrot_training - Step 33532: {'lr': 0.0004460595348320436, 'samples': 17168896, 'steps': 33532, 'loss/train': 1.5134105682373047} +03/05/2022 04:52:26 - INFO - codeparrot_training - Skipping example with length 910 (seq_length=1024) +03/05/2022 04:52:28 - INFO - codeparrot_training - Step 33533: {'lr': 0.0004460562421655782, 'samples': 17169408, 'steps': 33533, 'loss/train': 1.0199304819107056} +03/05/2022 04:52:31 - INFO - codeparrot_training - Step 33534: {'lr': 0.0004460529494107727, 'samples': 17169920, 'steps': 33534, 'loss/train': 1.6037136316299438} +03/05/2022 04:52:35 - INFO - codeparrot_training - Step 33535: {'lr': 0.00044604965656762884, 'samples': 17170432, 'steps': 33535, 'loss/train': 1.4356862306594849} +03/05/2022 04:52:35 - INFO - codeparrot_training - Skipping example with length 793 (seq_length=1024) +03/05/2022 04:52:40 - INFO - codeparrot_training - Step 33536: {'lr': 0.0004460463636361481, 'samples': 17170944, 'steps': 33536, 'loss/train': 2.2424275875091553} +03/05/2022 04:52:43 - INFO - codeparrot_training - Step 33537: {'lr': 0.00044604307061633187, 'samples': 17171456, 'steps': 33537, 'loss/train': 1.8621257543563843} +03/05/2022 04:52:43 - INFO - codeparrot_training - Skipping example with length 375 (seq_length=1024) +03/05/2022 04:52:48 - INFO - codeparrot_training - Step 33538: {'lr': 0.0004460397775081816, 'samples': 17171968, 'steps': 33538, 'loss/train': 2.135127305984497} +03/05/2022 04:52:52 - INFO - codeparrot_training - Step 33539: {'lr': 0.00044603648431169884, 'samples': 17172480, 'steps': 33539, 'loss/train': 1.007950782775879} +03/05/2022 04:52:52 - INFO - codeparrot_training - Skipping example with length 640 (seq_length=1024) +03/05/2022 04:52:58 - INFO - codeparrot_training - Step 33540: {'lr': 0.0004460331910268851, 'samples': 17172992, 'steps': 33540, 'loss/train': 0.6041748523712158} +03/05/2022 04:53:01 - INFO - codeparrot_training - Step 33541: {'lr': 0.0004460298976537418, 'samples': 17173504, 'steps': 33541, 'loss/train': 2.115260362625122} +03/05/2022 04:53:04 - INFO - codeparrot_training - Step 33542: {'lr': 0.00044602660419227046, 'samples': 17174016, 'steps': 33542, 'loss/train': 1.0270541906356812} +03/05/2022 04:53:04 - INFO - codeparrot_training - Skipping example with length 269 (seq_length=1024) +03/05/2022 04:53:09 - INFO - codeparrot_training - Step 33543: {'lr': 0.0004460233106424726, 'samples': 17174528, 'steps': 33543, 'loss/train': 0.8249497413635254} +03/05/2022 04:53:12 - INFO - codeparrot_training - Skipping example with length 109 (seq_length=1024) +03/05/2022 04:53:15 - INFO - codeparrot_training - Step 33544: {'lr': 0.00044602001700434963, 'samples': 17175040, 'steps': 33544, 'loss/train': 1.8265620470046997} +03/05/2022 04:53:18 - INFO - codeparrot_training - Step 33545: {'lr': 0.00044601672327790304, 'samples': 17175552, 'steps': 33545, 'loss/train': 2.3485727310180664} +03/05/2022 04:53:21 - INFO - codeparrot_training - Step 33546: {'lr': 0.00044601342946313437, 'samples': 17176064, 'steps': 33546, 'loss/train': 1.3221460580825806} +03/05/2022 04:53:21 - INFO - codeparrot_training - Skipping example with length 164 (seq_length=1024) +03/05/2022 04:53:26 - INFO - codeparrot_training - Step 33547: {'lr': 0.0004460101355600451, 'samples': 17176576, 'steps': 33547, 'loss/train': 0.8309028744697571} +03/05/2022 04:53:29 - INFO - codeparrot_training - Step 33548: {'lr': 0.0004460068415686366, 'samples': 17177088, 'steps': 33548, 'loss/train': 2.366419553756714} +03/05/2022 04:53:29 - INFO - codeparrot_training - Skipping example with length 354 (seq_length=1024) +03/05/2022 04:53:35 - INFO - codeparrot_training - Step 33549: {'lr': 0.0004460035474889105, 'samples': 17177600, 'steps': 33549, 'loss/train': 1.4740426540374756} +03/05/2022 04:53:38 - INFO - codeparrot_training - Skipping example with length 79 (seq_length=1024) +03/05/2022 04:53:40 - INFO - codeparrot_training - Step 33550: {'lr': 0.00044600025332086824, 'samples': 17178112, 'steps': 33550, 'loss/train': 2.2679879665374756} +03/05/2022 04:53:43 - INFO - codeparrot_training - Step 33551: {'lr': 0.0004459969590645113, 'samples': 17178624, 'steps': 33551, 'loss/train': 2.0823307037353516} +03/05/2022 04:53:46 - INFO - codeparrot_training - Skipping example with length 35 (seq_length=1024) +03/05/2022 04:53:48 - INFO - codeparrot_training - Step 33552: {'lr': 0.000445993664719841, 'samples': 17179136, 'steps': 33552, 'loss/train': 1.7948023080825806} +03/05/2022 04:53:52 - INFO - codeparrot_training - Step 33553: {'lr': 0.0004459903702868592, 'samples': 17179648, 'steps': 33553, 'loss/train': 1.6942301988601685} +03/05/2022 04:53:55 - INFO - codeparrot_training - Step 33554: {'lr': 0.00044598707576556706, 'samples': 17180160, 'steps': 33554, 'loss/train': 1.7522468566894531} +03/05/2022 04:53:55 - INFO - codeparrot_training - Skipping example with length 207 (seq_length=1024) +03/05/2022 04:54:01 - INFO - codeparrot_training - Step 33555: {'lr': 0.00044598378115596614, 'samples': 17180672, 'steps': 33555, 'loss/train': 2.0756826400756836} +03/05/2022 04:54:04 - INFO - codeparrot_training - Step 33556: {'lr': 0.000445980486458058, 'samples': 17181184, 'steps': 33556, 'loss/train': 2.170283317565918} +03/05/2022 04:54:07 - INFO - codeparrot_training - Step 33557: {'lr': 0.0004459771916718441, 'samples': 17181696, 'steps': 33557, 'loss/train': 2.1352639198303223} +03/05/2022 04:54:07 - INFO - codeparrot_training - Skipping example with length 956 (seq_length=1024) +03/05/2022 04:54:12 - INFO - codeparrot_training - Step 33558: {'lr': 0.0004459738967973258, 'samples': 17182208, 'steps': 33558, 'loss/train': 1.466123104095459} +03/05/2022 04:54:15 - INFO - codeparrot_training - Step 33559: {'lr': 0.00044597060183450477, 'samples': 17182720, 'steps': 33559, 'loss/train': 1.218019723892212} +03/05/2022 04:54:15 - INFO - codeparrot_training - Skipping example with length 913 (seq_length=1024) +03/05/2022 04:54:21 - INFO - codeparrot_training - Step 33560: {'lr': 0.00044596730678338236, 'samples': 17183232, 'steps': 33560, 'loss/train': 1.660805106163025} +03/05/2022 04:54:24 - INFO - codeparrot_training - Step 33561: {'lr': 0.0004459640116439602, 'samples': 17183744, 'steps': 33561, 'loss/train': 1.7097482681274414} +03/05/2022 04:54:24 - INFO - codeparrot_training - Skipping example with length 156 (seq_length=1024) +03/05/2022 04:54:29 - INFO - codeparrot_training - Step 33562: {'lr': 0.0004459607164162396, 'samples': 17184256, 'steps': 33562, 'loss/train': 1.9240474700927734} +03/05/2022 04:54:32 - INFO - codeparrot_training - Step 33563: {'lr': 0.00044595742110022216, 'samples': 17184768, 'steps': 33563, 'loss/train': 1.6915699243545532} +03/05/2022 04:54:32 - INFO - codeparrot_training - Skipping example with length 440 (seq_length=1024) +03/05/2022 04:54:38 - INFO - codeparrot_training - Step 33564: {'lr': 0.00044595412569590934, 'samples': 17185280, 'steps': 33564, 'loss/train': 1.898544192314148} +03/05/2022 04:54:40 - INFO - codeparrot_training - Skipping example with length 847 (seq_length=1024) +03/05/2022 04:54:43 - INFO - codeparrot_training - Step 33565: {'lr': 0.0004459508302033025, 'samples': 17185792, 'steps': 33565, 'loss/train': 1.4834462404251099} +03/05/2022 04:54:46 - INFO - codeparrot_training - Step 33566: {'lr': 0.00044594753462240335, 'samples': 17186304, 'steps': 33566, 'loss/train': 1.7808737754821777} +03/05/2022 04:54:49 - INFO - codeparrot_training - Skipping example with length 391 (seq_length=1024) +03/05/2022 04:54:51 - INFO - codeparrot_training - Step 33567: {'lr': 0.0004459442389532132, 'samples': 17186816, 'steps': 33567, 'loss/train': 1.721524953842163} +03/05/2022 04:54:55 - INFO - codeparrot_training - Step 33568: {'lr': 0.0004459409431957337, 'samples': 17187328, 'steps': 33568, 'loss/train': 4.255745887756348} +03/05/2022 04:54:58 - INFO - codeparrot_training - Step 33569: {'lr': 0.00044593764734996615, 'samples': 17187840, 'steps': 33569, 'loss/train': 2.6696643829345703} +03/05/2022 04:54:58 - INFO - codeparrot_training - Skipping example with length 1014 (seq_length=1024) +03/05/2022 04:55:03 - INFO - codeparrot_training - Step 33570: {'lr': 0.00044593435141591215, 'samples': 17188352, 'steps': 33570, 'loss/train': 2.147439956665039} +03/05/2022 04:55:06 - INFO - codeparrot_training - Step 33571: {'lr': 0.00044593105539357313, 'samples': 17188864, 'steps': 33571, 'loss/train': 1.6487151384353638} +03/05/2022 04:55:07 - INFO - codeparrot_training - Skipping example with length 196 (seq_length=1024) +03/05/2022 04:55:12 - INFO - codeparrot_training - Step 33572: {'lr': 0.00044592775928295063, 'samples': 17189376, 'steps': 33572, 'loss/train': 1.1814044713974} +03/05/2022 04:55:15 - INFO - codeparrot_training - Step 33573: {'lr': 0.0004459244630840461, 'samples': 17189888, 'steps': 33573, 'loss/train': 1.4722651243209839} +03/05/2022 04:55:16 - INFO - codeparrot_training - Skipping example with length 458 (seq_length=1024) +03/05/2022 04:55:20 - INFO - codeparrot_training - Step 33574: {'lr': 0.000445921166796861, 'samples': 17190400, 'steps': 33574, 'loss/train': 2.474961042404175} +03/05/2022 04:55:24 - INFO - codeparrot_training - Step 33575: {'lr': 0.00044591787042139684, 'samples': 17190912, 'steps': 33575, 'loss/train': 2.0909111499786377} +03/05/2022 04:55:25 - INFO - codeparrot_training - Skipping example with length 777 (seq_length=1024) +03/05/2022 04:55:29 - INFO - codeparrot_training - Step 33576: {'lr': 0.0004459145739576552, 'samples': 17191424, 'steps': 33576, 'loss/train': 1.3652796745300293} +03/05/2022 04:55:32 - INFO - codeparrot_training - Step 33577: {'lr': 0.0004459112774056374, 'samples': 17191936, 'steps': 33577, 'loss/train': 1.6046525239944458} +03/05/2022 04:55:33 - INFO - codeparrot_training - Skipping example with length 317 (seq_length=1024) +03/05/2022 04:55:37 - INFO - codeparrot_training - Step 33578: {'lr': 0.000445907980765345, 'samples': 17192448, 'steps': 33578, 'loss/train': 1.1817234754562378} +03/05/2022 04:55:41 - INFO - codeparrot_training - Step 33579: {'lr': 0.00044590468403677954, 'samples': 17192960, 'steps': 33579, 'loss/train': 2.0022499561309814} +03/05/2022 04:55:42 - INFO - codeparrot_training - Skipping example with length 956 (seq_length=1024) +03/05/2022 04:55:46 - INFO - codeparrot_training - Step 33580: {'lr': 0.00044590138721994243, 'samples': 17193472, 'steps': 33580, 'loss/train': 1.7402523756027222} +03/05/2022 04:55:49 - INFO - codeparrot_training - Step 33581: {'lr': 0.00044589809031483517, 'samples': 17193984, 'steps': 33581, 'loss/train': 0.8934062719345093} +03/05/2022 04:55:50 - INFO - codeparrot_training - Skipping example with length 478 (seq_length=1024) +03/05/2022 04:55:54 - INFO - codeparrot_training - Step 33582: {'lr': 0.0004458947933214592, 'samples': 17194496, 'steps': 33582, 'loss/train': 1.0886738300323486} +03/05/2022 04:55:57 - INFO - codeparrot_training - Step 33583: {'lr': 0.0004458914962398162, 'samples': 17195008, 'steps': 33583, 'loss/train': 1.9218090772628784} +03/05/2022 04:55:59 - INFO - codeparrot_training - Skipping example with length 474 (seq_length=1024) +03/05/2022 04:56:03 - INFO - codeparrot_training - Step 33584: {'lr': 0.0004458881990699074, 'samples': 17195520, 'steps': 33584, 'loss/train': 1.6360738277435303} +03/05/2022 04:56:06 - INFO - codeparrot_training - Step 33585: {'lr': 0.00044588490181173435, 'samples': 17196032, 'steps': 33585, 'loss/train': 2.3009421825408936} +03/05/2022 04:56:07 - INFO - codeparrot_training - Skipping example with length 980 (seq_length=1024) +03/05/2022 04:56:11 - INFO - codeparrot_training - Step 33586: {'lr': 0.0004458816044652987, 'samples': 17196544, 'steps': 33586, 'loss/train': 1.613369345664978} +03/05/2022 04:56:14 - INFO - codeparrot_training - Step 33587: {'lr': 0.00044587830703060176, 'samples': 17197056, 'steps': 33587, 'loss/train': 1.50320565700531} +03/05/2022 04:56:16 - INFO - codeparrot_training - Skipping example with length 262 (seq_length=1024) +03/05/2022 04:56:20 - INFO - codeparrot_training - Step 33588: {'lr': 0.00044587500950764514, 'samples': 17197568, 'steps': 33588, 'loss/train': 1.6947509050369263} +03/05/2022 04:56:23 - INFO - codeparrot_training - Step 33589: {'lr': 0.0004458717118964302, 'samples': 17198080, 'steps': 33589, 'loss/train': 1.8883278369903564} +03/05/2022 04:56:24 - INFO - codeparrot_training - Skipping example with length 259 (seq_length=1024) +03/05/2022 04:56:28 - INFO - codeparrot_training - Step 33590: {'lr': 0.0004458684141969585, 'samples': 17198592, 'steps': 33590, 'loss/train': 2.057932138442993} +03/05/2022 04:56:31 - INFO - codeparrot_training - Step 33591: {'lr': 0.0004458651164092315, 'samples': 17199104, 'steps': 33591, 'loss/train': 1.848440408706665} +03/05/2022 04:56:32 - INFO - codeparrot_training - Skipping example with length 461 (seq_length=1024) +03/05/2022 04:56:36 - INFO - codeparrot_training - Step 33592: {'lr': 0.00044586181853325076, 'samples': 17199616, 'steps': 33592, 'loss/train': 1.581458330154419} +03/05/2022 04:56:40 - INFO - codeparrot_training - Step 33593: {'lr': 0.0004458585205690177, 'samples': 17200128, 'steps': 33593, 'loss/train': 1.6954840421676636} +03/05/2022 04:56:40 - INFO - codeparrot_training - Skipping example with length 30 (seq_length=1024) +03/05/2022 04:56:45 - INFO - codeparrot_training - Step 33594: {'lr': 0.0004458552225165338, 'samples': 17200640, 'steps': 33594, 'loss/train': 1.615804672241211} +03/05/2022 04:56:48 - INFO - codeparrot_training - Step 33595: {'lr': 0.00044585192437580044, 'samples': 17201152, 'steps': 33595, 'loss/train': 1.721587061882019} +03/05/2022 04:56:49 - INFO - codeparrot_training - Skipping example with length 988 (seq_length=1024) +03/05/2022 04:56:53 - INFO - codeparrot_training - Step 33596: {'lr': 0.0004458486261468194, 'samples': 17201664, 'steps': 33596, 'loss/train': 2.47548246383667} +03/05/2022 04:56:56 - INFO - codeparrot_training - Step 33597: {'lr': 0.0004458453278295919, 'samples': 17202176, 'steps': 33597, 'loss/train': 1.5795776844024658} +03/05/2022 04:56:57 - INFO - codeparrot_training - Skipping example with length 837 (seq_length=1024) +03/05/2022 04:57:02 - INFO - codeparrot_training - Step 33598: {'lr': 0.00044584202942411956, 'samples': 17202688, 'steps': 33598, 'loss/train': 0.5867262482643127} +03/05/2022 04:57:05 - INFO - codeparrot_training - Step 33599: {'lr': 0.00044583873093040376, 'samples': 17203200, 'steps': 33599, 'loss/train': 1.1657555103302002} +03/05/2022 04:57:06 - INFO - codeparrot_training - Skipping example with length 223 (seq_length=1024) +03/05/2022 04:57:10 - INFO - codeparrot_training - Step 33600: {'lr': 0.00044583543234844616, 'samples': 17203712, 'steps': 33600, 'loss/train': 1.5614173412322998} +03/05/2022 04:57:13 - INFO - codeparrot_training - Step 33601: {'lr': 0.00044583213367824806, 'samples': 17204224, 'steps': 33601, 'loss/train': 1.2548081874847412} +03/05/2022 04:57:14 - INFO - codeparrot_training - Skipping example with length 765 (seq_length=1024) +03/05/2022 04:57:19 - INFO - codeparrot_training - Step 33602: {'lr': 0.00044582883491981097, 'samples': 17204736, 'steps': 33602, 'loss/train': 1.2465648651123047} +03/05/2022 04:57:22 - INFO - codeparrot_training - Step 33603: {'lr': 0.0004458255360731365, 'samples': 17205248, 'steps': 33603, 'loss/train': 6.62829065322876} +03/05/2022 04:57:23 - INFO - codeparrot_training - Skipping example with length 222 (seq_length=1024) +03/05/2022 04:57:27 - INFO - codeparrot_training - Step 33604: {'lr': 0.00044582223713822606, 'samples': 17205760, 'steps': 33604, 'loss/train': 1.3546030521392822} +03/05/2022 04:57:30 - INFO - codeparrot_training - Step 33605: {'lr': 0.0004458189381150811, 'samples': 17206272, 'steps': 33605, 'loss/train': 0.9507414698600769} +03/05/2022 04:57:32 - INFO - codeparrot_training - Skipping example with length 408 (seq_length=1024) +03/05/2022 04:57:35 - INFO - codeparrot_training - Step 33606: {'lr': 0.00044581563900370326, 'samples': 17206784, 'steps': 33606, 'loss/train': 1.8144936561584473} +03/05/2022 04:57:39 - INFO - codeparrot_training - Step 33607: {'lr': 0.0004458123398040938, 'samples': 17207296, 'steps': 33607, 'loss/train': 1.7711725234985352} +03/05/2022 04:57:40 - INFO - codeparrot_training - Skipping example with length 838 (seq_length=1024) +03/05/2022 04:57:44 - INFO - codeparrot_training - Step 33608: {'lr': 0.0004458090405162544, 'samples': 17207808, 'steps': 33608, 'loss/train': 2.3273074626922607} +03/05/2022 04:57:47 - INFO - codeparrot_training - Step 33609: {'lr': 0.0004458057411401864, 'samples': 17208320, 'steps': 33609, 'loss/train': 1.1190072298049927} +03/05/2022 04:57:48 - INFO - codeparrot_training - Skipping example with length 263 (seq_length=1024) +03/05/2022 04:57:52 - INFO - codeparrot_training - Step 33610: {'lr': 0.00044580244167589136, 'samples': 17208832, 'steps': 33610, 'loss/train': 1.1245813369750977} +03/05/2022 04:57:55 - INFO - codeparrot_training - Step 33611: {'lr': 0.00044579914212337083, 'samples': 17209344, 'steps': 33611, 'loss/train': 1.9975531101226807} +03/05/2022 04:57:57 - INFO - codeparrot_training - Skipping example with length 371 (seq_length=1024) +03/05/2022 04:58:01 - INFO - codeparrot_training - Step 33612: {'lr': 0.00044579584248262617, 'samples': 17209856, 'steps': 33612, 'loss/train': 0.705410361289978} +03/05/2022 04:58:04 - INFO - codeparrot_training - Step 33613: {'lr': 0.0004457925427536589, 'samples': 17210368, 'steps': 33613, 'loss/train': 0.8843287229537964} +03/05/2022 04:58:05 - INFO - codeparrot_training - Skipping example with length 788 (seq_length=1024) +03/05/2022 04:58:09 - INFO - codeparrot_training - Step 33614: {'lr': 0.0004457892429364706, 'samples': 17210880, 'steps': 33614, 'loss/train': 3.421769142150879} +03/05/2022 04:58:12 - INFO - codeparrot_training - Step 33615: {'lr': 0.00044578594303106266, 'samples': 17211392, 'steps': 33615, 'loss/train': 2.469468116760254} +03/05/2022 04:58:14 - INFO - codeparrot_training - Skipping example with length 278 (seq_length=1024) +03/05/2022 04:58:18 - INFO - codeparrot_training - Step 33616: {'lr': 0.00044578264303743654, 'samples': 17211904, 'steps': 33616, 'loss/train': 2.1370832920074463} +03/05/2022 04:58:21 - INFO - codeparrot_training - Step 33617: {'lr': 0.00044577934295559387, 'samples': 17212416, 'steps': 33617, 'loss/train': 1.5723105669021606} +03/05/2022 04:58:22 - INFO - codeparrot_training - Skipping example with length 557 (seq_length=1024) +03/05/2022 04:58:26 - INFO - codeparrot_training - Step 33618: {'lr': 0.000445776042785536, 'samples': 17212928, 'steps': 33618, 'loss/train': 1.4440356492996216} +03/05/2022 04:58:29 - INFO - codeparrot_training - Step 33619: {'lr': 0.00044577274252726454, 'samples': 17213440, 'steps': 33619, 'loss/train': 2.382261276245117} +03/05/2022 04:58:30 - INFO - codeparrot_training - Skipping example with length 303 (seq_length=1024) +03/05/2022 04:58:34 - INFO - codeparrot_training - Step 33620: {'lr': 0.00044576944218078075, 'samples': 17213952, 'steps': 33620, 'loss/train': 2.131185293197632} +03/05/2022 04:58:38 - INFO - codeparrot_training - Step 33621: {'lr': 0.00044576614174608644, 'samples': 17214464, 'steps': 33621, 'loss/train': 0.9500150680541992} +03/05/2022 04:58:39 - INFO - codeparrot_training - Skipping example with length 106 (seq_length=1024) +03/05/2022 04:58:43 - INFO - codeparrot_training - Step 33622: {'lr': 0.0004457628412231828, 'samples': 17214976, 'steps': 33622, 'loss/train': 1.390385627746582} +03/05/2022 04:58:46 - INFO - codeparrot_training - Step 33623: {'lr': 0.0004457595406120715, 'samples': 17215488, 'steps': 33623, 'loss/train': 0.5399864315986633} +03/05/2022 04:58:47 - INFO - codeparrot_training - Skipping example with length 576 (seq_length=1024) +03/05/2022 04:58:51 - INFO - codeparrot_training - Step 33624: {'lr': 0.000445756239912754, 'samples': 17216000, 'steps': 33624, 'loss/train': 1.595068335533142} +03/05/2022 04:58:54 - INFO - codeparrot_training - Step 33625: {'lr': 0.00044575293912523173, 'samples': 17216512, 'steps': 33625, 'loss/train': 1.950323462486267} +03/05/2022 04:58:55 - INFO - codeparrot_training - Skipping example with length 868 (seq_length=1024) +03/05/2022 04:59:00 - INFO - codeparrot_training - Step 33626: {'lr': 0.0004457496382495062, 'samples': 17217024, 'steps': 33626, 'loss/train': 1.7496206760406494} +03/05/2022 04:59:03 - INFO - codeparrot_training - Step 33627: {'lr': 0.00044574633728557887, 'samples': 17217536, 'steps': 33627, 'loss/train': 1.1294909715652466} +03/05/2022 04:59:04 - INFO - codeparrot_training - Skipping example with length 981 (seq_length=1024) +03/05/2022 04:59:08 - INFO - codeparrot_training - Step 33628: {'lr': 0.0004457430362334513, 'samples': 17218048, 'steps': 33628, 'loss/train': 1.6096266508102417} +03/05/2022 04:59:11 - INFO - codeparrot_training - Step 33629: {'lr': 0.00044573973509312494, 'samples': 17218560, 'steps': 33629, 'loss/train': 1.583948016166687} +03/05/2022 04:59:12 - INFO - codeparrot_training - Skipping example with length 451 (seq_length=1024) +03/05/2022 04:59:16 - INFO - codeparrot_training - Step 33630: {'lr': 0.00044573643386460127, 'samples': 17219072, 'steps': 33630, 'loss/train': 1.1936426162719727} +03/05/2022 04:59:20 - INFO - codeparrot_training - Step 33631: {'lr': 0.00044573313254788176, 'samples': 17219584, 'steps': 33631, 'loss/train': 1.6899062395095825} +03/05/2022 04:59:20 - INFO - codeparrot_training - Skipping example with length 279 (seq_length=1024) +03/05/2022 04:59:25 - INFO - codeparrot_training - Step 33632: {'lr': 0.00044572983114296794, 'samples': 17220096, 'steps': 33632, 'loss/train': 0.1501224786043167} +03/05/2022 04:59:28 - INFO - codeparrot_training - Step 33633: {'lr': 0.00044572652964986126, 'samples': 17220608, 'steps': 33633, 'loss/train': 2.015028953552246} +03/05/2022 04:59:29 - INFO - codeparrot_training - Skipping example with length 339 (seq_length=1024) +03/05/2022 04:59:33 - INFO - codeparrot_training - Step 33634: {'lr': 0.0004457232280685633, 'samples': 17221120, 'steps': 33634, 'loss/train': 0.7074772119522095} +03/05/2022 04:59:37 - INFO - codeparrot_training - Step 33635: {'lr': 0.0004457199263990754, 'samples': 17221632, 'steps': 33635, 'loss/train': 1.3326743841171265} +03/05/2022 04:59:37 - INFO - codeparrot_training - Skipping example with length 752 (seq_length=1024) +03/05/2022 04:59:42 - INFO - codeparrot_training - Step 33636: {'lr': 0.0004457166246413992, 'samples': 17222144, 'steps': 33636, 'loss/train': 1.376373052597046} +03/05/2022 04:59:45 - INFO - codeparrot_training - Step 33637: {'lr': 0.000445713322795536, 'samples': 17222656, 'steps': 33637, 'loss/train': 2.1918740272521973} +03/05/2022 04:59:46 - INFO - codeparrot_training - Skipping example with length 75 (seq_length=1024) +03/05/2022 04:59:50 - INFO - codeparrot_training - Step 33638: {'lr': 0.0004457100208614875, 'samples': 17223168, 'steps': 33638, 'loss/train': 2.098397970199585} +03/05/2022 04:59:54 - INFO - codeparrot_training - Step 33639: {'lr': 0.00044570671883925497, 'samples': 17223680, 'steps': 33639, 'loss/train': 1.5802254676818848} +03/05/2022 04:59:54 - INFO - codeparrot_training - Skipping example with length 211 (seq_length=1024) +03/05/2022 04:59:59 - INFO - codeparrot_training - Step 33640: {'lr': 0.00044570341672884006, 'samples': 17224192, 'steps': 33640, 'loss/train': 1.905474305152893} +03/05/2022 05:00:02 - INFO - codeparrot_training - Step 33641: {'lr': 0.0004457001145302443, 'samples': 17224704, 'steps': 33641, 'loss/train': 1.2486696243286133} +03/05/2022 05:00:03 - INFO - codeparrot_training - Skipping example with length 91 (seq_length=1024) +03/05/2022 05:00:07 - INFO - codeparrot_training - Step 33642: {'lr': 0.00044569681224346897, 'samples': 17225216, 'steps': 33642, 'loss/train': 1.3094062805175781} +03/05/2022 05:00:11 - INFO - codeparrot_training - Step 33643: {'lr': 0.0004456935098685158, 'samples': 17225728, 'steps': 33643, 'loss/train': 1.9922659397125244} +03/05/2022 05:00:11 - INFO - codeparrot_training - Skipping example with length 618 (seq_length=1024) +03/05/2022 05:00:16 - INFO - codeparrot_training - Step 33644: {'lr': 0.000445690207405386, 'samples': 17226240, 'steps': 33644, 'loss/train': 1.4570302963256836} +03/05/2022 05:00:19 - INFO - codeparrot_training - Step 33645: {'lr': 0.00044568690485408125, 'samples': 17226752, 'steps': 33645, 'loss/train': 0.9996280074119568} +03/05/2022 05:00:19 - INFO - codeparrot_training - Skipping example with length 448 (seq_length=1024) +03/05/2022 05:00:24 - INFO - codeparrot_training - Step 33646: {'lr': 0.0004456836022146031, 'samples': 17227264, 'steps': 33646, 'loss/train': 2.374741315841675} +03/05/2022 05:00:27 - INFO - codeparrot_training - Step 33647: {'lr': 0.00044568029948695287, 'samples': 17227776, 'steps': 33647, 'loss/train': 2.6301186084747314} +03/05/2022 05:00:27 - INFO - codeparrot_training - Skipping example with length 647 (seq_length=1024) +03/05/2022 05:00:33 - INFO - codeparrot_training - Step 33648: {'lr': 0.0004456769966711321, 'samples': 17228288, 'steps': 33648, 'loss/train': 2.1099252700805664} +03/05/2022 05:00:36 - INFO - codeparrot_training - Step 33649: {'lr': 0.00044567369376714226, 'samples': 17228800, 'steps': 33649, 'loss/train': 2.3198187351226807} +03/05/2022 05:00:36 - INFO - codeparrot_training - Skipping example with length 148 (seq_length=1024) +03/05/2022 05:00:41 - INFO - codeparrot_training - Step 33650: {'lr': 0.00044567039077498497, 'samples': 17229312, 'steps': 33650, 'loss/train': 1.2144025564193726} +03/05/2022 05:00:44 - INFO - codeparrot_training - Step 33651: {'lr': 0.00044566708769466155, 'samples': 17229824, 'steps': 33651, 'loss/train': 2.1446759700775146} +03/05/2022 05:00:44 - INFO - codeparrot_training - Skipping example with length 691 (seq_length=1024) +03/05/2022 05:00:50 - INFO - codeparrot_training - Step 33652: {'lr': 0.00044566378452617363, 'samples': 17230336, 'steps': 33652, 'loss/train': 1.5498212575912476} +03/05/2022 05:00:53 - INFO - codeparrot_training - Step 33653: {'lr': 0.0004456604812695226, 'samples': 17230848, 'steps': 33653, 'loss/train': 1.553038239479065} +03/05/2022 05:00:53 - INFO - codeparrot_training - Skipping example with length 312 (seq_length=1024) +03/05/2022 05:00:58 - INFO - codeparrot_training - Step 33654: {'lr': 0.0004456571779247099, 'samples': 17231360, 'steps': 33654, 'loss/train': 2.5553789138793945} +03/05/2022 05:01:01 - INFO - codeparrot_training - Step 33655: {'lr': 0.0004456538744917372, 'samples': 17231872, 'steps': 33655, 'loss/train': 1.6805498600006104} +03/05/2022 05:01:01 - INFO - codeparrot_training - Skipping example with length 482 (seq_length=1024) +03/05/2022 05:01:07 - INFO - codeparrot_training - Step 33656: {'lr': 0.0004456505709706059, 'samples': 17232384, 'steps': 33656, 'loss/train': 1.2175822257995605} +03/05/2022 05:01:10 - INFO - codeparrot_training - Step 33657: {'lr': 0.0004456472673613174, 'samples': 17232896, 'steps': 33657, 'loss/train': 1.2269105911254883} +03/05/2022 05:01:10 - INFO - codeparrot_training - Skipping example with length 221 (seq_length=1024) +03/05/2022 05:01:15 - INFO - codeparrot_training - Step 33658: {'lr': 0.00044564396366387327, 'samples': 17233408, 'steps': 33658, 'loss/train': 1.058402180671692} +03/05/2022 05:01:18 - INFO - codeparrot_training - Skipping example with length 75 (seq_length=1024) +03/05/2022 05:01:20 - INFO - codeparrot_training - Step 33659: {'lr': 0.000445640659878275, 'samples': 17233920, 'steps': 33659, 'loss/train': 1.510990858078003} +03/05/2022 05:01:24 - INFO - codeparrot_training - Step 33660: {'lr': 0.00044563735600452407, 'samples': 17234432, 'steps': 33660, 'loss/train': 1.5986733436584473} +03/05/2022 05:01:26 - INFO - codeparrot_training - Skipping example with length 384 (seq_length=1024) +03/05/2022 05:01:29 - INFO - codeparrot_training - Step 33661: {'lr': 0.000445634052042622, 'samples': 17234944, 'steps': 33661, 'loss/train': 2.0537829399108887} +03/05/2022 05:01:32 - INFO - codeparrot_training - Step 33662: {'lr': 0.00044563074799257015, 'samples': 17235456, 'steps': 33662, 'loss/train': 1.6863192319869995} +03/05/2022 05:01:35 - INFO - codeparrot_training - Skipping example with length 732 (seq_length=1024) +03/05/2022 05:01:38 - INFO - codeparrot_training - Step 33663: {'lr': 0.0004456274438543702, 'samples': 17235968, 'steps': 33663, 'loss/train': 1.6375967264175415} +03/05/2022 05:01:41 - INFO - codeparrot_training - Step 33664: {'lr': 0.0004456241396280234, 'samples': 17236480, 'steps': 33664, 'loss/train': 1.3035353422164917} +03/05/2022 05:01:43 - INFO - codeparrot_training - Skipping example with length 264 (seq_length=1024) +03/05/2022 05:01:46 - INFO - codeparrot_training - Step 33665: {'lr': 0.00044562083531353154, 'samples': 17236992, 'steps': 33665, 'loss/train': 1.5329054594039917} +03/05/2022 05:01:49 - INFO - codeparrot_training - Step 33666: {'lr': 0.00044561753091089585, 'samples': 17237504, 'steps': 33666, 'loss/train': 1.654770016670227} +03/05/2022 05:01:52 - INFO - codeparrot_training - Skipping example with length 196 (seq_length=1024) +03/05/2022 05:01:55 - INFO - codeparrot_training - Step 33667: {'lr': 0.00044561422642011794, 'samples': 17238016, 'steps': 33667, 'loss/train': 1.2918373346328735} +03/05/2022 05:01:58 - INFO - codeparrot_training - Step 33668: {'lr': 0.00044561092184119933, 'samples': 17238528, 'steps': 33668, 'loss/train': 2.4394679069519043} +03/05/2022 05:02:01 - INFO - codeparrot_training - Skipping example with length 499 (seq_length=1024) +03/05/2022 05:02:03 - INFO - codeparrot_training - Step 33669: {'lr': 0.00044560761717414143, 'samples': 17239040, 'steps': 33669, 'loss/train': 1.4597721099853516} +03/05/2022 05:02:06 - INFO - codeparrot_training - Step 33670: {'lr': 0.0004456043124189458, 'samples': 17239552, 'steps': 33670, 'loss/train': 2.2803752422332764} +03/05/2022 05:02:09 - INFO - codeparrot_training - Step 33671: {'lr': 0.00044560100757561386, 'samples': 17240064, 'steps': 33671, 'loss/train': 1.3685790300369263} +03/05/2022 05:02:09 - INFO - codeparrot_training - Skipping example with length 878 (seq_length=1024) +03/05/2022 05:02:15 - INFO - codeparrot_training - Step 33672: {'lr': 0.000445597702644147, 'samples': 17240576, 'steps': 33672, 'loss/train': 2.761289596557617} +03/05/2022 05:02:18 - INFO - codeparrot_training - Skipping example with length 403 (seq_length=1024) +03/05/2022 05:02:20 - INFO - codeparrot_training - Step 33673: {'lr': 0.000445594397624547, 'samples': 17241088, 'steps': 33673, 'loss/train': 0.3266843855381012} +03/05/2022 05:02:23 - INFO - codeparrot_training - Step 33674: {'lr': 0.0004455910925168151, 'samples': 17241600, 'steps': 33674, 'loss/train': 2.0801889896392822} +03/05/2022 05:02:26 - INFO - codeparrot_training - Step 33675: {'lr': 0.0004455877873209529, 'samples': 17242112, 'steps': 33675, 'loss/train': 1.4737094640731812} +03/05/2022 05:02:26 - INFO - codeparrot_training - Skipping example with length 805 (seq_length=1024) +03/05/2022 05:02:32 - INFO - codeparrot_training - Step 33676: {'lr': 0.00044558448203696184, 'samples': 17242624, 'steps': 33676, 'loss/train': 1.157250165939331} +03/05/2022 05:02:35 - INFO - codeparrot_training - Step 33677: {'lr': 0.0004455811766648434, 'samples': 17243136, 'steps': 33677, 'loss/train': 1.2672345638275146} +03/05/2022 05:02:35 - INFO - codeparrot_training - Skipping example with length 41 (seq_length=1024) +03/05/2022 05:02:40 - INFO - codeparrot_training - Step 33678: {'lr': 0.0004455778712045992, 'samples': 17243648, 'steps': 33678, 'loss/train': 1.787611722946167} +03/05/2022 05:02:44 - INFO - codeparrot_training - Step 33679: {'lr': 0.0004455745656562306, 'samples': 17244160, 'steps': 33679, 'loss/train': 1.708083152770996} +03/05/2022 05:02:44 - INFO - codeparrot_training - Skipping example with length 404 (seq_length=1024) +03/05/2022 05:02:49 - INFO - codeparrot_training - Step 33680: {'lr': 0.000445571260019739, 'samples': 17244672, 'steps': 33680, 'loss/train': 1.9811404943466187} +03/05/2022 05:02:52 - INFO - codeparrot_training - Skipping example with length 720 (seq_length=1024) +03/05/2022 05:02:54 - INFO - codeparrot_training - Step 33681: {'lr': 0.00044556795429512617, 'samples': 17245184, 'steps': 33681, 'loss/train': 1.4627286195755005} +03/05/2022 05:02:57 - INFO - codeparrot_training - Step 33682: {'lr': 0.0004455646484823933, 'samples': 17245696, 'steps': 33682, 'loss/train': 1.8636199235916138} +03/05/2022 05:03:00 - INFO - codeparrot_training - Skipping example with length 141 (seq_length=1024) +03/05/2022 05:03:03 - INFO - codeparrot_training - Step 33683: {'lr': 0.00044556134258154215, 'samples': 17246208, 'steps': 33683, 'loss/train': 1.9720185995101929} +03/05/2022 05:03:06 - INFO - codeparrot_training - Step 33684: {'lr': 0.000445558036592574, 'samples': 17246720, 'steps': 33684, 'loss/train': 1.9168349504470825} +03/05/2022 05:03:09 - INFO - codeparrot_training - Skipping example with length 917 (seq_length=1024) +03/05/2022 05:03:11 - INFO - codeparrot_training - Step 33685: {'lr': 0.0004455547305154904, 'samples': 17247232, 'steps': 33685, 'loss/train': 1.6605573892593384} +03/05/2022 05:03:14 - INFO - codeparrot_training - Step 33686: {'lr': 0.00044555142435029284, 'samples': 17247744, 'steps': 33686, 'loss/train': 1.5331995487213135} +03/05/2022 05:03:17 - INFO - codeparrot_training - Skipping example with length 254 (seq_length=1024) +03/05/2022 05:03:19 - INFO - codeparrot_training - Step 33687: {'lr': 0.0004455481180969829, 'samples': 17248256, 'steps': 33687, 'loss/train': 1.9314182996749878} +03/05/2022 05:03:23 - INFO - codeparrot_training - Step 33688: {'lr': 0.00044554481175556194, 'samples': 17248768, 'steps': 33688, 'loss/train': 1.829451084136963} +03/05/2022 05:03:25 - INFO - codeparrot_training - Skipping example with length 768 (seq_length=1024) +03/05/2022 05:03:28 - INFO - codeparrot_training - Step 33689: {'lr': 0.00044554150532603154, 'samples': 17249280, 'steps': 33689, 'loss/train': 1.144074559211731} +03/05/2022 05:03:31 - INFO - codeparrot_training - Step 33690: {'lr': 0.00044553819880839313, 'samples': 17249792, 'steps': 33690, 'loss/train': 0.22657983005046844} +03/05/2022 05:03:34 - INFO - codeparrot_training - Skipping example with length 663 (seq_length=1024) +03/05/2022 05:03:36 - INFO - codeparrot_training - Step 33691: {'lr': 0.0004455348922026483, 'samples': 17250304, 'steps': 33691, 'loss/train': 1.9718066453933716} +03/05/2022 05:03:40 - INFO - codeparrot_training - Step 33692: {'lr': 0.00044553158550879833, 'samples': 17250816, 'steps': 33692, 'loss/train': 1.3945564031600952} +03/05/2022 05:03:42 - INFO - codeparrot_training - Skipping example with length 41 (seq_length=1024) +03/05/2022 05:03:45 - INFO - codeparrot_training - Step 33693: {'lr': 0.00044552827872684493, 'samples': 17251328, 'steps': 33693, 'loss/train': 1.8999449014663696} +03/05/2022 05:03:48 - INFO - codeparrot_training - Step 33694: {'lr': 0.00044552497185678953, 'samples': 17251840, 'steps': 33694, 'loss/train': 1.8301559686660767} +03/05/2022 05:03:51 - INFO - codeparrot_training - Step 33695: {'lr': 0.00044552166489863354, 'samples': 17252352, 'steps': 33695, 'loss/train': 1.7804909944534302} +03/05/2022 05:03:52 - INFO - codeparrot_training - Skipping example with length 316 (seq_length=1024) +03/05/2022 05:03:57 - INFO - codeparrot_training - Step 33696: {'lr': 0.0004455183578523785, 'samples': 17252864, 'steps': 33696, 'loss/train': 2.107941150665283} +03/05/2022 05:04:00 - INFO - codeparrot_training - Step 33697: {'lr': 0.00044551505071802587, 'samples': 17253376, 'steps': 33697, 'loss/train': 1.8297739028930664} +03/05/2022 05:04:00 - INFO - codeparrot_training - Skipping example with length 274 (seq_length=1024) +03/05/2022 05:04:05 - INFO - codeparrot_training - Step 33698: {'lr': 0.00044551174349557733, 'samples': 17253888, 'steps': 33698, 'loss/train': 1.0970057249069214} +03/05/2022 05:04:08 - INFO - codeparrot_training - Step 33699: {'lr': 0.0004455084361850341, 'samples': 17254400, 'steps': 33699, 'loss/train': 1.9417939186096191} +03/05/2022 05:04:09 - INFO - codeparrot_training - Skipping example with length 155 (seq_length=1024) +03/05/2022 05:04:14 - INFO - codeparrot_training - Step 33700: {'lr': 0.00044550512878639784, 'samples': 17254912, 'steps': 33700, 'loss/train': 1.7972487211227417} +03/05/2022 05:04:17 - INFO - codeparrot_training - Step 33701: {'lr': 0.0004455018212996699, 'samples': 17255424, 'steps': 33701, 'loss/train': 2.2850606441497803} +03/05/2022 05:04:17 - INFO - codeparrot_training - Skipping example with length 123 (seq_length=1024) +03/05/2022 05:04:22 - INFO - codeparrot_training - Step 33702: {'lr': 0.0004454985137248519, 'samples': 17255936, 'steps': 33702, 'loss/train': 1.8021314144134521} +03/05/2022 05:04:25 - INFO - codeparrot_training - Step 33703: {'lr': 0.00044549520606194525, 'samples': 17256448, 'steps': 33703, 'loss/train': 1.2692856788635254} +03/05/2022 05:04:25 - INFO - codeparrot_training - Skipping example with length 80 (seq_length=1024) +03/05/2022 05:04:31 - INFO - codeparrot_training - Step 33704: {'lr': 0.00044549189831095157, 'samples': 17256960, 'steps': 33704, 'loss/train': 1.375137209892273} +03/05/2022 05:04:34 - INFO - codeparrot_training - Step 33705: {'lr': 0.0004454885904718722, 'samples': 17257472, 'steps': 33705, 'loss/train': 1.8190932273864746} +03/05/2022 05:04:34 - INFO - codeparrot_training - Skipping example with length 572 (seq_length=1024) +03/05/2022 05:04:39 - INFO - codeparrot_training - Step 33706: {'lr': 0.0004454852825447087, 'samples': 17257984, 'steps': 33706, 'loss/train': 1.2892558574676514} +03/05/2022 05:04:42 - INFO - codeparrot_training - Step 33707: {'lr': 0.0004454819745294625, 'samples': 17258496, 'steps': 33707, 'loss/train': 1.6673616170883179} +03/05/2022 05:04:42 - INFO - codeparrot_training - Skipping example with length 267 (seq_length=1024) +03/05/2022 05:04:47 - INFO - codeparrot_training - Step 33708: {'lr': 0.0004454786664261352, 'samples': 17259008, 'steps': 33708, 'loss/train': 2.1652064323425293} +03/05/2022 05:04:51 - INFO - codeparrot_training - Step 33709: {'lr': 0.0004454753582347282, 'samples': 17259520, 'steps': 33709, 'loss/train': 2.2581276893615723} +03/05/2022 05:04:51 - INFO - codeparrot_training - Skipping example with length 464 (seq_length=1024) +03/05/2022 05:04:56 - INFO - codeparrot_training - Step 33710: {'lr': 0.00044547204995524305, 'samples': 17260032, 'steps': 33710, 'loss/train': 1.7837741374969482} +03/05/2022 05:04:59 - INFO - codeparrot_training - Step 33711: {'lr': 0.00044546874158768115, 'samples': 17260544, 'steps': 33711, 'loss/train': 0.9483580589294434} +03/05/2022 05:05:00 - INFO - codeparrot_training - Skipping example with length 673 (seq_length=1024) +03/05/2022 05:05:05 - INFO - codeparrot_training - Step 33712: {'lr': 0.00044546543313204415, 'samples': 17261056, 'steps': 33712, 'loss/train': 1.9283761978149414} +03/05/2022 05:05:08 - INFO - codeparrot_training - Step 33713: {'lr': 0.00044546212458833334, 'samples': 17261568, 'steps': 33713, 'loss/train': 0.5830368995666504} +03/05/2022 05:05:08 - INFO - codeparrot_training - Skipping example with length 369 (seq_length=1024) +03/05/2022 05:05:13 - INFO - codeparrot_training - Step 33714: {'lr': 0.00044545881595655035, 'samples': 17262080, 'steps': 33714, 'loss/train': 1.3765771389007568} +03/05/2022 05:05:16 - INFO - codeparrot_training - Step 33715: {'lr': 0.00044545550723669664, 'samples': 17262592, 'steps': 33715, 'loss/train': 1.6600160598754883} +03/05/2022 05:05:17 - INFO - codeparrot_training - Skipping example with length 200 (seq_length=1024) +03/05/2022 05:05:22 - INFO - codeparrot_training - Step 33716: {'lr': 0.00044545219842877373, 'samples': 17263104, 'steps': 33716, 'loss/train': 1.7852420806884766} +03/05/2022 05:05:25 - INFO - codeparrot_training - Step 33717: {'lr': 0.000445448889532783, 'samples': 17263616, 'steps': 33717, 'loss/train': 1.0261931419372559} +03/05/2022 05:05:26 - INFO - codeparrot_training - Skipping example with length 56 (seq_length=1024) +03/05/2022 05:05:30 - INFO - codeparrot_training - Step 33718: {'lr': 0.0004454455805487261, 'samples': 17264128, 'steps': 33718, 'loss/train': 1.9580744504928589} +03/05/2022 05:05:33 - INFO - codeparrot_training - Step 33719: {'lr': 0.0004454422714766043, 'samples': 17264640, 'steps': 33719, 'loss/train': 0.932378888130188} +03/05/2022 05:05:34 - INFO - codeparrot_training - Skipping example with length 74 (seq_length=1024) +03/05/2022 05:05:39 - INFO - codeparrot_training - Step 33720: {'lr': 0.00044543896231641935, 'samples': 17265152, 'steps': 33720, 'loss/train': 1.8244143724441528} +03/05/2022 05:05:42 - INFO - codeparrot_training - Step 33721: {'lr': 0.00044543565306817256, 'samples': 17265664, 'steps': 33721, 'loss/train': 1.4012575149536133} +03/05/2022 05:05:42 - INFO - codeparrot_training - Skipping example with length 489 (seq_length=1024) +03/05/2022 05:05:47 - INFO - codeparrot_training - Step 33722: {'lr': 0.00044543234373186556, 'samples': 17266176, 'steps': 33722, 'loss/train': 1.9865909814834595} +03/05/2022 05:05:50 - INFO - codeparrot_training - Step 33723: {'lr': 0.0004454290343074997, 'samples': 17266688, 'steps': 33723, 'loss/train': 1.8939869403839111} +03/05/2022 05:05:51 - INFO - codeparrot_training - Skipping example with length 324 (seq_length=1024) +03/05/2022 05:05:56 - INFO - codeparrot_training - Step 33724: {'lr': 0.00044542572479507655, 'samples': 17267200, 'steps': 33724, 'loss/train': 1.3141834735870361} +03/05/2022 05:05:59 - INFO - codeparrot_training - Step 33725: {'lr': 0.00044542241519459757, 'samples': 17267712, 'steps': 33725, 'loss/train': 0.9781323075294495} +03/05/2022 05:05:59 - INFO - codeparrot_training - Skipping example with length 72 (seq_length=1024) +03/05/2022 05:06:04 - INFO - codeparrot_training - Step 33726: {'lr': 0.0004454191055060643, 'samples': 17268224, 'steps': 33726, 'loss/train': 0.10506538301706314} +03/05/2022 05:06:07 - INFO - codeparrot_training - Step 33727: {'lr': 0.00044541579572947814, 'samples': 17268736, 'steps': 33727, 'loss/train': 0.9335793852806091} +03/05/2022 05:06:07 - INFO - codeparrot_training - Skipping example with length 537 (seq_length=1024) +03/05/2022 05:06:12 - INFO - codeparrot_training - Step 33728: {'lr': 0.0004454124858648407, 'samples': 17269248, 'steps': 33728, 'loss/train': 2.2470526695251465} +03/05/2022 05:06:15 - INFO - codeparrot_training - Step 33729: {'lr': 0.00044540917591215335, 'samples': 17269760, 'steps': 33729, 'loss/train': 2.5497844219207764} +03/05/2022 05:06:16 - INFO - codeparrot_training - Skipping example with length 479 (seq_length=1024) +03/05/2022 05:06:21 - INFO - codeparrot_training - Step 33730: {'lr': 0.0004454058658714177, 'samples': 17270272, 'steps': 33730, 'loss/train': 1.4950462579727173} +03/05/2022 05:06:24 - INFO - codeparrot_training - Step 33731: {'lr': 0.0004454025557426351, 'samples': 17270784, 'steps': 33731, 'loss/train': 1.3171472549438477} +03/05/2022 05:06:24 - INFO - codeparrot_training - Skipping example with length 171 (seq_length=1024) +03/05/2022 05:06:29 - INFO - codeparrot_training - Step 33732: {'lr': 0.00044539924552580723, 'samples': 17271296, 'steps': 33732, 'loss/train': 1.650871992111206} +03/05/2022 05:06:32 - INFO - codeparrot_training - Step 33733: {'lr': 0.0004453959352209354, 'samples': 17271808, 'steps': 33733, 'loss/train': 2.8467471599578857} +03/05/2022 05:06:33 - INFO - codeparrot_training - Skipping example with length 868 (seq_length=1024) +03/05/2022 05:06:38 - INFO - codeparrot_training - Step 33734: {'lr': 0.0004453926248280212, 'samples': 17272320, 'steps': 33734, 'loss/train': 2.093609571456909} +03/05/2022 05:06:41 - INFO - codeparrot_training - Step 33735: {'lr': 0.0004453893143470661, 'samples': 17272832, 'steps': 33735, 'loss/train': 1.088821291923523} +03/05/2022 05:06:41 - INFO - codeparrot_training - Skipping example with length 287 (seq_length=1024) +03/05/2022 05:06:46 - INFO - codeparrot_training - Step 33736: {'lr': 0.0004453860037780716, 'samples': 17273344, 'steps': 33736, 'loss/train': 1.8031758069992065} +03/05/2022 05:06:49 - INFO - codeparrot_training - Step 33737: {'lr': 0.00044538269312103916, 'samples': 17273856, 'steps': 33737, 'loss/train': 1.9554144144058228} +03/05/2022 05:06:50 - INFO - codeparrot_training - Skipping example with length 497 (seq_length=1024) +03/05/2022 05:06:55 - INFO - codeparrot_training - Step 33738: {'lr': 0.00044537938237597033, 'samples': 17274368, 'steps': 33738, 'loss/train': 1.7630200386047363} +03/05/2022 05:06:58 - INFO - codeparrot_training - Step 33739: {'lr': 0.00044537607154286645, 'samples': 17274880, 'steps': 33739, 'loss/train': 1.7588212490081787} +03/05/2022 05:06:58 - INFO - codeparrot_training - Skipping example with length 931 (seq_length=1024) +03/05/2022 05:07:03 - INFO - codeparrot_training - Step 33740: {'lr': 0.00044537276062172926, 'samples': 17275392, 'steps': 33740, 'loss/train': 0.8729655742645264} +03/05/2022 05:07:06 - INFO - codeparrot_training - Step 33741: {'lr': 0.0004453694496125601, 'samples': 17275904, 'steps': 33741, 'loss/train': 1.7710518836975098} +03/05/2022 05:07:07 - INFO - codeparrot_training - Skipping example with length 797 (seq_length=1024) +03/05/2022 05:07:11 - INFO - codeparrot_training - Step 33742: {'lr': 0.0004453661385153604, 'samples': 17276416, 'steps': 33742, 'loss/train': 1.3548460006713867} +03/05/2022 05:07:15 - INFO - codeparrot_training - Step 33743: {'lr': 0.0004453628273301318, 'samples': 17276928, 'steps': 33743, 'loss/train': 2.101663112640381} +03/05/2022 05:07:15 - INFO - codeparrot_training - Skipping example with length 474 (seq_length=1024) +03/05/2022 05:07:20 - INFO - codeparrot_training - Step 33744: {'lr': 0.0004453595160568757, 'samples': 17277440, 'steps': 33744, 'loss/train': 1.1055561304092407} +03/05/2022 05:07:23 - INFO - codeparrot_training - Step 33745: {'lr': 0.0004453562046955937, 'samples': 17277952, 'steps': 33745, 'loss/train': 1.6239638328552246} +03/05/2022 05:07:23 - INFO - codeparrot_training - Skipping example with length 589 (seq_length=1024) +03/05/2022 05:07:28 - INFO - codeparrot_training - Step 33746: {'lr': 0.00044535289324628704, 'samples': 17278464, 'steps': 33746, 'loss/train': 1.0564157962799072} +03/05/2022 05:07:31 - INFO - codeparrot_training - Step 33747: {'lr': 0.00044534958170895753, 'samples': 17278976, 'steps': 33747, 'loss/train': 2.8480093479156494} +03/05/2022 05:07:31 - INFO - codeparrot_training - Skipping example with length 453 (seq_length=1024) +03/05/2022 05:07:37 - INFO - codeparrot_training - Step 33748: {'lr': 0.0004453462700836064, 'samples': 17279488, 'steps': 33748, 'loss/train': 1.6007373332977295} +03/05/2022 05:07:39 - INFO - codeparrot_training - Skipping example with length 74 (seq_length=1024) +03/05/2022 05:07:42 - INFO - codeparrot_training - Step 33749: {'lr': 0.0004453429583702353, 'samples': 17280000, 'steps': 33749, 'loss/train': 1.042931079864502} +03/05/2022 05:07:45 - INFO - codeparrot_training - Step 33750: {'lr': 0.0004453396465688457, 'samples': 17280512, 'steps': 33750, 'loss/train': 1.9030508995056152} +03/05/2022 05:07:48 - INFO - codeparrot_training - Skipping example with length 189 (seq_length=1024) +03/05/2022 05:07:50 - INFO - codeparrot_training - Step 33751: {'lr': 0.00044533633467943906, 'samples': 17281024, 'steps': 33751, 'loss/train': 1.9037073850631714} +03/05/2022 05:07:53 - INFO - codeparrot_training - Step 33752: {'lr': 0.00044533302270201693, 'samples': 17281536, 'steps': 33752, 'loss/train': 2.302919387817383} +03/05/2022 05:07:56 - INFO - codeparrot_training - Skipping example with length 676 (seq_length=1024) +03/05/2022 05:07:59 - INFO - codeparrot_training - Step 33753: {'lr': 0.00044532971063658067, 'samples': 17282048, 'steps': 33753, 'loss/train': 0.705392599105835} +03/05/2022 05:08:02 - INFO - codeparrot_training - Step 33754: {'lr': 0.00044532639848313187, 'samples': 17282560, 'steps': 33754, 'loss/train': 1.4967677593231201} +03/05/2022 05:08:05 - INFO - codeparrot_training - Skipping example with length 810 (seq_length=1024) +03/05/2022 05:08:07 - INFO - codeparrot_training - Step 33755: {'lr': 0.0004453230862416721, 'samples': 17283072, 'steps': 33755, 'loss/train': 2.220360040664673} +03/05/2022 05:08:10 - INFO - codeparrot_training - Step 33756: {'lr': 0.00044531977391220267, 'samples': 17283584, 'steps': 33756, 'loss/train': 2.1588869094848633} +03/05/2022 05:08:13 - INFO - codeparrot_training - Skipping example with length 367 (seq_length=1024) +03/05/2022 05:08:16 - INFO - codeparrot_training - Step 33757: {'lr': 0.00044531646149472516, 'samples': 17284096, 'steps': 33757, 'loss/train': 1.6332528591156006} +03/05/2022 05:08:19 - INFO - codeparrot_training - Step 33758: {'lr': 0.00044531314898924116, 'samples': 17284608, 'steps': 33758, 'loss/train': 1.7397618293762207} +03/05/2022 05:08:22 - INFO - codeparrot_training - Step 33759: {'lr': 0.00044530983639575193, 'samples': 17285120, 'steps': 33759, 'loss/train': 1.399461030960083} +03/05/2022 05:08:22 - INFO - codeparrot_training - Skipping example with length 977 (seq_length=1024) +03/05/2022 05:08:27 - INFO - codeparrot_training - Step 33760: {'lr': 0.00044530652371425916, 'samples': 17285632, 'steps': 33760, 'loss/train': 2.4070591926574707} +03/05/2022 05:08:30 - INFO - codeparrot_training - Skipping example with length 636 (seq_length=1024) +03/05/2022 05:08:33 - INFO - codeparrot_training - Step 33761: {'lr': 0.00044530321094476434, 'samples': 17286144, 'steps': 33761, 'loss/train': 1.8661472797393799} +03/05/2022 05:08:36 - INFO - codeparrot_training - Step 33762: {'lr': 0.0004452998980872689, 'samples': 17286656, 'steps': 33762, 'loss/train': 1.3632087707519531} +03/05/2022 05:08:39 - INFO - codeparrot_training - Skipping example with length 325 (seq_length=1024) +03/05/2022 05:08:41 - INFO - codeparrot_training - Step 33763: {'lr': 0.0004452965851417743, 'samples': 17287168, 'steps': 33763, 'loss/train': 2.6672725677490234} +03/05/2022 05:08:44 - INFO - codeparrot_training - Step 33764: {'lr': 0.000445293272108282, 'samples': 17287680, 'steps': 33764, 'loss/train': 0.23788543045520782} +03/05/2022 05:08:47 - INFO - codeparrot_training - Skipping example with length 841 (seq_length=1024) +03/05/2022 05:08:50 - INFO - codeparrot_training - Step 33765: {'lr': 0.0004452899589867937, 'samples': 17288192, 'steps': 33765, 'loss/train': 1.3549383878707886} +03/05/2022 05:08:53 - INFO - codeparrot_training - Step 33766: {'lr': 0.00044528664577731073, 'samples': 17288704, 'steps': 33766, 'loss/train': 1.8650872707366943} +03/05/2022 05:08:55 - INFO - codeparrot_training - Skipping example with length 488 (seq_length=1024) +03/05/2022 05:08:58 - INFO - codeparrot_training - Step 33767: {'lr': 0.00044528333247983456, 'samples': 17289216, 'steps': 33767, 'loss/train': 1.3714998960494995} +03/05/2022 05:09:01 - INFO - codeparrot_training - Step 33768: {'lr': 0.0004452800190943667, 'samples': 17289728, 'steps': 33768, 'loss/train': 1.5167347192764282} +03/05/2022 05:09:04 - INFO - codeparrot_training - Skipping example with length 780 (seq_length=1024) +03/05/2022 05:09:07 - INFO - codeparrot_training - Step 33769: {'lr': 0.0004452767056209087, 'samples': 17290240, 'steps': 33769, 'loss/train': 1.6627153158187866} +03/05/2022 05:09:10 - INFO - codeparrot_training - Step 33770: {'lr': 0.0004452733920594621, 'samples': 17290752, 'steps': 33770, 'loss/train': 1.0002191066741943} +03/05/2022 05:09:13 - INFO - codeparrot_training - Step 33771: {'lr': 0.0004452700784100283, 'samples': 17291264, 'steps': 33771, 'loss/train': 0.8183153867721558} +03/05/2022 05:09:15 - INFO - codeparrot_training - Skipping example with length 143 (seq_length=1024) +03/05/2022 05:09:19 - INFO - codeparrot_training - Step 33772: {'lr': 0.0004452667646726088, 'samples': 17291776, 'steps': 33772, 'loss/train': 0.31996601819992065} +03/05/2022 05:09:22 - INFO - codeparrot_training - Step 33773: {'lr': 0.0004452634508472051, 'samples': 17292288, 'steps': 33773, 'loss/train': 2.0209522247314453} +03/05/2022 05:09:23 - INFO - codeparrot_training - Skipping example with length 570 (seq_length=1024) +03/05/2022 05:09:27 - INFO - codeparrot_training - Step 33774: {'lr': 0.0004452601369338187, 'samples': 17292800, 'steps': 33774, 'loss/train': 1.5735650062561035} +03/05/2022 05:09:30 - INFO - codeparrot_training - Step 33775: {'lr': 0.00044525682293245107, 'samples': 17293312, 'steps': 33775, 'loss/train': 2.001319169998169} +03/05/2022 05:09:32 - INFO - codeparrot_training - Skipping example with length 740 (seq_length=1024) +03/05/2022 05:09:36 - INFO - codeparrot_training - Step 33776: {'lr': 0.0004452535088431038, 'samples': 17293824, 'steps': 33776, 'loss/train': 1.1613801717758179} +03/05/2022 05:09:39 - INFO - codeparrot_training - Step 33777: {'lr': 0.00044525019466577824, 'samples': 17294336, 'steps': 33777, 'loss/train': 1.7528420686721802} +03/05/2022 05:09:40 - INFO - codeparrot_training - Skipping example with length 296 (seq_length=1024) +03/05/2022 05:09:44 - INFO - codeparrot_training - Step 33778: {'lr': 0.000445246880400476, 'samples': 17294848, 'steps': 33778, 'loss/train': 2.7505130767822266} +03/05/2022 05:09:47 - INFO - codeparrot_training - Step 33779: {'lr': 0.0004452435660471985, 'samples': 17295360, 'steps': 33779, 'loss/train': 1.506622076034546} +03/05/2022 05:09:49 - INFO - codeparrot_training - Skipping example with length 91 (seq_length=1024) +03/05/2022 05:09:53 - INFO - codeparrot_training - Step 33780: {'lr': 0.00044524025160594735, 'samples': 17295872, 'steps': 33780, 'loss/train': 2.2383944988250732} +03/05/2022 05:09:56 - INFO - codeparrot_training - Step 33781: {'lr': 0.00044523693707672384, 'samples': 17296384, 'steps': 33781, 'loss/train': 1.7786693572998047} +03/05/2022 05:09:57 - INFO - codeparrot_training - Skipping example with length 56 (seq_length=1024) +03/05/2022 05:10:01 - INFO - codeparrot_training - Step 33782: {'lr': 0.0004452336224595296, 'samples': 17296896, 'steps': 33782, 'loss/train': 1.6716578006744385} +03/05/2022 05:10:04 - INFO - codeparrot_training - Step 33783: {'lr': 0.00044523030775436617, 'samples': 17297408, 'steps': 33783, 'loss/train': 1.7751421928405762} +03/05/2022 05:10:06 - INFO - codeparrot_training - Skipping example with length 221 (seq_length=1024) +03/05/2022 05:10:09 - INFO - codeparrot_training - Step 33784: {'lr': 0.00044522699296123495, 'samples': 17297920, 'steps': 33784, 'loss/train': 2.1053643226623535} +03/05/2022 05:10:12 - INFO - codeparrot_training - Step 33785: {'lr': 0.0004452236780801374, 'samples': 17298432, 'steps': 33785, 'loss/train': 1.61186945438385} +03/05/2022 05:10:14 - INFO - codeparrot_training - Skipping example with length 792 (seq_length=1024) +03/05/2022 05:10:18 - INFO - codeparrot_training - Step 33786: {'lr': 0.00044522036311107514, 'samples': 17298944, 'steps': 33786, 'loss/train': 1.1602447032928467} +03/05/2022 05:10:21 - INFO - codeparrot_training - Step 33787: {'lr': 0.0004452170480540496, 'samples': 17299456, 'steps': 33787, 'loss/train': 1.4661749601364136} +03/05/2022 05:10:22 - INFO - codeparrot_training - Skipping example with length 240 (seq_length=1024) +03/05/2022 05:10:26 - INFO - codeparrot_training - Step 33788: {'lr': 0.0004452137329090622, 'samples': 17299968, 'steps': 33788, 'loss/train': 1.896278738975525} +03/05/2022 05:10:29 - INFO - codeparrot_training - Step 33789: {'lr': 0.0004452104176761146, 'samples': 17300480, 'steps': 33789, 'loss/train': 1.8350512981414795} +03/05/2022 05:10:30 - INFO - codeparrot_training - Skipping example with length 135 (seq_length=1024) +03/05/2022 05:10:34 - INFO - codeparrot_training - Step 33790: {'lr': 0.0004452071023552081, 'samples': 17300992, 'steps': 33790, 'loss/train': 1.6936326026916504} +03/05/2022 05:10:38 - INFO - codeparrot_training - Step 33791: {'lr': 0.0004452037869463443, 'samples': 17301504, 'steps': 33791, 'loss/train': 0.8472153544425964} +03/05/2022 05:10:39 - INFO - codeparrot_training - Skipping example with length 5 (seq_length=1024) +03/05/2022 05:10:43 - INFO - codeparrot_training - Step 33792: {'lr': 0.0004452004714495248, 'samples': 17302016, 'steps': 33792, 'loss/train': 1.3669425249099731} +03/05/2022 05:10:46 - INFO - codeparrot_training - Step 33793: {'lr': 0.00044519715586475083, 'samples': 17302528, 'steps': 33793, 'loss/train': 1.0535948276519775} +03/05/2022 05:10:47 - INFO - codeparrot_training - Skipping example with length 376 (seq_length=1024) +03/05/2022 05:10:51 - INFO - codeparrot_training - Step 33794: {'lr': 0.0004451938401920241, 'samples': 17303040, 'steps': 33794, 'loss/train': 2.0635149478912354} +03/05/2022 05:10:54 - INFO - codeparrot_training - Step 33795: {'lr': 0.0004451905244313461, 'samples': 17303552, 'steps': 33795, 'loss/train': 2.5287692546844482} +03/05/2022 05:10:55 - INFO - codeparrot_training - Skipping example with length 332 (seq_length=1024) +03/05/2022 05:11:00 - INFO - codeparrot_training - Step 33796: {'lr': 0.0004451872085827182, 'samples': 17304064, 'steps': 33796, 'loss/train': 2.070211410522461} +03/05/2022 05:11:03 - INFO - codeparrot_training - Step 33797: {'lr': 0.000445183892646142, 'samples': 17304576, 'steps': 33797, 'loss/train': 1.8657327890396118} +03/05/2022 05:11:03 - INFO - codeparrot_training - Skipping example with length 723 (seq_length=1024) +03/05/2022 05:11:08 - INFO - codeparrot_training - Step 33798: {'lr': 0.0004451805766216189, 'samples': 17305088, 'steps': 33798, 'loss/train': 1.003869891166687} +03/05/2022 05:11:11 - INFO - codeparrot_training - Step 33799: {'lr': 0.00044517726050915044, 'samples': 17305600, 'steps': 33799, 'loss/train': 1.5238442420959473} +03/05/2022 05:11:12 - INFO - codeparrot_training - Skipping example with length 994 (seq_length=1024) +03/05/2022 05:11:16 - INFO - codeparrot_training - Step 33800: {'lr': 0.0004451739443087381, 'samples': 17306112, 'steps': 33800, 'loss/train': 2.31925630569458} +03/05/2022 05:11:20 - INFO - codeparrot_training - Step 33801: {'lr': 0.0004451706280203834, 'samples': 17306624, 'steps': 33801, 'loss/train': 1.0048564672470093} +03/05/2022 05:11:20 - INFO - codeparrot_training - Skipping example with length 630 (seq_length=1024) +03/05/2022 05:11:25 - INFO - codeparrot_training - Step 33802: {'lr': 0.0004451673116440879, 'samples': 17307136, 'steps': 33802, 'loss/train': 1.9859715700149536} +03/05/2022 05:11:28 - INFO - codeparrot_training - Step 33803: {'lr': 0.00044516399517985296, 'samples': 17307648, 'steps': 33803, 'loss/train': 1.88052237033844} +03/05/2022 05:11:28 - INFO - codeparrot_training - Skipping example with length 17 (seq_length=1024) +03/05/2022 05:11:33 - INFO - codeparrot_training - Step 33804: {'lr': 0.00044516067862768015, 'samples': 17308160, 'steps': 33804, 'loss/train': 1.3802179098129272} +03/05/2022 05:11:37 - INFO - codeparrot_training - Step 33805: {'lr': 0.00044515736198757095, 'samples': 17308672, 'steps': 33805, 'loss/train': 1.5742433071136475} +03/05/2022 05:11:37 - INFO - codeparrot_training - Skipping example with length 782 (seq_length=1024) +03/05/2022 05:11:42 - INFO - codeparrot_training - Step 33806: {'lr': 0.0004451540452595268, 'samples': 17309184, 'steps': 33806, 'loss/train': 1.2189489603042603} +03/05/2022 05:11:45 - INFO - codeparrot_training - Step 33807: {'lr': 0.0004451507284435494, 'samples': 17309696, 'steps': 33807, 'loss/train': 1.7029753923416138} +03/05/2022 05:11:45 - INFO - codeparrot_training - Skipping example with length 357 (seq_length=1024) +03/05/2022 05:11:50 - INFO - codeparrot_training - Step 33808: {'lr': 0.00044514741153964, 'samples': 17310208, 'steps': 33808, 'loss/train': 2.2779147624969482} +03/05/2022 05:11:54 - INFO - codeparrot_training - Step 33809: {'lr': 0.00044514409454780016, 'samples': 17310720, 'steps': 33809, 'loss/train': 1.4496430158615112} +03/05/2022 05:11:54 - INFO - codeparrot_training - Skipping example with length 447 (seq_length=1024) +03/05/2022 05:11:59 - INFO - codeparrot_training - Step 33810: {'lr': 0.0004451407774680314, 'samples': 17311232, 'steps': 33810, 'loss/train': 1.0583422183990479} +03/05/2022 05:12:02 - INFO - codeparrot_training - Step 33811: {'lr': 0.0004451374603003353, 'samples': 17311744, 'steps': 33811, 'loss/train': 1.4394686222076416} +03/05/2022 05:12:02 - INFO - codeparrot_training - Skipping example with length 782 (seq_length=1024) +03/05/2022 05:12:08 - INFO - codeparrot_training - Step 33812: {'lr': 0.0004451341430447132, 'samples': 17312256, 'steps': 33812, 'loss/train': 1.8045791387557983} +03/05/2022 05:12:11 - INFO - codeparrot_training - Step 33813: {'lr': 0.0004451308257011667, 'samples': 17312768, 'steps': 33813, 'loss/train': 1.6149893999099731} +03/05/2022 05:12:11 - INFO - codeparrot_training - Skipping example with length 469 (seq_length=1024) +03/05/2022 05:12:16 - INFO - codeparrot_training - Step 33814: {'lr': 0.00044512750826969724, 'samples': 17313280, 'steps': 33814, 'loss/train': 2.0532898902893066} +03/05/2022 05:12:19 - INFO - codeparrot_training - Step 33815: {'lr': 0.0004451241907503063, 'samples': 17313792, 'steps': 33815, 'loss/train': 1.2666285037994385} +03/05/2022 05:12:19 - INFO - codeparrot_training - Skipping example with length 61 (seq_length=1024) +03/05/2022 05:12:24 - INFO - codeparrot_training - Step 33816: {'lr': 0.0004451208731429954, 'samples': 17314304, 'steps': 33816, 'loss/train': 2.2859816551208496} +03/05/2022 05:12:28 - INFO - codeparrot_training - Step 33817: {'lr': 0.00044511755544776615, 'samples': 17314816, 'steps': 33817, 'loss/train': 2.349276304244995} +03/05/2022 05:12:28 - INFO - codeparrot_training - Skipping example with length 327 (seq_length=1024) +03/05/2022 05:12:33 - INFO - codeparrot_training - Step 33818: {'lr': 0.0004451142376646199, 'samples': 17315328, 'steps': 33818, 'loss/train': 1.9633797407150269} +03/05/2022 05:12:36 - INFO - codeparrot_training - Skipping example with length 577 (seq_length=1024) +03/05/2022 05:12:38 - INFO - codeparrot_training - Step 33819: {'lr': 0.0004451109197935582, 'samples': 17315840, 'steps': 33819, 'loss/train': 1.80086350440979} +03/05/2022 05:12:41 - INFO - codeparrot_training - Step 33820: {'lr': 0.0004451076018345824, 'samples': 17316352, 'steps': 33820, 'loss/train': 2.1896166801452637} +03/05/2022 05:12:45 - INFO - codeparrot_training - Step 33821: {'lr': 0.0004451042837876943, 'samples': 17316864, 'steps': 33821, 'loss/train': 1.811818242073059} +03/05/2022 05:12:45 - INFO - codeparrot_training - Skipping example with length 788 (seq_length=1024) +03/05/2022 05:12:50 - INFO - codeparrot_training - Step 33822: {'lr': 0.00044510096565289513, 'samples': 17317376, 'steps': 33822, 'loss/train': 2.7449123859405518} +03/05/2022 05:12:53 - INFO - codeparrot_training - Step 33823: {'lr': 0.0004450976474301865, 'samples': 17317888, 'steps': 33823, 'loss/train': 1.874610185623169} +03/05/2022 05:12:53 - INFO - codeparrot_training - Skipping example with length 548 (seq_length=1024) +03/05/2022 05:12:58 - INFO - codeparrot_training - Step 33824: {'lr': 0.0004450943291195698, 'samples': 17318400, 'steps': 33824, 'loss/train': 1.9042495489120483} +03/05/2022 05:13:02 - INFO - codeparrot_training - Step 33825: {'lr': 0.0004450910107210467, 'samples': 17318912, 'steps': 33825, 'loss/train': 2.4449896812438965} +03/05/2022 05:13:02 - INFO - codeparrot_training - Skipping example with length 575 (seq_length=1024) +03/05/2022 05:13:07 - INFO - codeparrot_training - Step 33826: {'lr': 0.00044508769223461863, 'samples': 17319424, 'steps': 33826, 'loss/train': 2.013458251953125} +03/05/2022 05:13:10 - INFO - codeparrot_training - Step 33827: {'lr': 0.00044508437366028695, 'samples': 17319936, 'steps': 33827, 'loss/train': 0.8128820061683655} +03/05/2022 05:13:10 - INFO - codeparrot_training - Skipping example with length 115 (seq_length=1024) +03/05/2022 05:13:15 - INFO - codeparrot_training - Step 33828: {'lr': 0.00044508105499805337, 'samples': 17320448, 'steps': 33828, 'loss/train': 1.38637375831604} +03/05/2022 05:13:18 - INFO - codeparrot_training - Skipping example with length 342 (seq_length=1024) +03/05/2022 05:13:21 - INFO - codeparrot_training - Step 33829: {'lr': 0.0004450777362479192, 'samples': 17320960, 'steps': 33829, 'loss/train': 1.8780635595321655} +03/05/2022 05:13:24 - INFO - codeparrot_training - Step 33830: {'lr': 0.000445074417409886, 'samples': 17321472, 'steps': 33830, 'loss/train': 2.2296218872070312} +03/05/2022 05:13:27 - INFO - codeparrot_training - Step 33831: {'lr': 0.0004450710984839553, 'samples': 17321984, 'steps': 33831, 'loss/train': 1.9975776672363281} +03/05/2022 05:13:27 - INFO - codeparrot_training - Skipping example with length 100 (seq_length=1024) +03/05/2022 05:13:32 - INFO - codeparrot_training - Step 33832: {'lr': 0.00044506777947012863, 'samples': 17322496, 'steps': 33832, 'loss/train': 1.4816038608551025} +03/05/2022 05:13:36 - INFO - codeparrot_training - Step 33833: {'lr': 0.0004450644603684074, 'samples': 17323008, 'steps': 33833, 'loss/train': 2.418100595474243} +03/05/2022 05:13:36 - INFO - codeparrot_training - Skipping example with length 244 (seq_length=1024) +03/05/2022 05:13:41 - INFO - codeparrot_training - Step 33834: {'lr': 0.0004450611411787931, 'samples': 17323520, 'steps': 33834, 'loss/train': 1.075097680091858} +03/05/2022 05:13:44 - INFO - codeparrot_training - Step 33835: {'lr': 0.0004450578219012873, 'samples': 17324032, 'steps': 33835, 'loss/train': 1.541085958480835} +03/05/2022 05:13:44 - INFO - codeparrot_training - Skipping example with length 664 (seq_length=1024) +03/05/2022 05:13:49 - INFO - codeparrot_training - Step 33836: {'lr': 0.00044505450253589144, 'samples': 17324544, 'steps': 33836, 'loss/train': 1.6833947896957397} +03/05/2022 05:13:52 - INFO - codeparrot_training - Step 33837: {'lr': 0.00044505118308260693, 'samples': 17325056, 'steps': 33837, 'loss/train': 2.0897908210754395} +03/05/2022 05:13:52 - INFO - codeparrot_training - Skipping example with length 713 (seq_length=1024) +03/05/2022 05:13:58 - INFO - codeparrot_training - Step 33838: {'lr': 0.0004450478635414355, 'samples': 17325568, 'steps': 33838, 'loss/train': 1.2983777523040771} +03/05/2022 05:14:01 - INFO - codeparrot_training - Step 33839: {'lr': 0.0004450445439123785, 'samples': 17326080, 'steps': 33839, 'loss/train': 2.220438241958618} +03/05/2022 05:14:01 - INFO - codeparrot_training - Skipping example with length 314 (seq_length=1024) +03/05/2022 05:14:06 - INFO - codeparrot_training - Step 33840: {'lr': 0.0004450412241954374, 'samples': 17326592, 'steps': 33840, 'loss/train': 0.99775230884552} +03/05/2022 05:14:09 - INFO - codeparrot_training - Step 33841: {'lr': 0.00044503790439061374, 'samples': 17327104, 'steps': 33841, 'loss/train': 1.569477915763855} +03/05/2022 05:14:09 - INFO - codeparrot_training - Skipping example with length 57 (seq_length=1024) +03/05/2022 05:14:15 - INFO - codeparrot_training - Step 33842: {'lr': 0.000445034584497909, 'samples': 17327616, 'steps': 33842, 'loss/train': 2.365832805633545} +03/05/2022 05:14:18 - INFO - codeparrot_training - Step 33843: {'lr': 0.00044503126451732474, 'samples': 17328128, 'steps': 33843, 'loss/train': 1.1935734748840332} +03/05/2022 05:14:18 - INFO - codeparrot_training - Skipping example with length 352 (seq_length=1024) +03/05/2022 05:14:23 - INFO - codeparrot_training - Step 33844: {'lr': 0.00044502794444886234, 'samples': 17328640, 'steps': 33844, 'loss/train': 2.0076255798339844} +03/05/2022 05:14:26 - INFO - codeparrot_training - Skipping example with length 686 (seq_length=1024) +03/05/2022 05:14:28 - INFO - codeparrot_training - Step 33845: {'lr': 0.00044502462429252336, 'samples': 17329152, 'steps': 33845, 'loss/train': 2.0417819023132324} +03/05/2022 05:14:32 - INFO - codeparrot_training - Step 33846: {'lr': 0.0004450213040483093, 'samples': 17329664, 'steps': 33846, 'loss/train': 1.806931972503662} +03/05/2022 05:14:34 - INFO - codeparrot_training - Skipping example with length 24 (seq_length=1024) +03/05/2022 05:14:37 - INFO - codeparrot_training - Step 33847: {'lr': 0.00044501798371622173, 'samples': 17330176, 'steps': 33847, 'loss/train': 1.3489655256271362} +03/05/2022 05:14:40 - INFO - codeparrot_training - Step 33848: {'lr': 0.00044501466329626197, 'samples': 17330688, 'steps': 33848, 'loss/train': 1.4489156007766724} +03/05/2022 05:14:42 - INFO - codeparrot_training - Skipping example with length 894 (seq_length=1024) +03/05/2022 05:14:45 - INFO - codeparrot_training - Step 33849: {'lr': 0.0004450113427884317, 'samples': 17331200, 'steps': 33849, 'loss/train': 1.8033791780471802} +03/05/2022 05:14:48 - INFO - codeparrot_training - Step 33850: {'lr': 0.00044500802219273224, 'samples': 17331712, 'steps': 33850, 'loss/train': 1.6496083736419678} +03/05/2022 05:14:51 - INFO - codeparrot_training - Skipping example with length 593 (seq_length=1024) +03/05/2022 05:14:54 - INFO - codeparrot_training - Step 33851: {'lr': 0.00044500470150916514, 'samples': 17332224, 'steps': 33851, 'loss/train': 2.935706377029419} +03/05/2022 05:14:57 - INFO - codeparrot_training - Step 33852: {'lr': 0.000445001380737732, 'samples': 17332736, 'steps': 33852, 'loss/train': 1.1448179483413696} +03/05/2022 05:14:59 - INFO - codeparrot_training - Skipping example with length 196 (seq_length=1024) +03/05/2022 05:15:02 - INFO - codeparrot_training - Step 33853: {'lr': 0.0004449980598784343, 'samples': 17333248, 'steps': 33853, 'loss/train': 1.5741881132125854} +03/05/2022 05:15:06 - INFO - codeparrot_training - Step 33854: {'lr': 0.0004449947389312734, 'samples': 17333760, 'steps': 33854, 'loss/train': 1.3452973365783691} +03/05/2022 05:15:08 - INFO - codeparrot_training - Skipping example with length 800 (seq_length=1024) +03/05/2022 05:15:11 - INFO - codeparrot_training - Step 33855: {'lr': 0.00044499141789625086, 'samples': 17334272, 'steps': 33855, 'loss/train': 1.4021207094192505} +03/05/2022 05:15:14 - INFO - codeparrot_training - Step 33856: {'lr': 0.0004449880967733683, 'samples': 17334784, 'steps': 33856, 'loss/train': 2.03263258934021} +03/05/2022 05:15:17 - INFO - codeparrot_training - Skipping example with length 177 (seq_length=1024) +03/05/2022 05:15:19 - INFO - codeparrot_training - Step 33857: {'lr': 0.0004449847755626271, 'samples': 17335296, 'steps': 33857, 'loss/train': 1.3333001136779785} +03/05/2022 05:15:22 - INFO - codeparrot_training - Step 33858: {'lr': 0.0004449814542640287, 'samples': 17335808, 'steps': 33858, 'loss/train': 2.0181546211242676} +03/05/2022 05:15:25 - INFO - codeparrot_training - Skipping example with length 621 (seq_length=1024) +03/05/2022 05:15:28 - INFO - codeparrot_training - Step 33859: {'lr': 0.0004449781328775746, 'samples': 17336320, 'steps': 33859, 'loss/train': 1.504160761833191} +03/05/2022 05:15:31 - INFO - codeparrot_training - Step 33860: {'lr': 0.0004449748114032665, 'samples': 17336832, 'steps': 33860, 'loss/train': 1.5570697784423828} +03/05/2022 05:15:33 - INFO - codeparrot_training - Skipping example with length 18 (seq_length=1024) +03/05/2022 05:15:36 - INFO - codeparrot_training - Step 33861: {'lr': 0.00044497148984110567, 'samples': 17337344, 'steps': 33861, 'loss/train': 4.030794620513916} +03/05/2022 05:15:39 - INFO - codeparrot_training - Step 33862: {'lr': 0.00044496816819109377, 'samples': 17337856, 'steps': 33862, 'loss/train': 1.4438660144805908} +03/05/2022 05:15:42 - INFO - codeparrot_training - Skipping example with length 727 (seq_length=1024) +03/05/2022 05:15:45 - INFO - codeparrot_training - Step 33863: {'lr': 0.0004449648464532322, 'samples': 17338368, 'steps': 33863, 'loss/train': 0.9434030055999756} +03/05/2022 05:15:48 - INFO - codeparrot_training - Step 33864: {'lr': 0.0004449615246275225, 'samples': 17338880, 'steps': 33864, 'loss/train': 2.2798163890838623} +03/05/2022 05:15:50 - INFO - codeparrot_training - Skipping example with length 376 (seq_length=1024) +03/05/2022 05:15:53 - INFO - codeparrot_training - Step 33865: {'lr': 0.000444958202713966, 'samples': 17339392, 'steps': 33865, 'loss/train': 2.1741957664489746} +03/05/2022 05:15:56 - INFO - codeparrot_training - Step 33866: {'lr': 0.0004449548807125645, 'samples': 17339904, 'steps': 33866, 'loss/train': 1.5737000703811646} +03/05/2022 05:15:58 - INFO - codeparrot_training - Skipping example with length 286 (seq_length=1024) +03/05/2022 05:16:01 - INFO - codeparrot_training - Step 33867: {'lr': 0.0004449515586233193, 'samples': 17340416, 'steps': 33867, 'loss/train': 1.1860430240631104} +03/05/2022 05:16:05 - INFO - codeparrot_training - Step 33868: {'lr': 0.0004449482364462319, 'samples': 17340928, 'steps': 33868, 'loss/train': 1.6067126989364624} +03/05/2022 05:16:07 - INFO - codeparrot_training - Skipping example with length 1012 (seq_length=1024) +03/05/2022 05:16:10 - INFO - codeparrot_training - Step 33869: {'lr': 0.0004449449141813039, 'samples': 17341440, 'steps': 33869, 'loss/train': 2.393869400024414} +03/05/2022 05:16:13 - INFO - codeparrot_training - Step 33870: {'lr': 0.00044494159182853667, 'samples': 17341952, 'steps': 33870, 'loss/train': 1.7750999927520752} +03/05/2022 05:16:15 - INFO - codeparrot_training - Skipping example with length 983 (seq_length=1024) +03/05/2022 05:16:18 - INFO - codeparrot_training - Step 33871: {'lr': 0.0004449382693879318, 'samples': 17342464, 'steps': 33871, 'loss/train': 1.7189499139785767} +03/05/2022 05:16:21 - INFO - codeparrot_training - Step 33872: {'lr': 0.0004449349468594908, 'samples': 17342976, 'steps': 33872, 'loss/train': 2.0160794258117676} +03/05/2022 05:16:24 - INFO - codeparrot_training - Skipping example with length 402 (seq_length=1024) +03/05/2022 05:16:27 - INFO - codeparrot_training - Step 33873: {'lr': 0.000444931624243215, 'samples': 17343488, 'steps': 33873, 'loss/train': 1.6569578647613525} +03/05/2022 05:16:30 - INFO - codeparrot_training - Step 33874: {'lr': 0.0004449283015391061, 'samples': 17344000, 'steps': 33874, 'loss/train': 0.6907163262367249} +03/05/2022 05:16:33 - INFO - codeparrot_training - Skipping example with length 336 (seq_length=1024) +03/05/2022 05:16:35 - INFO - codeparrot_training - Step 33875: {'lr': 0.0004449249787471655, 'samples': 17344512, 'steps': 33875, 'loss/train': 1.870224118232727} +03/05/2022 05:16:38 - INFO - codeparrot_training - Step 33876: {'lr': 0.0004449216558673947, 'samples': 17345024, 'steps': 33876, 'loss/train': 1.4474776983261108} +03/05/2022 05:16:41 - INFO - codeparrot_training - Skipping example with length 935 (seq_length=1024) +03/05/2022 05:16:44 - INFO - codeparrot_training - Step 33877: {'lr': 0.0004449183328997952, 'samples': 17345536, 'steps': 33877, 'loss/train': 1.9273661375045776} +03/05/2022 05:16:47 - INFO - codeparrot_training - Step 33878: {'lr': 0.0004449150098443685, 'samples': 17346048, 'steps': 33878, 'loss/train': 1.457001805305481} +03/05/2022 05:16:50 - INFO - codeparrot_training - Step 33879: {'lr': 0.00044491168670111615, 'samples': 17346560, 'steps': 33879, 'loss/train': 1.9852187633514404} +03/05/2022 05:16:50 - INFO - codeparrot_training - Skipping example with length 1019 (seq_length=1024) +03/05/2022 05:16:55 - INFO - codeparrot_training - Step 33880: {'lr': 0.0004449083634700396, 'samples': 17347072, 'steps': 33880, 'loss/train': 1.6012510061264038} +03/05/2022 05:16:59 - INFO - codeparrot_training - Step 33881: {'lr': 0.00044490504015114033, 'samples': 17347584, 'steps': 33881, 'loss/train': 1.7568929195404053} +03/05/2022 05:16:59 - INFO - codeparrot_training - Skipping example with length 542 (seq_length=1024) +03/05/2022 05:17:04 - INFO - codeparrot_training - Step 33882: {'lr': 0.0004449017167444198, 'samples': 17348096, 'steps': 33882, 'loss/train': 1.164212942123413} +03/05/2022 05:17:07 - INFO - codeparrot_training - Step 33883: {'lr': 0.0004448983932498797, 'samples': 17348608, 'steps': 33883, 'loss/train': 1.2414915561676025} +03/05/2022 05:17:07 - INFO - codeparrot_training - Skipping example with length 738 (seq_length=1024) +03/05/2022 05:17:13 - INFO - codeparrot_training - Step 33884: {'lr': 0.00044489506966752127, 'samples': 17349120, 'steps': 33884, 'loss/train': 2.0429930686950684} +03/05/2022 05:17:16 - INFO - codeparrot_training - Step 33885: {'lr': 0.00044489174599734614, 'samples': 17349632, 'steps': 33885, 'loss/train': 0.07579810172319412} +03/05/2022 05:17:16 - INFO - codeparrot_training - Skipping example with length 1016 (seq_length=1024) +03/05/2022 05:17:21 - INFO - codeparrot_training - Step 33886: {'lr': 0.0004448884222393559, 'samples': 17350144, 'steps': 33886, 'loss/train': 2.0461721420288086} +03/05/2022 05:17:24 - INFO - codeparrot_training - Skipping example with length 980 (seq_length=1024) +03/05/2022 05:17:26 - INFO - codeparrot_training - Step 33887: {'lr': 0.00044488509839355183, 'samples': 17350656, 'steps': 33887, 'loss/train': 1.5489851236343384} +03/05/2022 05:17:30 - INFO - codeparrot_training - Step 33888: {'lr': 0.00044488177445993563, 'samples': 17351168, 'steps': 33888, 'loss/train': 1.3924423456192017} +03/05/2022 05:17:32 - INFO - codeparrot_training - Skipping example with length 923 (seq_length=1024) +03/05/2022 05:17:35 - INFO - codeparrot_training - Step 33889: {'lr': 0.0004448784504385086, 'samples': 17351680, 'steps': 33889, 'loss/train': 1.1904181241989136} +03/05/2022 05:17:38 - INFO - codeparrot_training - Step 33890: {'lr': 0.0004448751263292724, 'samples': 17352192, 'steps': 33890, 'loss/train': 2.004229784011841} +03/05/2022 05:17:40 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 05:17:43 - INFO - codeparrot_training - Step 33891: {'lr': 0.0004448718021322285, 'samples': 17352704, 'steps': 33891, 'loss/train': 1.819656252861023} +03/05/2022 05:17:47 - INFO - codeparrot_training - Step 33892: {'lr': 0.0004448684778473784, 'samples': 17353216, 'steps': 33892, 'loss/train': 1.5756034851074219} +03/05/2022 05:17:49 - INFO - codeparrot_training - Skipping example with length 871 (seq_length=1024) +03/05/2022 05:17:52 - INFO - codeparrot_training - Step 33893: {'lr': 0.0004448651534747235, 'samples': 17353728, 'steps': 33893, 'loss/train': 1.8945651054382324} +03/05/2022 05:17:55 - INFO - codeparrot_training - Step 33894: {'lr': 0.0004448618290142654, 'samples': 17354240, 'steps': 33894, 'loss/train': 1.8333640098571777} +03/05/2022 05:17:58 - INFO - codeparrot_training - Step 33895: {'lr': 0.0004448585044660055, 'samples': 17354752, 'steps': 33895, 'loss/train': 1.2428842782974243} +03/05/2022 05:17:58 - INFO - codeparrot_training - Skipping example with length 673 (seq_length=1024) +03/05/2022 05:18:04 - INFO - codeparrot_training - Step 33896: {'lr': 0.0004448551798299455, 'samples': 17355264, 'steps': 33896, 'loss/train': 2.686734199523926} +03/05/2022 05:18:07 - INFO - codeparrot_training - Step 33897: {'lr': 0.00044485185510608665, 'samples': 17355776, 'steps': 33897, 'loss/train': 0.8780430555343628} +03/05/2022 05:18:09 - INFO - codeparrot_training - Skipping example with length 902 (seq_length=1024) +03/05/2022 05:18:12 - INFO - codeparrot_training - Step 33898: {'lr': 0.0004448485302944306, 'samples': 17356288, 'steps': 33898, 'loss/train': 1.5389349460601807} +03/05/2022 05:18:16 - INFO - codeparrot_training - Step 33899: {'lr': 0.0004448452053949789, 'samples': 17356800, 'steps': 33899, 'loss/train': 0.6446228623390198} +03/05/2022 05:18:16 - INFO - codeparrot_training - Skipping example with length 949 (seq_length=1024) +03/05/2022 05:18:21 - INFO - codeparrot_training - Step 33900: {'lr': 0.0004448418804077328, 'samples': 17357312, 'steps': 33900, 'loss/train': 1.3159321546554565} +03/05/2022 05:18:24 - INFO - codeparrot_training - Step 33901: {'lr': 0.000444838555332694, 'samples': 17357824, 'steps': 33901, 'loss/train': 1.3943349123001099} +03/05/2022 05:18:25 - INFO - codeparrot_training - Skipping example with length 784 (seq_length=1024) +03/05/2022 05:18:29 - INFO - codeparrot_training - Step 33902: {'lr': 0.000444835230169864, 'samples': 17358336, 'steps': 33902, 'loss/train': 2.0463690757751465} +03/05/2022 05:18:32 - INFO - codeparrot_training - Step 33903: {'lr': 0.00044483190491924427, 'samples': 17358848, 'steps': 33903, 'loss/train': 0.8285592198371887} +03/05/2022 05:18:33 - INFO - codeparrot_training - Skipping example with length 482 (seq_length=1024) +03/05/2022 05:18:38 - INFO - codeparrot_training - Step 33904: {'lr': 0.0004448285795808362, 'samples': 17359360, 'steps': 33904, 'loss/train': 1.7008635997772217} +03/05/2022 05:18:41 - INFO - codeparrot_training - Step 33905: {'lr': 0.00044482525415464144, 'samples': 17359872, 'steps': 33905, 'loss/train': 1.963705062866211} +03/05/2022 05:18:41 - INFO - codeparrot_training - Skipping example with length 997 (seq_length=1024) +03/05/2022 05:18:46 - INFO - codeparrot_training - Step 33906: {'lr': 0.0004448219286406614, 'samples': 17360384, 'steps': 33906, 'loss/train': 1.6571139097213745} +03/05/2022 05:18:49 - INFO - codeparrot_training - Step 33907: {'lr': 0.00044481860303889766, 'samples': 17360896, 'steps': 33907, 'loss/train': 1.851084589958191} +03/05/2022 05:18:50 - INFO - codeparrot_training - Skipping example with length 426 (seq_length=1024) +03/05/2022 05:18:55 - INFO - codeparrot_training - Step 33908: {'lr': 0.0004448152773493516, 'samples': 17361408, 'steps': 33908, 'loss/train': 1.447405457496643} +03/05/2022 05:18:58 - INFO - codeparrot_training - Step 33909: {'lr': 0.0004448119515720248, 'samples': 17361920, 'steps': 33909, 'loss/train': 1.2948707342147827} +03/05/2022 05:18:59 - INFO - codeparrot_training - Skipping example with length 948 (seq_length=1024) +03/05/2022 05:19:03 - INFO - codeparrot_training - Step 33910: {'lr': 0.0004448086257069187, 'samples': 17362432, 'steps': 33910, 'loss/train': 1.6074893474578857} +03/05/2022 05:19:06 - INFO - codeparrot_training - Step 33911: {'lr': 0.00044480529975403496, 'samples': 17362944, 'steps': 33911, 'loss/train': 1.473939061164856} +03/05/2022 05:19:08 - INFO - codeparrot_training - Skipping example with length 202 (seq_length=1024) +03/05/2022 05:19:11 - INFO - codeparrot_training - Step 33912: {'lr': 0.00044480197371337484, 'samples': 17363456, 'steps': 33912, 'loss/train': 1.9812458753585815} +03/05/2022 05:19:15 - INFO - codeparrot_training - Step 33913: {'lr': 0.00044479864758494004, 'samples': 17363968, 'steps': 33913, 'loss/train': 1.9686212539672852} +03/05/2022 05:19:16 - INFO - codeparrot_training - Skipping example with length 400 (seq_length=1024) +03/05/2022 05:19:20 - INFO - codeparrot_training - Step 33914: {'lr': 0.0004447953213687319, 'samples': 17364480, 'steps': 33914, 'loss/train': 1.6838384866714478} +03/05/2022 05:19:23 - INFO - codeparrot_training - Step 33915: {'lr': 0.00044479199506475205, 'samples': 17364992, 'steps': 33915, 'loss/train': 1.1965010166168213} +03/05/2022 05:19:25 - INFO - codeparrot_training - Skipping example with length 675 (seq_length=1024) +03/05/2022 05:19:28 - INFO - codeparrot_training - Step 33916: {'lr': 0.0004447886686730019, 'samples': 17365504, 'steps': 33916, 'loss/train': 0.9995692372322083} +03/05/2022 05:19:32 - INFO - codeparrot_training - Step 33917: {'lr': 0.00044478534219348297, 'samples': 17366016, 'steps': 33917, 'loss/train': 0.9128006100654602} +03/05/2022 05:19:33 - INFO - codeparrot_training - Skipping example with length 585 (seq_length=1024) +03/05/2022 05:19:37 - INFO - codeparrot_training - Step 33918: {'lr': 0.0004447820156261968, 'samples': 17366528, 'steps': 33918, 'loss/train': 0.792133092880249} +03/05/2022 05:19:40 - INFO - codeparrot_training - Step 33919: {'lr': 0.0004447786889711449, 'samples': 17367040, 'steps': 33919, 'loss/train': 1.4905247688293457} +03/05/2022 05:19:41 - INFO - codeparrot_training - Skipping example with length 502 (seq_length=1024) +03/05/2022 05:19:45 - INFO - codeparrot_training - Step 33920: {'lr': 0.00044477536222832867, 'samples': 17367552, 'steps': 33920, 'loss/train': 1.7355396747589111} +03/05/2022 05:19:48 - INFO - codeparrot_training - Step 33921: {'lr': 0.0004447720353977497, 'samples': 17368064, 'steps': 33921, 'loss/train': 0.7810866832733154} +03/05/2022 05:19:50 - INFO - codeparrot_training - Skipping example with length 670 (seq_length=1024) +03/05/2022 05:19:54 - INFO - codeparrot_training - Step 33922: {'lr': 0.0004447687084794094, 'samples': 17368576, 'steps': 33922, 'loss/train': 1.4040842056274414} +03/05/2022 05:19:57 - INFO - codeparrot_training - Step 33923: {'lr': 0.00044476538147330934, 'samples': 17369088, 'steps': 33923, 'loss/train': 1.759506344795227} +03/05/2022 05:19:58 - INFO - codeparrot_training - Skipping example with length 283 (seq_length=1024) +03/05/2022 05:20:02 - INFO - codeparrot_training - Step 33924: {'lr': 0.00044476205437945105, 'samples': 17369600, 'steps': 33924, 'loss/train': 1.163450837135315} +03/05/2022 05:20:05 - INFO - codeparrot_training - Step 33925: {'lr': 0.0004447587271978359, 'samples': 17370112, 'steps': 33925, 'loss/train': 2.066434144973755} +03/05/2022 05:20:06 - INFO - codeparrot_training - Skipping example with length 527 (seq_length=1024) +03/05/2022 05:20:11 - INFO - codeparrot_training - Step 33926: {'lr': 0.0004447553999284656, 'samples': 17370624, 'steps': 33926, 'loss/train': 0.9701665639877319} +03/05/2022 05:20:14 - INFO - codeparrot_training - Step 33927: {'lr': 0.00044475207257134143, 'samples': 17371136, 'steps': 33927, 'loss/train': 1.9336720705032349} +03/05/2022 05:20:15 - INFO - codeparrot_training - Skipping example with length 29 (seq_length=1024) +03/05/2022 05:20:19 - INFO - codeparrot_training - Step 33928: {'lr': 0.000444748745126465, 'samples': 17371648, 'steps': 33928, 'loss/train': 1.7401714324951172} +03/05/2022 05:20:22 - INFO - codeparrot_training - Step 33929: {'lr': 0.0004447454175938378, 'samples': 17372160, 'steps': 33929, 'loss/train': 1.6509641408920288} +03/05/2022 05:20:23 - INFO - codeparrot_training - Skipping example with length 971 (seq_length=1024) +03/05/2022 05:20:28 - INFO - codeparrot_training - Step 33930: {'lr': 0.00044474208997346133, 'samples': 17372672, 'steps': 33930, 'loss/train': 1.3041768074035645} +03/05/2022 05:20:31 - INFO - codeparrot_training - Step 33931: {'lr': 0.00044473876226533703, 'samples': 17373184, 'steps': 33931, 'loss/train': 0.6916566491127014} +03/05/2022 05:20:32 - INFO - codeparrot_training - Skipping example with length 229 (seq_length=1024) +03/05/2022 05:20:36 - INFO - codeparrot_training - Step 33932: {'lr': 0.0004447354344694665, 'samples': 17373696, 'steps': 33932, 'loss/train': 2.3519835472106934} +03/05/2022 05:20:40 - INFO - codeparrot_training - Step 33933: {'lr': 0.0004447321065858512, 'samples': 17374208, 'steps': 33933, 'loss/train': 1.5290069580078125} +03/05/2022 05:20:41 - INFO - codeparrot_training - Skipping example with length 531 (seq_length=1024) +03/05/2022 05:20:45 - INFO - codeparrot_training - Step 33934: {'lr': 0.00044472877861449257, 'samples': 17374720, 'steps': 33934, 'loss/train': 1.1738260984420776} +03/05/2022 05:20:48 - INFO - codeparrot_training - Step 33935: {'lr': 0.00044472545055539213, 'samples': 17375232, 'steps': 33935, 'loss/train': 1.2830862998962402} +03/05/2022 05:20:49 - INFO - codeparrot_training - Skipping example with length 975 (seq_length=1024) +03/05/2022 05:20:53 - INFO - codeparrot_training - Step 33936: {'lr': 0.00044472212240855155, 'samples': 17375744, 'steps': 33936, 'loss/train': 1.4994702339172363} +03/05/2022 05:20:56 - INFO - codeparrot_training - Step 33937: {'lr': 0.0004447187941739721, 'samples': 17376256, 'steps': 33937, 'loss/train': 1.1862730979919434} +03/05/2022 05:20:58 - INFO - codeparrot_training - Skipping example with length 919 (seq_length=1024) +03/05/2022 05:21:02 - INFO - codeparrot_training - Step 33938: {'lr': 0.00044471546585165536, 'samples': 17376768, 'steps': 33938, 'loss/train': 1.1888177394866943} +03/05/2022 05:21:05 - INFO - codeparrot_training - Step 33939: {'lr': 0.0004447121374416028, 'samples': 17377280, 'steps': 33939, 'loss/train': 1.9602402448654175} +03/05/2022 05:21:06 - INFO - codeparrot_training - Skipping example with length 331 (seq_length=1024) +03/05/2022 05:21:10 - INFO - codeparrot_training - Step 33940: {'lr': 0.000444708808943816, 'samples': 17377792, 'steps': 33940, 'loss/train': 1.697003960609436} +03/05/2022 05:21:13 - INFO - codeparrot_training - Step 33941: {'lr': 0.00044470548035829637, 'samples': 17378304, 'steps': 33941, 'loss/train': 0.17559204995632172} +03/05/2022 05:21:14 - INFO - codeparrot_training - Skipping example with length 395 (seq_length=1024) +03/05/2022 05:21:19 - INFO - codeparrot_training - Step 33942: {'lr': 0.00044470215168504554, 'samples': 17378816, 'steps': 33942, 'loss/train': 2.0348830223083496} +03/05/2022 05:21:22 - INFO - codeparrot_training - Step 33943: {'lr': 0.0004446988229240648, 'samples': 17379328, 'steps': 33943, 'loss/train': 0.7638850212097168} +03/05/2022 05:21:23 - INFO - codeparrot_training - Skipping example with length 452 (seq_length=1024) +03/05/2022 05:21:27 - INFO - codeparrot_training - Step 33944: {'lr': 0.00044469549407535593, 'samples': 17379840, 'steps': 33944, 'loss/train': 1.419360637664795} +03/05/2022 05:21:30 - INFO - codeparrot_training - Step 33945: {'lr': 0.0004446921651389202, 'samples': 17380352, 'steps': 33945, 'loss/train': 0.07543662935495377} +03/05/2022 05:21:31 - INFO - codeparrot_training - Skipping example with length 555 (seq_length=1024) +03/05/2022 05:21:35 - INFO - codeparrot_training - Step 33946: {'lr': 0.00044468883611475913, 'samples': 17380864, 'steps': 33946, 'loss/train': 2.2713510990142822} +03/05/2022 05:21:39 - INFO - codeparrot_training - Step 33947: {'lr': 0.00044468550700287436, 'samples': 17381376, 'steps': 33947, 'loss/train': 1.3508340120315552} +03/05/2022 05:21:40 - INFO - codeparrot_training - Skipping example with length 930 (seq_length=1024) +03/05/2022 05:21:44 - INFO - codeparrot_training - Step 33948: {'lr': 0.00044468217780326724, 'samples': 17381888, 'steps': 33948, 'loss/train': 1.675719976425171} +03/05/2022 05:21:47 - INFO - codeparrot_training - Step 33949: {'lr': 0.0004446788485159393, 'samples': 17382400, 'steps': 33949, 'loss/train': 0.7711401581764221} +03/05/2022 05:21:48 - INFO - codeparrot_training - Skipping example with length 937 (seq_length=1024) +03/05/2022 05:21:52 - INFO - codeparrot_training - Step 33950: {'lr': 0.00044467551914089223, 'samples': 17382912, 'steps': 33950, 'loss/train': 1.340704083442688} +03/05/2022 05:21:56 - INFO - codeparrot_training - Step 33951: {'lr': 0.0004446721896781273, 'samples': 17383424, 'steps': 33951, 'loss/train': 0.13692378997802734} +03/05/2022 05:21:56 - INFO - codeparrot_training - Skipping example with length 818 (seq_length=1024) +03/05/2022 05:22:01 - INFO - codeparrot_training - Step 33952: {'lr': 0.00044466886012764603, 'samples': 17383936, 'steps': 33952, 'loss/train': 2.5945584774017334} +03/05/2022 05:22:04 - INFO - codeparrot_training - Step 33953: {'lr': 0.00044466553048944996, 'samples': 17384448, 'steps': 33953, 'loss/train': 1.5927963256835938} +03/05/2022 05:22:05 - INFO - codeparrot_training - Skipping example with length 252 (seq_length=1024) +03/05/2022 05:22:09 - INFO - codeparrot_training - Step 33954: {'lr': 0.0004446622007635407, 'samples': 17384960, 'steps': 33954, 'loss/train': 2.176279067993164} +03/05/2022 05:22:12 - INFO - codeparrot_training - Step 33955: {'lr': 0.0004446588709499196, 'samples': 17385472, 'steps': 33955, 'loss/train': 1.946581482887268} +03/05/2022 05:22:13 - INFO - codeparrot_training - Skipping example with length 207 (seq_length=1024) +03/05/2022 05:22:18 - INFO - codeparrot_training - Step 33956: {'lr': 0.00044465554104858817, 'samples': 17385984, 'steps': 33956, 'loss/train': 1.9513555765151978} +03/05/2022 05:22:21 - INFO - codeparrot_training - Step 33957: {'lr': 0.0004446522110595481, 'samples': 17386496, 'steps': 33957, 'loss/train': 1.7858421802520752} +03/05/2022 05:22:22 - INFO - codeparrot_training - Skipping example with length 939 (seq_length=1024) +03/05/2022 05:22:26 - INFO - codeparrot_training - Step 33958: {'lr': 0.00044464888098280067, 'samples': 17387008, 'steps': 33958, 'loss/train': 1.6601685285568237} +03/05/2022 05:22:29 - INFO - codeparrot_training - Step 33959: {'lr': 0.00044464555081834745, 'samples': 17387520, 'steps': 33959, 'loss/train': 1.634395956993103} +03/05/2022 05:22:30 - INFO - codeparrot_training - Skipping example with length 924 (seq_length=1024) +03/05/2022 05:22:35 - INFO - codeparrot_training - Step 33960: {'lr': 0.00044464222056618996, 'samples': 17388032, 'steps': 33960, 'loss/train': 1.9958555698394775} +03/05/2022 05:22:38 - INFO - codeparrot_training - Step 33961: {'lr': 0.00044463889022632963, 'samples': 17388544, 'steps': 33961, 'loss/train': 2.1417324542999268} +03/05/2022 05:22:39 - INFO - codeparrot_training - Skipping example with length 679 (seq_length=1024) +03/05/2022 05:22:43 - INFO - codeparrot_training - Step 33962: {'lr': 0.0004446355597987681, 'samples': 17389056, 'steps': 33962, 'loss/train': 1.9063613414764404} +03/05/2022 05:22:46 - INFO - codeparrot_training - Step 33963: {'lr': 0.00044463222928350677, 'samples': 17389568, 'steps': 33963, 'loss/train': 2.9024369716644287} +03/05/2022 05:22:47 - INFO - codeparrot_training - Skipping example with length 582 (seq_length=1024) +03/05/2022 05:22:51 - INFO - codeparrot_training - Step 33964: {'lr': 0.0004446288986805471, 'samples': 17390080, 'steps': 33964, 'loss/train': 1.6557780504226685} +03/05/2022 05:22:55 - INFO - codeparrot_training - Step 33965: {'lr': 0.0004446255679898907, 'samples': 17390592, 'steps': 33965, 'loss/train': 1.6633977890014648} +03/05/2022 05:22:55 - INFO - codeparrot_training - Skipping example with length 819 (seq_length=1024) +03/05/2022 05:23:00 - INFO - codeparrot_training - Step 33966: {'lr': 0.000444622237211539, 'samples': 17391104, 'steps': 33966, 'loss/train': 1.3186196088790894} +03/05/2022 05:23:03 - INFO - codeparrot_training - Step 33967: {'lr': 0.00044461890634549364, 'samples': 17391616, 'steps': 33967, 'loss/train': 1.8880226612091064} +03/05/2022 05:23:04 - INFO - codeparrot_training - Skipping example with length 724 (seq_length=1024) +03/05/2022 05:23:08 - INFO - codeparrot_training - Step 33968: {'lr': 0.00044461557539175587, 'samples': 17392128, 'steps': 33968, 'loss/train': 1.1651276350021362} +03/05/2022 05:23:11 - INFO - codeparrot_training - Step 33969: {'lr': 0.0004446122443503274, 'samples': 17392640, 'steps': 33969, 'loss/train': 1.0649319887161255} +03/05/2022 05:23:12 - INFO - codeparrot_training - Skipping example with length 394 (seq_length=1024) +03/05/2022 05:23:17 - INFO - codeparrot_training - Step 33970: {'lr': 0.00044460891322120963, 'samples': 17393152, 'steps': 33970, 'loss/train': 1.6299347877502441} +03/05/2022 05:23:20 - INFO - codeparrot_training - Step 33971: {'lr': 0.000444605582004404, 'samples': 17393664, 'steps': 33971, 'loss/train': 0.9564369320869446} +03/05/2022 05:23:20 - INFO - codeparrot_training - Skipping example with length 696 (seq_length=1024) +03/05/2022 05:23:25 - INFO - codeparrot_training - Step 33972: {'lr': 0.0004446022506999122, 'samples': 17394176, 'steps': 33972, 'loss/train': 1.629865288734436} +03/05/2022 05:23:28 - INFO - codeparrot_training - Step 33973: {'lr': 0.0004445989193077356, 'samples': 17394688, 'steps': 33973, 'loss/train': 1.9565603733062744} +03/05/2022 05:23:29 - INFO - codeparrot_training - Skipping example with length 160 (seq_length=1024) +03/05/2022 05:23:34 - INFO - codeparrot_training - Step 33974: {'lr': 0.0004445955878278758, 'samples': 17395200, 'steps': 33974, 'loss/train': 1.9195678234100342} +03/05/2022 05:23:37 - INFO - codeparrot_training - Step 33975: {'lr': 0.00044459225626033413, 'samples': 17395712, 'steps': 33975, 'loss/train': 0.9503218531608582} +03/05/2022 05:23:37 - INFO - codeparrot_training - Skipping example with length 162 (seq_length=1024) +03/05/2022 05:23:42 - INFO - codeparrot_training - Step 33976: {'lr': 0.00044458892460511225, 'samples': 17396224, 'steps': 33976, 'loss/train': 2.525550127029419} +03/05/2022 05:23:45 - INFO - codeparrot_training - Step 33977: {'lr': 0.0004445855928622116, 'samples': 17396736, 'steps': 33977, 'loss/train': 1.1452312469482422} +03/05/2022 05:23:45 - INFO - codeparrot_training - Skipping example with length 499 (seq_length=1024) +03/05/2022 05:23:50 - INFO - codeparrot_training - Step 33978: {'lr': 0.00044458226103163365, 'samples': 17397248, 'steps': 33978, 'loss/train': 0.6207029223442078} +03/05/2022 05:23:54 - INFO - codeparrot_training - Step 33979: {'lr': 0.0004445789291133799, 'samples': 17397760, 'steps': 33979, 'loss/train': 1.4539440870285034} +03/05/2022 05:23:54 - INFO - codeparrot_training - Skipping example with length 64 (seq_length=1024) +03/05/2022 05:23:59 - INFO - codeparrot_training - Step 33980: {'lr': 0.0004445755971074519, 'samples': 17398272, 'steps': 33980, 'loss/train': 1.0375241041183472} +03/05/2022 05:24:02 - INFO - codeparrot_training - Step 33981: {'lr': 0.0004445722650138512, 'samples': 17398784, 'steps': 33981, 'loss/train': 1.9532052278518677} +03/05/2022 05:24:02 - INFO - codeparrot_training - Skipping example with length 660 (seq_length=1024) +03/05/2022 05:24:07 - INFO - codeparrot_training - Step 33982: {'lr': 0.00044456893283257925, 'samples': 17399296, 'steps': 33982, 'loss/train': 1.2587968111038208} +03/05/2022 05:24:10 - INFO - codeparrot_training - Skipping example with length 45 (seq_length=1024) +03/05/2022 05:24:13 - INFO - codeparrot_training - Step 33983: {'lr': 0.00044456560056363746, 'samples': 17399808, 'steps': 33983, 'loss/train': 1.5715456008911133} +03/05/2022 05:24:16 - INFO - codeparrot_training - Step 33984: {'lr': 0.0004445622682070275, 'samples': 17400320, 'steps': 33984, 'loss/train': 1.4688823223114014} +03/05/2022 05:24:19 - INFO - codeparrot_training - Skipping example with length 779 (seq_length=1024) +03/05/2022 05:24:21 - INFO - codeparrot_training - Step 33985: {'lr': 0.00044455893576275077, 'samples': 17400832, 'steps': 33985, 'loss/train': 1.5532448291778564} +03/05/2022 05:24:24 - INFO - codeparrot_training - Step 33986: {'lr': 0.00044455560323080874, 'samples': 17401344, 'steps': 33986, 'loss/train': 2.2441117763519287} +03/05/2022 05:24:30 - INFO - codeparrot_training - Step 33987: {'lr': 0.00044455227061120296, 'samples': 17401856, 'steps': 33987, 'loss/train': 2.274519920349121} +03/05/2022 05:24:33 - INFO - codeparrot_training - Step 33988: {'lr': 0.000444548937903935, 'samples': 17402368, 'steps': 33988, 'loss/train': 1.8789424896240234} +03/05/2022 05:24:36 - INFO - codeparrot_training - Step 33989: {'lr': 0.0004445456051090062, 'samples': 17402880, 'steps': 33989, 'loss/train': 1.7000093460083008} +03/05/2022 05:24:36 - INFO - codeparrot_training - Skipping example with length 298 (seq_length=1024) +03/05/2022 05:24:41 - INFO - codeparrot_training - Step 33990: {'lr': 0.0004445422722264182, 'samples': 17403392, 'steps': 33990, 'loss/train': 2.164118766784668} +03/05/2022 05:24:44 - INFO - codeparrot_training - Step 33991: {'lr': 0.0004445389392561724, 'samples': 17403904, 'steps': 33991, 'loss/train': 1.7376148700714111} +03/05/2022 05:24:44 - INFO - codeparrot_training - Skipping example with length 12 (seq_length=1024) +03/05/2022 05:24:50 - INFO - codeparrot_training - Step 33992: {'lr': 0.0004445356061982704, 'samples': 17404416, 'steps': 33992, 'loss/train': 1.6368515491485596} +03/05/2022 05:24:53 - INFO - codeparrot_training - Step 33993: {'lr': 0.0004445322730527137, 'samples': 17404928, 'steps': 33993, 'loss/train': 1.713008999824524} +03/05/2022 05:24:53 - INFO - codeparrot_training - Skipping example with length 184 (seq_length=1024) +03/05/2022 05:24:58 - INFO - codeparrot_training - Step 33994: {'lr': 0.0004445289398195037, 'samples': 17405440, 'steps': 33994, 'loss/train': 0.6787934303283691} +03/05/2022 05:25:01 - INFO - codeparrot_training - Step 33995: {'lr': 0.000444525606498642, 'samples': 17405952, 'steps': 33995, 'loss/train': 1.6441653966903687} +03/05/2022 05:25:02 - INFO - codeparrot_training - Skipping example with length 695 (seq_length=1024) +03/05/2022 05:25:06 - INFO - codeparrot_training - Step 33996: {'lr': 0.00044452227309013003, 'samples': 17406464, 'steps': 33996, 'loss/train': 3.624610662460327} +03/05/2022 05:25:10 - INFO - codeparrot_training - Step 33997: {'lr': 0.0004445189395939694, 'samples': 17406976, 'steps': 33997, 'loss/train': 1.5357794761657715} +03/05/2022 05:25:10 - INFO - codeparrot_training - Skipping example with length 317 (seq_length=1024) +03/05/2022 05:25:15 - INFO - codeparrot_training - Step 33998: {'lr': 0.0004445156060101614, 'samples': 17407488, 'steps': 33998, 'loss/train': 1.9015567302703857} +03/05/2022 05:25:18 - INFO - codeparrot_training - Step 33999: {'lr': 0.0004445122723387077, 'samples': 17408000, 'steps': 33999, 'loss/train': 2.327850341796875} +03/05/2022 05:25:18 - INFO - codeparrot_training - Skipping example with length 56 (seq_length=1024) +03/05/2022 05:25:23 - INFO - codeparrot_training - Step 34000: {'lr': 0.0004445089385796099, 'samples': 17408512, 'steps': 34000, 'loss/train': 2.517242670059204} +03/05/2022 05:25:27 - INFO - codeparrot_training - Step 34001: {'lr': 0.0004445056047328693, 'samples': 17409024, 'steps': 34001, 'loss/train': 0.8967128992080688} +03/05/2022 05:25:27 - INFO - codeparrot_training - Skipping example with length 461 (seq_length=1024) +03/05/2022 05:25:32 - INFO - codeparrot_training - Step 34002: {'lr': 0.0004445022707984874, 'samples': 17409536, 'steps': 34002, 'loss/train': 1.659019947052002} +03/05/2022 05:25:35 - INFO - codeparrot_training - Step 34003: {'lr': 0.0004444989367764659, 'samples': 17410048, 'steps': 34003, 'loss/train': 1.7482949495315552} +03/05/2022 05:25:36 - INFO - codeparrot_training - Skipping example with length 65 (seq_length=1024) +03/05/2022 05:25:40 - INFO - codeparrot_training - Step 34004: {'lr': 0.0004444956026668061, 'samples': 17410560, 'steps': 34004, 'loss/train': 1.5374693870544434} +03/05/2022 05:25:43 - INFO - codeparrot_training - Step 34005: {'lr': 0.00044449226846950964, 'samples': 17411072, 'steps': 34005, 'loss/train': 1.5551549196243286} +03/05/2022 05:25:44 - INFO - codeparrot_training - Skipping example with length 186 (seq_length=1024) +03/05/2022 05:25:49 - INFO - codeparrot_training - Step 34006: {'lr': 0.00044448893418457794, 'samples': 17411584, 'steps': 34006, 'loss/train': 0.5738779902458191} +03/05/2022 05:25:52 - INFO - codeparrot_training - Step 34007: {'lr': 0.00044448559981201256, 'samples': 17412096, 'steps': 34007, 'loss/train': 1.4854726791381836} +03/05/2022 05:25:52 - INFO - codeparrot_training - Skipping example with length 614 (seq_length=1024) +03/05/2022 05:25:57 - INFO - codeparrot_training - Step 34008: {'lr': 0.00044448226535181485, 'samples': 17412608, 'steps': 34008, 'loss/train': 2.1169748306274414} +03/05/2022 05:26:00 - INFO - codeparrot_training - Step 34009: {'lr': 0.0004444789308039865, 'samples': 17413120, 'steps': 34009, 'loss/train': 1.4246947765350342} +03/05/2022 05:26:00 - INFO - codeparrot_training - Skipping example with length 38 (seq_length=1024) +03/05/2022 05:26:06 - INFO - codeparrot_training - Step 34010: {'lr': 0.00044447559616852893, 'samples': 17413632, 'steps': 34010, 'loss/train': 1.1972066164016724} +03/05/2022 05:26:09 - INFO - codeparrot_training - Step 34011: {'lr': 0.0004444722614454437, 'samples': 17414144, 'steps': 34011, 'loss/train': 1.5975327491760254} +03/05/2022 05:26:09 - INFO - codeparrot_training - Skipping example with length 412 (seq_length=1024) +03/05/2022 05:26:14 - INFO - codeparrot_training - Step 34012: {'lr': 0.00044446892663473227, 'samples': 17414656, 'steps': 34012, 'loss/train': 1.0017327070236206} +03/05/2022 05:26:17 - INFO - codeparrot_training - Step 34013: {'lr': 0.0004444655917363961, 'samples': 17415168, 'steps': 34013, 'loss/train': 1.9199111461639404} +03/05/2022 05:26:18 - INFO - codeparrot_training - Skipping example with length 819 (seq_length=1024) +03/05/2022 05:26:23 - INFO - codeparrot_training - Step 34014: {'lr': 0.00044446225675043684, 'samples': 17415680, 'steps': 34014, 'loss/train': 2.266388177871704} +03/05/2022 05:26:26 - INFO - codeparrot_training - Step 34015: {'lr': 0.0004444589216768558, 'samples': 17416192, 'steps': 34015, 'loss/train': 2.0375964641571045} +03/05/2022 05:26:27 - INFO - codeparrot_training - Skipping example with length 886 (seq_length=1024) +03/05/2022 05:26:31 - INFO - codeparrot_training - Step 34016: {'lr': 0.0004444555865156545, 'samples': 17416704, 'steps': 34016, 'loss/train': 1.4140856266021729} +03/05/2022 05:26:34 - INFO - codeparrot_training - Step 34017: {'lr': 0.0004444522512668346, 'samples': 17417216, 'steps': 34017, 'loss/train': 1.0430351495742798} +03/05/2022 05:26:35 - INFO - codeparrot_training - Skipping example with length 111 (seq_length=1024) +03/05/2022 05:26:40 - INFO - codeparrot_training - Step 34018: {'lr': 0.0004444489159303976, 'samples': 17417728, 'steps': 34018, 'loss/train': 1.5708619356155396} +03/05/2022 05:26:43 - INFO - codeparrot_training - Step 34019: {'lr': 0.0004444455805063448, 'samples': 17418240, 'steps': 34019, 'loss/train': 1.9042675495147705} +03/05/2022 05:26:43 - INFO - codeparrot_training - Skipping example with length 833 (seq_length=1024) +03/05/2022 05:26:48 - INFO - codeparrot_training - Step 34020: {'lr': 0.00044444224499467784, 'samples': 17418752, 'steps': 34020, 'loss/train': 2.2518444061279297} +03/05/2022 05:26:51 - INFO - codeparrot_training - Step 34021: {'lr': 0.0004444389093953982, 'samples': 17419264, 'steps': 34021, 'loss/train': 1.9457601308822632} +03/05/2022 05:26:52 - INFO - codeparrot_training - Skipping example with length 903 (seq_length=1024) +03/05/2022 05:26:57 - INFO - codeparrot_training - Step 34022: {'lr': 0.00044443557370850743, 'samples': 17419776, 'steps': 34022, 'loss/train': 1.21356201171875} +03/05/2022 05:27:00 - INFO - codeparrot_training - Step 34023: {'lr': 0.00044443223793400695, 'samples': 17420288, 'steps': 34023, 'loss/train': 1.6199712753295898} +03/05/2022 05:27:00 - INFO - codeparrot_training - Skipping example with length 201 (seq_length=1024) +03/05/2022 05:27:05 - INFO - codeparrot_training - Step 34024: {'lr': 0.0004444289020718983, 'samples': 17420800, 'steps': 34024, 'loss/train': 1.809503197669983} +03/05/2022 05:27:08 - INFO - codeparrot_training - Step 34025: {'lr': 0.000444425566122183, 'samples': 17421312, 'steps': 34025, 'loss/train': 1.568223476409912} +03/05/2022 05:27:09 - INFO - codeparrot_training - Skipping example with length 688 (seq_length=1024) +03/05/2022 05:27:13 - INFO - codeparrot_training - Step 34026: {'lr': 0.0004444222300848626, 'samples': 17421824, 'steps': 34026, 'loss/train': 1.978883147239685} +03/05/2022 05:27:17 - INFO - codeparrot_training - Step 34027: {'lr': 0.00044441889395993844, 'samples': 17422336, 'steps': 34027, 'loss/train': 1.7291051149368286} +03/05/2022 05:27:17 - INFO - codeparrot_training - Skipping example with length 1018 (seq_length=1024) +03/05/2022 05:27:22 - INFO - codeparrot_training - Step 34028: {'lr': 0.00044441555774741215, 'samples': 17422848, 'steps': 34028, 'loss/train': 1.868433952331543} +03/05/2022 05:27:25 - INFO - codeparrot_training - Step 34029: {'lr': 0.00044441222144728525, 'samples': 17423360, 'steps': 34029, 'loss/train': 2.080197811126709} +03/05/2022 05:27:25 - INFO - codeparrot_training - Skipping example with length 997 (seq_length=1024) +03/05/2022 05:27:30 - INFO - codeparrot_training - Step 34030: {'lr': 0.00044440888505955926, 'samples': 17423872, 'steps': 34030, 'loss/train': 1.055450677871704} +03/05/2022 05:27:34 - INFO - codeparrot_training - Step 34031: {'lr': 0.00044440554858423553, 'samples': 17424384, 'steps': 34031, 'loss/train': 1.1946673393249512} +03/05/2022 05:27:34 - INFO - codeparrot_training - Skipping example with length 543 (seq_length=1024) +03/05/2022 05:27:39 - INFO - codeparrot_training - Step 34032: {'lr': 0.0004444022120213157, 'samples': 17424896, 'steps': 34032, 'loss/train': 2.417046546936035} +03/05/2022 05:27:42 - INFO - codeparrot_training - Step 34033: {'lr': 0.00044439887537080116, 'samples': 17425408, 'steps': 34033, 'loss/train': 1.494907259941101} +03/05/2022 05:27:42 - INFO - codeparrot_training - Skipping example with length 829 (seq_length=1024) +03/05/2022 05:27:47 - INFO - codeparrot_training - Step 34034: {'lr': 0.00044439553863269356, 'samples': 17425920, 'steps': 34034, 'loss/train': 0.11388105154037476} +03/05/2022 05:27:51 - INFO - codeparrot_training - Step 34035: {'lr': 0.00044439220180699434, 'samples': 17426432, 'steps': 34035, 'loss/train': 1.883411169052124} +03/05/2022 05:27:51 - INFO - codeparrot_training - Skipping example with length 81 (seq_length=1024) +03/05/2022 05:27:56 - INFO - codeparrot_training - Step 34036: {'lr': 0.00044438886489370493, 'samples': 17426944, 'steps': 34036, 'loss/train': 2.4596474170684814} +03/05/2022 05:27:59 - INFO - codeparrot_training - Skipping example with length 229 (seq_length=1024) +03/05/2022 05:28:01 - INFO - codeparrot_training - Step 34037: {'lr': 0.00044438552789282694, 'samples': 17427456, 'steps': 34037, 'loss/train': 1.4283480644226074} +03/05/2022 05:28:04 - INFO - codeparrot_training - Step 34038: {'lr': 0.00044438219080436184, 'samples': 17427968, 'steps': 34038, 'loss/train': 2.1580395698547363} +03/05/2022 05:28:07 - INFO - codeparrot_training - Skipping example with length 226 (seq_length=1024) +03/05/2022 05:28:10 - INFO - codeparrot_training - Step 34039: {'lr': 0.0004443788536283111, 'samples': 17428480, 'steps': 34039, 'loss/train': 1.7696539163589478} +03/05/2022 05:28:13 - INFO - codeparrot_training - Step 34040: {'lr': 0.0004443755163646762, 'samples': 17428992, 'steps': 34040, 'loss/train': 1.4342762231826782} +03/05/2022 05:28:15 - INFO - codeparrot_training - Skipping example with length 202 (seq_length=1024) +03/05/2022 05:28:18 - INFO - codeparrot_training - Step 34041: {'lr': 0.00044437217901345885, 'samples': 17429504, 'steps': 34041, 'loss/train': 1.6364816427230835} +03/05/2022 05:28:22 - INFO - codeparrot_training - Step 34042: {'lr': 0.0004443688415746602, 'samples': 17430016, 'steps': 34042, 'loss/train': 6.383542060852051} +03/05/2022 05:28:25 - INFO - codeparrot_training - Step 34043: {'lr': 0.00044436550404828207, 'samples': 17430528, 'steps': 34043, 'loss/train': 1.1378906965255737} +03/05/2022 05:28:25 - INFO - codeparrot_training - Skipping example with length 380 (seq_length=1024) +03/05/2022 05:28:30 - INFO - codeparrot_training - Step 34044: {'lr': 0.0004443621664343258, 'samples': 17431040, 'steps': 34044, 'loss/train': 2.4452288150787354} +03/05/2022 05:28:33 - INFO - codeparrot_training - Step 34045: {'lr': 0.000444358828732793, 'samples': 17431552, 'steps': 34045, 'loss/train': 1.940739631652832} +03/05/2022 05:28:34 - INFO - codeparrot_training - Skipping example with length 201 (seq_length=1024) +03/05/2022 05:28:38 - INFO - codeparrot_training - Step 34046: {'lr': 0.000444355490943685, 'samples': 17432064, 'steps': 34046, 'loss/train': 1.7151546478271484} +03/05/2022 05:28:42 - INFO - codeparrot_training - Step 34047: {'lr': 0.0004443521530670035, 'samples': 17432576, 'steps': 34047, 'loss/train': 1.630328893661499} +03/05/2022 05:28:42 - INFO - codeparrot_training - Skipping example with length 807 (seq_length=1024) +03/05/2022 05:28:47 - INFO - codeparrot_training - Step 34048: {'lr': 0.00044434881510274995, 'samples': 17433088, 'steps': 34048, 'loss/train': 0.8149397373199463} +03/05/2022 05:28:50 - INFO - codeparrot_training - Step 34049: {'lr': 0.00044434547705092574, 'samples': 17433600, 'steps': 34049, 'loss/train': 1.8687498569488525} +03/05/2022 05:28:51 - INFO - codeparrot_training - Skipping example with length 244 (seq_length=1024) +03/05/2022 05:28:55 - INFO - codeparrot_training - Step 34050: {'lr': 0.0004443421389115325, 'samples': 17434112, 'steps': 34050, 'loss/train': 1.3824677467346191} +03/05/2022 05:28:59 - INFO - codeparrot_training - Step 34051: {'lr': 0.00044433880068457166, 'samples': 17434624, 'steps': 34051, 'loss/train': 1.6641342639923096} +03/05/2022 05:28:59 - INFO - codeparrot_training - Skipping example with length 460 (seq_length=1024) +03/05/2022 05:29:04 - INFO - codeparrot_training - Step 34052: {'lr': 0.0004443354623700447, 'samples': 17435136, 'steps': 34052, 'loss/train': 1.1805343627929688} +03/05/2022 05:29:07 - INFO - codeparrot_training - Step 34053: {'lr': 0.0004443321239679533, 'samples': 17435648, 'steps': 34053, 'loss/train': 1.2358131408691406} +03/05/2022 05:29:08 - INFO - codeparrot_training - Skipping example with length 970 (seq_length=1024) +03/05/2022 05:29:12 - INFO - codeparrot_training - Step 34054: {'lr': 0.0004443287854782988, 'samples': 17436160, 'steps': 34054, 'loss/train': 3.921879768371582} +03/05/2022 05:29:15 - INFO - codeparrot_training - Step 34055: {'lr': 0.0004443254469010828, 'samples': 17436672, 'steps': 34055, 'loss/train': 1.191489338874817} +03/05/2022 05:29:16 - INFO - codeparrot_training - Skipping example with length 352 (seq_length=1024) +03/05/2022 05:29:21 - INFO - codeparrot_training - Step 34056: {'lr': 0.0004443221082363067, 'samples': 17437184, 'steps': 34056, 'loss/train': 2.0300021171569824} +03/05/2022 05:29:24 - INFO - codeparrot_training - Step 34057: {'lr': 0.000444318769483972, 'samples': 17437696, 'steps': 34057, 'loss/train': 0.5210140347480774} +03/05/2022 05:29:24 - INFO - codeparrot_training - Skipping example with length 745 (seq_length=1024) +03/05/2022 05:29:29 - INFO - codeparrot_training - Step 34058: {'lr': 0.0004443154306440803, 'samples': 17438208, 'steps': 34058, 'loss/train': 2.4055397510528564} +03/05/2022 05:29:32 - INFO - codeparrot_training - Step 34059: {'lr': 0.00044431209171663313, 'samples': 17438720, 'steps': 34059, 'loss/train': 2.0263545513153076} +03/05/2022 05:29:33 - INFO - codeparrot_training - Skipping example with length 605 (seq_length=1024) +03/05/2022 05:29:38 - INFO - codeparrot_training - Step 34060: {'lr': 0.00044430875270163185, 'samples': 17439232, 'steps': 34060, 'loss/train': 2.1843109130859375} +03/05/2022 05:29:41 - INFO - codeparrot_training - Step 34061: {'lr': 0.00044430541359907804, 'samples': 17439744, 'steps': 34061, 'loss/train': 2.376917600631714} +03/05/2022 05:29:41 - INFO - codeparrot_training - Skipping example with length 958 (seq_length=1024) +03/05/2022 05:29:46 - INFO - codeparrot_training - Step 34062: {'lr': 0.0004443020744089733, 'samples': 17440256, 'steps': 34062, 'loss/train': 2.157226800918579} +03/05/2022 05:29:49 - INFO - codeparrot_training - Step 34063: {'lr': 0.00044429873513131897, 'samples': 17440768, 'steps': 34063, 'loss/train': 1.7049163579940796} +03/05/2022 05:29:50 - INFO - codeparrot_training - Skipping example with length 42 (seq_length=1024) +03/05/2022 05:29:54 - INFO - codeparrot_training - Step 34064: {'lr': 0.00044429539576611664, 'samples': 17441280, 'steps': 34064, 'loss/train': 1.0562320947647095} +03/05/2022 05:29:58 - INFO - codeparrot_training - Step 34065: {'lr': 0.0004442920563133678, 'samples': 17441792, 'steps': 34065, 'loss/train': 1.3266373872756958} +03/05/2022 05:29:58 - INFO - codeparrot_training - Skipping example with length 321 (seq_length=1024) +03/05/2022 05:30:03 - INFO - codeparrot_training - Step 34066: {'lr': 0.000444288716773074, 'samples': 17442304, 'steps': 34066, 'loss/train': 1.7700921297073364} +03/05/2022 05:30:06 - INFO - codeparrot_training - Step 34067: {'lr': 0.00044428537714523664, 'samples': 17442816, 'steps': 34067, 'loss/train': 2.31009840965271} +03/05/2022 05:30:06 - INFO - codeparrot_training - Skipping example with length 539 (seq_length=1024) +03/05/2022 05:30:11 - INFO - codeparrot_training - Step 34068: {'lr': 0.00044428203742985734, 'samples': 17443328, 'steps': 34068, 'loss/train': 1.738326907157898} +03/05/2022 05:30:14 - INFO - codeparrot_training - Step 34069: {'lr': 0.0004442786976269375, 'samples': 17443840, 'steps': 34069, 'loss/train': 1.696182131767273} +03/05/2022 05:30:15 - INFO - codeparrot_training - Skipping example with length 107 (seq_length=1024) +03/05/2022 05:30:20 - INFO - codeparrot_training - Step 34070: {'lr': 0.0004442753577364788, 'samples': 17444352, 'steps': 34070, 'loss/train': 1.6762832403182983} +03/05/2022 05:30:23 - INFO - codeparrot_training - Step 34071: {'lr': 0.00044427201775848246, 'samples': 17444864, 'steps': 34071, 'loss/train': 2.6324005126953125} +03/05/2022 05:30:23 - INFO - codeparrot_training - Skipping example with length 391 (seq_length=1024) +03/05/2022 05:30:28 - INFO - codeparrot_training - Step 34072: {'lr': 0.0004442686776929502, 'samples': 17445376, 'steps': 34072, 'loss/train': 2.109015464782715} +03/05/2022 05:30:32 - INFO - codeparrot_training - Step 34073: {'lr': 0.0004442653375398835, 'samples': 17445888, 'steps': 34073, 'loss/train': 0.7658395171165466} +03/05/2022 05:30:32 - INFO - codeparrot_training - Skipping example with length 313 (seq_length=1024) +03/05/2022 05:30:37 - INFO - codeparrot_training - Step 34074: {'lr': 0.0004442619972992838, 'samples': 17446400, 'steps': 34074, 'loss/train': 1.2794744968414307} +03/05/2022 05:30:40 - INFO - codeparrot_training - Step 34075: {'lr': 0.00044425865697115266, 'samples': 17446912, 'steps': 34075, 'loss/train': 1.7137771844863892} +03/05/2022 05:30:41 - INFO - codeparrot_training - Skipping example with length 326 (seq_length=1024) +03/05/2022 05:30:45 - INFO - codeparrot_training - Step 34076: {'lr': 0.00044425531655549157, 'samples': 17447424, 'steps': 34076, 'loss/train': 3.111297369003296} +03/05/2022 05:30:48 - INFO - codeparrot_training - Step 34077: {'lr': 0.0004442519760523021, 'samples': 17447936, 'steps': 34077, 'loss/train': 1.9399579763412476} +03/05/2022 05:30:49 - INFO - codeparrot_training - Skipping example with length 314 (seq_length=1024) +03/05/2022 05:30:54 - INFO - codeparrot_training - Step 34078: {'lr': 0.00044424863546158554, 'samples': 17448448, 'steps': 34078, 'loss/train': 1.8226441144943237} +03/05/2022 05:30:57 - INFO - codeparrot_training - Step 34079: {'lr': 0.00044424529478334364, 'samples': 17448960, 'steps': 34079, 'loss/train': 1.540472149848938} +03/05/2022 05:30:57 - INFO - codeparrot_training - Skipping example with length 642 (seq_length=1024) +03/05/2022 05:31:02 - INFO - codeparrot_training - Step 34080: {'lr': 0.0004442419540175778, 'samples': 17449472, 'steps': 34080, 'loss/train': 1.758059024810791} +03/05/2022 05:31:05 - INFO - codeparrot_training - Step 34081: {'lr': 0.0004442386131642895, 'samples': 17449984, 'steps': 34081, 'loss/train': 1.5499799251556396} +03/05/2022 05:31:06 - INFO - codeparrot_training - Skipping example with length 250 (seq_length=1024) +03/05/2022 05:31:11 - INFO - codeparrot_training - Step 34082: {'lr': 0.0004442352722234803, 'samples': 17450496, 'steps': 34082, 'loss/train': 1.8947174549102783} +03/05/2022 05:31:14 - INFO - codeparrot_training - Step 34083: {'lr': 0.0004442319311951517, 'samples': 17451008, 'steps': 34083, 'loss/train': 1.7237558364868164} +03/05/2022 05:31:14 - INFO - codeparrot_training - Skipping example with length 924 (seq_length=1024) +03/05/2022 05:31:19 - INFO - codeparrot_training - Step 34084: {'lr': 0.00044422859007930515, 'samples': 17451520, 'steps': 34084, 'loss/train': 2.104606866836548} +03/05/2022 05:31:22 - INFO - codeparrot_training - Step 34085: {'lr': 0.00044422524887594223, 'samples': 17452032, 'steps': 34085, 'loss/train': 2.273200750350952} +03/05/2022 05:31:23 - INFO - codeparrot_training - Skipping example with length 548 (seq_length=1024) +03/05/2022 05:31:28 - INFO - codeparrot_training - Step 34086: {'lr': 0.0004442219075850644, 'samples': 17452544, 'steps': 34086, 'loss/train': 1.4440802335739136} +03/05/2022 05:31:31 - INFO - codeparrot_training - Step 34087: {'lr': 0.0004442185662066731, 'samples': 17453056, 'steps': 34087, 'loss/train': 1.655002474784851} +03/05/2022 05:31:31 - INFO - codeparrot_training - Skipping example with length 647 (seq_length=1024) +03/05/2022 05:31:36 - INFO - codeparrot_training - Step 34088: {'lr': 0.00044421522474077, 'samples': 17453568, 'steps': 34088, 'loss/train': 1.9454220533370972} +03/05/2022 05:31:39 - INFO - codeparrot_training - Step 34089: {'lr': 0.0004442118831873565, 'samples': 17454080, 'steps': 34089, 'loss/train': 0.9859744906425476} +03/05/2022 05:31:40 - INFO - codeparrot_training - Skipping example with length 686 (seq_length=1024) +03/05/2022 05:31:44 - INFO - codeparrot_training - Step 34090: {'lr': 0.00044420854154643413, 'samples': 17454592, 'steps': 34090, 'loss/train': 2.5611069202423096} +03/05/2022 05:31:48 - INFO - codeparrot_training - Step 34091: {'lr': 0.00044420519981800446, 'samples': 17455104, 'steps': 34091, 'loss/train': 1.5908671617507935} +03/05/2022 05:31:48 - INFO - codeparrot_training - Skipping example with length 282 (seq_length=1024) +03/05/2022 05:31:53 - INFO - codeparrot_training - Step 34092: {'lr': 0.0004442018580020688, 'samples': 17455616, 'steps': 34092, 'loss/train': 1.4729499816894531} +03/05/2022 05:31:56 - INFO - codeparrot_training - Step 34093: {'lr': 0.0004441985160986288, 'samples': 17456128, 'steps': 34093, 'loss/train': 1.5146385431289673} +03/05/2022 05:31:56 - INFO - codeparrot_training - Skipping example with length 565 (seq_length=1024) +03/05/2022 05:32:02 - INFO - codeparrot_training - Step 34094: {'lr': 0.00044419517410768594, 'samples': 17456640, 'steps': 34094, 'loss/train': 1.671014428138733} +03/05/2022 05:32:05 - INFO - codeparrot_training - Step 34095: {'lr': 0.0004441918320292418, 'samples': 17457152, 'steps': 34095, 'loss/train': 1.6886521577835083} +03/05/2022 05:32:05 - INFO - codeparrot_training - Skipping example with length 802 (seq_length=1024) +03/05/2022 05:32:10 - INFO - codeparrot_training - Step 34096: {'lr': 0.00044418848986329775, 'samples': 17457664, 'steps': 34096, 'loss/train': 1.3938440084457397} +03/05/2022 05:32:13 - INFO - codeparrot_training - Step 34097: {'lr': 0.0004441851476098554, 'samples': 17458176, 'steps': 34097, 'loss/train': 1.5952064990997314} +03/05/2022 05:32:13 - INFO - codeparrot_training - Skipping example with length 448 (seq_length=1024) +03/05/2022 05:32:18 - INFO - codeparrot_training - Step 34098: {'lr': 0.0004441818052689162, 'samples': 17458688, 'steps': 34098, 'loss/train': 2.0440635681152344} +03/05/2022 05:32:21 - INFO - codeparrot_training - Step 34099: {'lr': 0.0004441784628404817, 'samples': 17459200, 'steps': 34099, 'loss/train': 1.7776108980178833} +03/05/2022 05:32:22 - INFO - codeparrot_training - Skipping example with length 758 (seq_length=1024) +03/05/2022 05:32:27 - INFO - codeparrot_training - Step 34100: {'lr': 0.0004441751203245533, 'samples': 17459712, 'steps': 34100, 'loss/train': 1.8822574615478516} +03/05/2022 05:32:30 - INFO - codeparrot_training - Step 34101: {'lr': 0.0004441717777211327, 'samples': 17460224, 'steps': 34101, 'loss/train': 2.3708813190460205} +03/05/2022 05:32:30 - INFO - codeparrot_training - Skipping example with length 615 (seq_length=1024) +03/05/2022 05:32:35 - INFO - codeparrot_training - Step 34102: {'lr': 0.00044416843503022126, 'samples': 17460736, 'steps': 34102, 'loss/train': 0.9929918646812439} +03/05/2022 05:32:38 - INFO - codeparrot_training - Step 34103: {'lr': 0.00044416509225182044, 'samples': 17461248, 'steps': 34103, 'loss/train': 2.3612778186798096} +03/05/2022 05:32:38 - INFO - codeparrot_training - Skipping example with length 416 (seq_length=1024) +03/05/2022 05:32:43 - INFO - codeparrot_training - Step 34104: {'lr': 0.0004441617493859319, 'samples': 17461760, 'steps': 34104, 'loss/train': 1.6196959018707275} +03/05/2022 05:32:47 - INFO - codeparrot_training - Step 34105: {'lr': 0.0004441584064325571, 'samples': 17462272, 'steps': 34105, 'loss/train': 1.9568370580673218} +03/05/2022 05:32:47 - INFO - codeparrot_training - Skipping example with length 791 (seq_length=1024) +03/05/2022 05:32:52 - INFO - codeparrot_training - Step 34106: {'lr': 0.0004441550633916975, 'samples': 17462784, 'steps': 34106, 'loss/train': 0.5889873504638672} +03/05/2022 05:32:55 - INFO - codeparrot_training - Step 34107: {'lr': 0.0004441517202633546, 'samples': 17463296, 'steps': 34107, 'loss/train': 0.9713134765625} +03/05/2022 05:33:00 - INFO - codeparrot_training - Step 34108: {'lr': 0.0004441483770475299, 'samples': 17463808, 'steps': 34108, 'loss/train': 2.0026438236236572} +03/05/2022 05:33:03 - INFO - codeparrot_training - Skipping example with length 164 (seq_length=1024) +03/05/2022 05:33:06 - INFO - codeparrot_training - Step 34109: {'lr': 0.000444145033744225, 'samples': 17464320, 'steps': 34109, 'loss/train': 2.3801803588867188} +03/05/2022 05:33:09 - INFO - codeparrot_training - Step 34110: {'lr': 0.0004441416903534413, 'samples': 17464832, 'steps': 34110, 'loss/train': 1.7913153171539307} +03/05/2022 05:33:12 - INFO - codeparrot_training - Skipping example with length 514 (seq_length=1024) +03/05/2022 05:33:14 - INFO - codeparrot_training - Step 34111: {'lr': 0.00044413834687518034, 'samples': 17465344, 'steps': 34111, 'loss/train': 1.6845449209213257} +03/05/2022 05:33:17 - INFO - codeparrot_training - Step 34112: {'lr': 0.00044413500330944366, 'samples': 17465856, 'steps': 34112, 'loss/train': 2.147451162338257} +03/05/2022 05:33:21 - INFO - codeparrot_training - Step 34113: {'lr': 0.00044413165965623275, 'samples': 17466368, 'steps': 34113, 'loss/train': 2.1855807304382324} +03/05/2022 05:33:21 - INFO - codeparrot_training - Skipping example with length 805 (seq_length=1024) +03/05/2022 05:33:26 - INFO - codeparrot_training - Step 34114: {'lr': 0.00044412831591554916, 'samples': 17466880, 'steps': 34114, 'loss/train': 2.339319944381714} +03/05/2022 05:33:29 - INFO - codeparrot_training - Step 34115: {'lr': 0.0004441249720873942, 'samples': 17467392, 'steps': 34115, 'loss/train': 1.0943936109542847} +03/05/2022 05:33:29 - INFO - codeparrot_training - Skipping example with length 669 (seq_length=1024) +03/05/2022 05:33:34 - INFO - codeparrot_training - Step 34116: {'lr': 0.00044412162817176966, 'samples': 17467904, 'steps': 34116, 'loss/train': 1.85038423538208} +03/05/2022 05:33:37 - INFO - codeparrot_training - Skipping example with length 847 (seq_length=1024) +03/05/2022 05:33:40 - INFO - codeparrot_training - Step 34117: {'lr': 0.00044411828416867684, 'samples': 17468416, 'steps': 34117, 'loss/train': 1.950211524963379} +03/05/2022 05:33:43 - INFO - codeparrot_training - Step 34118: {'lr': 0.00044411494007811736, 'samples': 17468928, 'steps': 34118, 'loss/train': 0.8425441384315491} +03/05/2022 05:33:46 - INFO - codeparrot_training - Skipping example with length 50 (seq_length=1024) +03/05/2022 05:33:48 - INFO - codeparrot_training - Step 34119: {'lr': 0.00044411159590009263, 'samples': 17469440, 'steps': 34119, 'loss/train': 1.7786281108856201} +03/05/2022 05:33:52 - INFO - codeparrot_training - Step 34120: {'lr': 0.0004441082516346043, 'samples': 17469952, 'steps': 34120, 'loss/train': 2.330460548400879} +03/05/2022 05:33:54 - INFO - codeparrot_training - Skipping example with length 878 (seq_length=1024) +03/05/2022 05:33:57 - INFO - codeparrot_training - Step 34121: {'lr': 0.0004441049072816537, 'samples': 17470464, 'steps': 34121, 'loss/train': 1.8122012615203857} +03/05/2022 05:34:00 - INFO - codeparrot_training - Step 34122: {'lr': 0.0004441015628412425, 'samples': 17470976, 'steps': 34122, 'loss/train': 1.9550861120224} +03/05/2022 05:34:02 - INFO - codeparrot_training - Skipping example with length 685 (seq_length=1024) +03/05/2022 05:34:05 - INFO - codeparrot_training - Step 34123: {'lr': 0.0004440982183133721, 'samples': 17471488, 'steps': 34123, 'loss/train': 1.4404162168502808} +03/05/2022 05:34:08 - INFO - codeparrot_training - Step 34124: {'lr': 0.00044409487369804395, 'samples': 17472000, 'steps': 34124, 'loss/train': 1.7190989255905151} +03/05/2022 05:34:11 - INFO - codeparrot_training - Skipping example with length 298 (seq_length=1024) +03/05/2022 05:34:14 - INFO - codeparrot_training - Step 34125: {'lr': 0.00044409152899525973, 'samples': 17472512, 'steps': 34125, 'loss/train': 1.7323949337005615} +03/05/2022 05:34:17 - INFO - codeparrot_training - Step 34126: {'lr': 0.00044408818420502085, 'samples': 17473024, 'steps': 34126, 'loss/train': 0.8039728999137878} +03/05/2022 05:34:19 - INFO - codeparrot_training - Skipping example with length 1017 (seq_length=1024) +03/05/2022 05:34:22 - INFO - codeparrot_training - Step 34127: {'lr': 0.00044408483932732886, 'samples': 17473536, 'steps': 34127, 'loss/train': 2.007296085357666} +03/05/2022 05:34:25 - INFO - codeparrot_training - Step 34128: {'lr': 0.00044408149436218523, 'samples': 17474048, 'steps': 34128, 'loss/train': 1.5064901113510132} +03/05/2022 05:34:28 - INFO - codeparrot_training - Skipping example with length 438 (seq_length=1024) +03/05/2022 05:34:31 - INFO - codeparrot_training - Step 34129: {'lr': 0.00044407814930959137, 'samples': 17474560, 'steps': 34129, 'loss/train': 1.8547723293304443} +03/05/2022 05:34:34 - INFO - codeparrot_training - Step 34130: {'lr': 0.000444074804169549, 'samples': 17475072, 'steps': 34130, 'loss/train': 1.7464185953140259} +03/05/2022 05:34:36 - INFO - codeparrot_training - Skipping example with length 353 (seq_length=1024) +03/05/2022 05:34:39 - INFO - codeparrot_training - Step 34131: {'lr': 0.00044407145894205947, 'samples': 17475584, 'steps': 34131, 'loss/train': 2.269740581512451} +03/05/2022 05:34:42 - INFO - codeparrot_training - Step 34132: {'lr': 0.0004440681136271244, 'samples': 17476096, 'steps': 34132, 'loss/train': 2.106044054031372} +03/05/2022 05:34:45 - INFO - codeparrot_training - Skipping example with length 302 (seq_length=1024) +03/05/2022 05:34:47 - INFO - codeparrot_training - Step 34133: {'lr': 0.0004440647682247452, 'samples': 17476608, 'steps': 34133, 'loss/train': 1.6214338541030884} +03/05/2022 05:34:51 - INFO - codeparrot_training - Step 34134: {'lr': 0.00044406142273492334, 'samples': 17477120, 'steps': 34134, 'loss/train': 1.1986275911331177} +03/05/2022 05:34:53 - INFO - codeparrot_training - Skipping example with length 748 (seq_length=1024) +03/05/2022 05:34:56 - INFO - codeparrot_training - Step 34135: {'lr': 0.00044405807715766047, 'samples': 17477632, 'steps': 34135, 'loss/train': 0.2201683670282364} +03/05/2022 05:34:59 - INFO - codeparrot_training - Step 34136: {'lr': 0.00044405473149295804, 'samples': 17478144, 'steps': 34136, 'loss/train': 2.3020589351654053} +03/05/2022 05:35:01 - INFO - codeparrot_training - Skipping example with length 325 (seq_length=1024) +03/05/2022 05:35:04 - INFO - codeparrot_training - Step 34137: {'lr': 0.0004440513857408175, 'samples': 17478656, 'steps': 34137, 'loss/train': 1.0189393758773804} +03/05/2022 05:35:07 - INFO - codeparrot_training - Step 34138: {'lr': 0.0004440480399012404, 'samples': 17479168, 'steps': 34138, 'loss/train': 1.8139852285385132} +03/05/2022 05:35:09 - INFO - codeparrot_training - Skipping example with length 307 (seq_length=1024) +03/05/2022 05:35:13 - INFO - codeparrot_training - Step 34139: {'lr': 0.00044404469397422823, 'samples': 17479680, 'steps': 34139, 'loss/train': 1.9736565351486206} +03/05/2022 05:35:16 - INFO - codeparrot_training - Step 34140: {'lr': 0.00044404134795978257, 'samples': 17480192, 'steps': 34140, 'loss/train': 1.5291110277175903} +03/05/2022 05:35:17 - INFO - codeparrot_training - Skipping example with length 666 (seq_length=1024) +03/05/2022 05:35:21 - INFO - codeparrot_training - Step 34141: {'lr': 0.0004440380018579049, 'samples': 17480704, 'steps': 34141, 'loss/train': 1.5795916318893433} +03/05/2022 05:35:24 - INFO - codeparrot_training - Step 34142: {'lr': 0.00044403465566859656, 'samples': 17481216, 'steps': 34142, 'loss/train': 2.210779905319214} +03/05/2022 05:35:26 - INFO - codeparrot_training - Skipping example with length 524 (seq_length=1024) +03/05/2022 05:35:29 - INFO - codeparrot_training - Step 34143: {'lr': 0.0004440313093918593, 'samples': 17481728, 'steps': 34143, 'loss/train': 1.5776442289352417} +03/05/2022 05:35:33 - INFO - codeparrot_training - Step 34144: {'lr': 0.00044402796302769453, 'samples': 17482240, 'steps': 34144, 'loss/train': 1.3823585510253906} +03/05/2022 05:35:34 - INFO - codeparrot_training - Skipping example with length 560 (seq_length=1024) +03/05/2022 05:35:38 - INFO - codeparrot_training - Step 34145: {'lr': 0.0004440246165761037, 'samples': 17482752, 'steps': 34145, 'loss/train': 0.8426879048347473} +03/05/2022 05:35:41 - INFO - codeparrot_training - Step 34146: {'lr': 0.00044402127003708846, 'samples': 17483264, 'steps': 34146, 'loss/train': 2.297863006591797} +03/05/2022 05:35:42 - INFO - codeparrot_training - Skipping example with length 917 (seq_length=1024) +03/05/2022 05:35:47 - INFO - codeparrot_training - Step 34147: {'lr': 0.0004440179234106502, 'samples': 17483776, 'steps': 34147, 'loss/train': 5.218173980712891} +03/05/2022 05:35:50 - INFO - codeparrot_training - Step 34148: {'lr': 0.00044401457669679043, 'samples': 17484288, 'steps': 34148, 'loss/train': 1.0703234672546387} +03/05/2022 05:35:52 - INFO - codeparrot_training - Skipping example with length 783 (seq_length=1024) +03/05/2022 05:35:55 - INFO - codeparrot_training - Step 34149: {'lr': 0.0004440112298955107, 'samples': 17484800, 'steps': 34149, 'loss/train': 1.0748257637023926} +03/05/2022 05:35:58 - INFO - codeparrot_training - Step 34150: {'lr': 0.0004440078830068125, 'samples': 17485312, 'steps': 34150, 'loss/train': 1.4391534328460693} +03/05/2022 05:36:00 - INFO - codeparrot_training - Skipping example with length 535 (seq_length=1024) +03/05/2022 05:36:03 - INFO - codeparrot_training - Step 34151: {'lr': 0.00044400453603069727, 'samples': 17485824, 'steps': 34151, 'loss/train': 0.8661510348320007} +03/05/2022 05:36:07 - INFO - codeparrot_training - Step 34152: {'lr': 0.0004440011889671667, 'samples': 17486336, 'steps': 34152, 'loss/train': 1.792608618736267} +03/05/2022 05:36:08 - INFO - codeparrot_training - Skipping example with length 258 (seq_length=1024) +03/05/2022 05:36:12 - INFO - codeparrot_training - Step 34153: {'lr': 0.00044399784181622216, 'samples': 17486848, 'steps': 34153, 'loss/train': 2.131106376647949} +03/05/2022 05:36:15 - INFO - codeparrot_training - Step 34154: {'lr': 0.0004439944945778651, 'samples': 17487360, 'steps': 34154, 'loss/train': 1.5413190126419067} +03/05/2022 05:36:17 - INFO - codeparrot_training - Skipping example with length 872 (seq_length=1024) +03/05/2022 05:36:20 - INFO - codeparrot_training - Step 34155: {'lr': 0.0004439911472520972, 'samples': 17487872, 'steps': 34155, 'loss/train': 1.3426002264022827} +03/05/2022 05:36:23 - INFO - codeparrot_training - Step 34156: {'lr': 0.0004439877998389199, 'samples': 17488384, 'steps': 34156, 'loss/train': 1.57003915309906} +03/05/2022 05:36:25 - INFO - codeparrot_training - Skipping example with length 736 (seq_length=1024) +03/05/2022 05:36:29 - INFO - codeparrot_training - Step 34157: {'lr': 0.0004439844523383346, 'samples': 17488896, 'steps': 34157, 'loss/train': 1.2894264459609985} +03/05/2022 05:36:32 - INFO - codeparrot_training - Step 34158: {'lr': 0.000443981104750343, 'samples': 17489408, 'steps': 34158, 'loss/train': 0.39746251702308655} +03/05/2022 05:36:34 - INFO - codeparrot_training - Skipping example with length 500 (seq_length=1024) +03/05/2022 05:36:37 - INFO - codeparrot_training - Step 34159: {'lr': 0.0004439777570749465, 'samples': 17489920, 'steps': 34159, 'loss/train': 0.6969925165176392} +03/05/2022 05:36:40 - INFO - codeparrot_training - Step 34160: {'lr': 0.0004439744093121465, 'samples': 17490432, 'steps': 34160, 'loss/train': 1.8490140438079834} +03/05/2022 05:36:42 - INFO - codeparrot_training - Skipping example with length 437 (seq_length=1024) +03/05/2022 05:36:46 - INFO - codeparrot_training - Step 34161: {'lr': 0.00044397106146194473, 'samples': 17490944, 'steps': 34161, 'loss/train': 0.4180835485458374} +03/05/2022 05:36:49 - INFO - codeparrot_training - Step 34162: {'lr': 0.00044396771352434256, 'samples': 17491456, 'steps': 34162, 'loss/train': 1.2257460355758667} +03/05/2022 05:36:52 - INFO - codeparrot_training - Skipping example with length 807 (seq_length=1024) +03/05/2022 05:36:54 - INFO - codeparrot_training - Step 34163: {'lr': 0.00044396436549934155, 'samples': 17491968, 'steps': 34163, 'loss/train': 1.9260871410369873} +03/05/2022 05:36:58 - INFO - codeparrot_training - Step 34164: {'lr': 0.00044396101738694316, 'samples': 17492480, 'steps': 34164, 'loss/train': 1.8775568008422852} +03/05/2022 05:37:01 - INFO - codeparrot_training - Step 34165: {'lr': 0.000443957669187149, 'samples': 17492992, 'steps': 34165, 'loss/train': 1.9550294876098633} +03/05/2022 05:37:01 - INFO - codeparrot_training - Skipping example with length 742 (seq_length=1024) +03/05/2022 05:37:06 - INFO - codeparrot_training - Step 34166: {'lr': 0.0004439543208999604, 'samples': 17493504, 'steps': 34166, 'loss/train': 2.0865559577941895} +03/05/2022 05:37:10 - INFO - codeparrot_training - Step 34167: {'lr': 0.00044395097252537905, 'samples': 17494016, 'steps': 34167, 'loss/train': 0.9504692554473877} +03/05/2022 05:37:11 - INFO - codeparrot_training - Skipping example with length 687 (seq_length=1024) +03/05/2022 05:37:15 - INFO - codeparrot_training - Step 34168: {'lr': 0.0004439476240634064, 'samples': 17494528, 'steps': 34168, 'loss/train': 2.2714765071868896} +03/05/2022 05:37:18 - INFO - codeparrot_training - Step 34169: {'lr': 0.00044394427551404386, 'samples': 17495040, 'steps': 34169, 'loss/train': 1.9800372123718262} +03/05/2022 05:37:19 - INFO - codeparrot_training - Skipping example with length 935 (seq_length=1024) +03/05/2022 05:37:23 - INFO - codeparrot_training - Step 34170: {'lr': 0.00044394092687729305, 'samples': 17495552, 'steps': 34170, 'loss/train': 1.8309171199798584} +03/05/2022 05:37:26 - INFO - codeparrot_training - Step 34171: {'lr': 0.0004439375781531555, 'samples': 17496064, 'steps': 34171, 'loss/train': 2.181962728500366} +03/05/2022 05:37:28 - INFO - codeparrot_training - Skipping example with length 270 (seq_length=1024) +03/05/2022 05:37:31 - INFO - codeparrot_training - Step 34172: {'lr': 0.00044393422934163265, 'samples': 17496576, 'steps': 34172, 'loss/train': 1.0602643489837646} +03/05/2022 05:37:35 - INFO - codeparrot_training - Step 34173: {'lr': 0.000443930880442726, 'samples': 17497088, 'steps': 34173, 'loss/train': 1.1460702419281006} +03/05/2022 05:37:36 - INFO - codeparrot_training - Skipping example with length 272 (seq_length=1024) +03/05/2022 05:37:40 - INFO - codeparrot_training - Step 34174: {'lr': 0.0004439275314564371, 'samples': 17497600, 'steps': 34174, 'loss/train': 1.664525032043457} +03/05/2022 05:37:43 - INFO - codeparrot_training - Step 34175: {'lr': 0.0004439241823827674, 'samples': 17498112, 'steps': 34175, 'loss/train': 2.226043224334717} +03/05/2022 05:37:45 - INFO - codeparrot_training - Skipping example with length 13 (seq_length=1024) +03/05/2022 05:37:48 - INFO - codeparrot_training - Step 34176: {'lr': 0.0004439208332217186, 'samples': 17498624, 'steps': 34176, 'loss/train': 1.8547481298446655} +03/05/2022 05:37:52 - INFO - codeparrot_training - Step 34177: {'lr': 0.00044391748397329194, 'samples': 17499136, 'steps': 34177, 'loss/train': 2.1341235637664795} +03/05/2022 05:37:53 - INFO - codeparrot_training - Skipping example with length 614 (seq_length=1024) +03/05/2022 05:37:57 - INFO - codeparrot_training - Step 34178: {'lr': 0.0004439141346374891, 'samples': 17499648, 'steps': 34178, 'loss/train': 5.807307720184326} +03/05/2022 05:38:00 - INFO - codeparrot_training - Step 34179: {'lr': 0.0004439107852143115, 'samples': 17500160, 'steps': 34179, 'loss/train': 1.5781409740447998} +03/05/2022 05:38:02 - INFO - codeparrot_training - Skipping example with length 755 (seq_length=1024) +03/05/2022 05:38:05 - INFO - codeparrot_training - Step 34180: {'lr': 0.0004439074357037607, 'samples': 17500672, 'steps': 34180, 'loss/train': 2.3529586791992188} +03/05/2022 05:38:09 - INFO - codeparrot_training - Step 34181: {'lr': 0.0004439040861058383, 'samples': 17501184, 'steps': 34181, 'loss/train': 2.0639467239379883} +03/05/2022 05:38:11 - INFO - codeparrot_training - Skipping example with length 239 (seq_length=1024) +03/05/2022 05:38:14 - INFO - codeparrot_training - Step 34182: {'lr': 0.00044390073642054564, 'samples': 17501696, 'steps': 34182, 'loss/train': 1.917283296585083} +03/05/2022 05:38:17 - INFO - codeparrot_training - Step 34183: {'lr': 0.00044389738664788424, 'samples': 17502208, 'steps': 34183, 'loss/train': 1.2364617586135864} +03/05/2022 05:38:19 - INFO - codeparrot_training - Skipping example with length 225 (seq_length=1024) +03/05/2022 05:38:22 - INFO - codeparrot_training - Step 34184: {'lr': 0.00044389403678785576, 'samples': 17502720, 'steps': 34184, 'loss/train': 1.7462048530578613} +03/05/2022 05:38:25 - INFO - codeparrot_training - Step 34185: {'lr': 0.0004438906868404616, 'samples': 17503232, 'steps': 34185, 'loss/train': 2.254133939743042} +03/05/2022 05:38:27 - INFO - codeparrot_training - Skipping example with length 532 (seq_length=1024) +03/05/2022 05:38:31 - INFO - codeparrot_training - Step 34186: {'lr': 0.00044388733680570324, 'samples': 17503744, 'steps': 34186, 'loss/train': 1.0031273365020752} +03/05/2022 05:38:34 - INFO - codeparrot_training - Step 34187: {'lr': 0.00044388398668358234, 'samples': 17504256, 'steps': 34187, 'loss/train': 1.5295847654342651} +03/05/2022 05:38:35 - INFO - codeparrot_training - Skipping example with length 91 (seq_length=1024) +03/05/2022 05:38:39 - INFO - codeparrot_training - Step 34188: {'lr': 0.00044388063647410016, 'samples': 17504768, 'steps': 34188, 'loss/train': 1.9227910041809082} +03/05/2022 05:38:42 - INFO - codeparrot_training - Step 34189: {'lr': 0.00044387728617725845, 'samples': 17505280, 'steps': 34189, 'loss/train': 2.4586002826690674} +03/05/2022 05:38:44 - INFO - codeparrot_training - Skipping example with length 245 (seq_length=1024) +03/05/2022 05:38:48 - INFO - codeparrot_training - Step 34190: {'lr': 0.0004438739357930586, 'samples': 17505792, 'steps': 34190, 'loss/train': 2.033339023590088} +03/05/2022 05:38:51 - INFO - codeparrot_training - Step 34191: {'lr': 0.00044387058532150217, 'samples': 17506304, 'steps': 34191, 'loss/train': 1.110052227973938} +03/05/2022 05:38:52 - INFO - codeparrot_training - Skipping example with length 606 (seq_length=1024) +03/05/2022 05:38:56 - INFO - codeparrot_training - Step 34192: {'lr': 0.0004438672347625907, 'samples': 17506816, 'steps': 34192, 'loss/train': 1.0906049013137817} +03/05/2022 05:38:59 - INFO - codeparrot_training - Step 34193: {'lr': 0.0004438638841163255, 'samples': 17507328, 'steps': 34193, 'loss/train': 1.8400697708129883} +03/05/2022 05:39:00 - INFO - codeparrot_training - Skipping example with length 176 (seq_length=1024) +03/05/2022 05:39:04 - INFO - codeparrot_training - Step 34194: {'lr': 0.0004438605333827083, 'samples': 17507840, 'steps': 34194, 'loss/train': 1.9471436738967896} +03/05/2022 05:39:08 - INFO - codeparrot_training - Step 34195: {'lr': 0.00044385718256174055, 'samples': 17508352, 'steps': 34195, 'loss/train': 1.6939191818237305} +03/05/2022 05:39:09 - INFO - codeparrot_training - Skipping example with length 670 (seq_length=1024) +03/05/2022 05:39:13 - INFO - codeparrot_training - Step 34196: {'lr': 0.0004438538316534237, 'samples': 17508864, 'steps': 34196, 'loss/train': 2.4373652935028076} +03/05/2022 05:39:16 - INFO - codeparrot_training - Step 34197: {'lr': 0.0004438504806577594, 'samples': 17509376, 'steps': 34197, 'loss/train': 1.7957028150558472} +03/05/2022 05:39:17 - INFO - codeparrot_training - Skipping example with length 901 (seq_length=1024) +03/05/2022 05:39:21 - INFO - codeparrot_training - Step 34198: {'lr': 0.000443847129574749, 'samples': 17509888, 'steps': 34198, 'loss/train': 0.06292540580034256} +03/05/2022 05:39:25 - INFO - codeparrot_training - Step 34199: {'lr': 0.0004438437784043941, 'samples': 17510400, 'steps': 34199, 'loss/train': 1.7774512767791748} +03/05/2022 05:39:26 - INFO - codeparrot_training - Skipping example with length 438 (seq_length=1024) +03/05/2022 05:39:30 - INFO - codeparrot_training - Step 34200: {'lr': 0.00044384042714669614, 'samples': 17510912, 'steps': 34200, 'loss/train': 1.7547448873519897} +03/05/2022 05:39:33 - INFO - codeparrot_training - Step 34201: {'lr': 0.0004438370758016567, 'samples': 17511424, 'steps': 34201, 'loss/train': 1.7959250211715698} +03/05/2022 05:39:34 - INFO - codeparrot_training - Skipping example with length 743 (seq_length=1024) +03/05/2022 05:39:38 - INFO - codeparrot_training - Step 34202: {'lr': 0.00044383372436927727, 'samples': 17511936, 'steps': 34202, 'loss/train': 2.1022074222564697} +03/05/2022 05:39:41 - INFO - codeparrot_training - Step 34203: {'lr': 0.00044383037284955937, 'samples': 17512448, 'steps': 34203, 'loss/train': 1.398281455039978} +03/05/2022 05:39:42 - INFO - codeparrot_training - Skipping example with length 800 (seq_length=1024) +03/05/2022 05:39:47 - INFO - codeparrot_training - Step 34204: {'lr': 0.00044382702124250444, 'samples': 17512960, 'steps': 34204, 'loss/train': 1.6356000900268555} +03/05/2022 05:39:50 - INFO - codeparrot_training - Step 34205: {'lr': 0.0004438236695481141, 'samples': 17513472, 'steps': 34205, 'loss/train': 1.6093099117279053} +03/05/2022 05:39:51 - INFO - codeparrot_training - Skipping example with length 757 (seq_length=1024) +03/05/2022 05:39:55 - INFO - codeparrot_training - Step 34206: {'lr': 0.00044382031776638974, 'samples': 17513984, 'steps': 34206, 'loss/train': 1.7206929922103882} +03/05/2022 05:39:59 - INFO - codeparrot_training - Step 34207: {'lr': 0.000443816965897333, 'samples': 17514496, 'steps': 34207, 'loss/train': 0.7779200673103333} +03/05/2022 05:39:59 - INFO - codeparrot_training - Skipping example with length 742 (seq_length=1024) +03/05/2022 05:40:04 - INFO - codeparrot_training - Step 34208: {'lr': 0.0004438136139409453, 'samples': 17515008, 'steps': 34208, 'loss/train': 1.8553944826126099} +03/05/2022 05:40:07 - INFO - codeparrot_training - Step 34209: {'lr': 0.00044381026189722824, 'samples': 17515520, 'steps': 34209, 'loss/train': 0.8115091323852539} +03/05/2022 05:40:08 - INFO - codeparrot_training - Skipping example with length 40 (seq_length=1024) +03/05/2022 05:40:12 - INFO - codeparrot_training - Step 34210: {'lr': 0.0004438069097661832, 'samples': 17516032, 'steps': 34210, 'loss/train': 2.2580177783966064} +03/05/2022 05:40:15 - INFO - codeparrot_training - Step 34211: {'lr': 0.0004438035575478118, 'samples': 17516544, 'steps': 34211, 'loss/train': 1.4521112442016602} +03/05/2022 05:40:16 - INFO - codeparrot_training - Skipping example with length 547 (seq_length=1024) +03/05/2022 05:40:21 - INFO - codeparrot_training - Step 34212: {'lr': 0.0004438002052421154, 'samples': 17517056, 'steps': 34212, 'loss/train': 1.8690000772476196} +03/05/2022 05:40:24 - INFO - codeparrot_training - Step 34213: {'lr': 0.00044379685284909575, 'samples': 17517568, 'steps': 34213, 'loss/train': 1.5044785737991333} +03/05/2022 05:40:24 - INFO - codeparrot_training - Skipping example with length 292 (seq_length=1024) +03/05/2022 05:40:29 - INFO - codeparrot_training - Step 34214: {'lr': 0.00044379350036875413, 'samples': 17518080, 'steps': 34214, 'loss/train': 1.6928565502166748} +03/05/2022 05:40:32 - INFO - codeparrot_training - Step 34215: {'lr': 0.00044379014780109217, 'samples': 17518592, 'steps': 34215, 'loss/train': 1.7167913913726807} +03/05/2022 05:40:33 - INFO - codeparrot_training - Skipping example with length 966 (seq_length=1024) +03/05/2022 05:40:38 - INFO - codeparrot_training - Step 34216: {'lr': 0.00044378679514611144, 'samples': 17519104, 'steps': 34216, 'loss/train': 1.9740239381790161} +03/05/2022 05:40:41 - INFO - codeparrot_training - Step 34217: {'lr': 0.0004437834424038133, 'samples': 17519616, 'steps': 34217, 'loss/train': 1.097809910774231} +03/05/2022 05:40:41 - INFO - codeparrot_training - Skipping example with length 517 (seq_length=1024) +03/05/2022 05:40:46 - INFO - codeparrot_training - Step 34218: {'lr': 0.00044378008957419936, 'samples': 17520128, 'steps': 34218, 'loss/train': 2.2368226051330566} +03/05/2022 05:40:49 - INFO - codeparrot_training - Step 34219: {'lr': 0.00044377673665727105, 'samples': 17520640, 'steps': 34219, 'loss/train': 1.9591455459594727} +03/05/2022 05:40:49 - INFO - codeparrot_training - Skipping example with length 238 (seq_length=1024) +03/05/2022 05:40:54 - INFO - codeparrot_training - Step 34220: {'lr': 0.00044377338365303, 'samples': 17521152, 'steps': 34220, 'loss/train': 1.9518258571624756} +03/05/2022 05:40:58 - INFO - codeparrot_training - Step 34221: {'lr': 0.00044377003056147757, 'samples': 17521664, 'steps': 34221, 'loss/train': 0.06462162733078003} +03/05/2022 05:40:58 - INFO - codeparrot_training - Skipping example with length 1013 (seq_length=1024) +03/05/2022 05:41:03 - INFO - codeparrot_training - Step 34222: {'lr': 0.00044376667738261545, 'samples': 17522176, 'steps': 34222, 'loss/train': 0.47106412053108215} +03/05/2022 05:41:06 - INFO - codeparrot_training - Step 34223: {'lr': 0.000443763324116445, 'samples': 17522688, 'steps': 34223, 'loss/train': 1.8936957120895386} +03/05/2022 05:41:06 - INFO - codeparrot_training - Skipping example with length 303 (seq_length=1024) +03/05/2022 05:41:12 - INFO - codeparrot_training - Step 34224: {'lr': 0.00044375997076296774, 'samples': 17523200, 'steps': 34224, 'loss/train': 1.8771260976791382} +03/05/2022 05:41:15 - INFO - codeparrot_training - Step 34225: {'lr': 0.0004437566173221853, 'samples': 17523712, 'steps': 34225, 'loss/train': 2.251481056213379} +03/05/2022 05:41:15 - INFO - codeparrot_training - Skipping example with length 756 (seq_length=1024) +03/05/2022 05:41:20 - INFO - codeparrot_training - Step 34226: {'lr': 0.0004437532637940991, 'samples': 17524224, 'steps': 34226, 'loss/train': 1.5564502477645874} +03/05/2022 05:41:23 - INFO - codeparrot_training - Skipping example with length 557 (seq_length=1024) +03/05/2022 05:41:25 - INFO - codeparrot_training - Step 34227: {'lr': 0.0004437499101787107, 'samples': 17524736, 'steps': 34227, 'loss/train': 1.6151272058486938} +03/05/2022 05:41:28 - INFO - codeparrot_training - Step 34228: {'lr': 0.00044374655647602153, 'samples': 17525248, 'steps': 34228, 'loss/train': 1.7380579710006714} +03/05/2022 05:41:31 - INFO - codeparrot_training - Skipping example with length 498 (seq_length=1024) +03/05/2022 05:41:34 - INFO - codeparrot_training - Step 34229: {'lr': 0.0004437432026860332, 'samples': 17525760, 'steps': 34229, 'loss/train': 0.642063558101654} +03/05/2022 05:41:37 - INFO - codeparrot_training - Step 34230: {'lr': 0.00044373984880874705, 'samples': 17526272, 'steps': 34230, 'loss/train': 2.1146881580352783} +03/05/2022 05:41:39 - INFO - codeparrot_training - Skipping example with length 262 (seq_length=1024) +03/05/2022 05:41:42 - INFO - codeparrot_training - Step 34231: {'lr': 0.0004437364948441649, 'samples': 17526784, 'steps': 34231, 'loss/train': 1.0028339624404907} +03/05/2022 05:41:45 - INFO - codeparrot_training - Step 34232: {'lr': 0.00044373314079228796, 'samples': 17527296, 'steps': 34232, 'loss/train': 1.3107696771621704} +03/05/2022 05:41:49 - INFO - codeparrot_training - Step 34233: {'lr': 0.0004437297866531179, 'samples': 17527808, 'steps': 34233, 'loss/train': 1.8322502374649048} +03/05/2022 05:41:49 - INFO - codeparrot_training - Skipping example with length 165 (seq_length=1024) +03/05/2022 05:41:54 - INFO - codeparrot_training - Step 34234: {'lr': 0.0004437264324266561, 'samples': 17528320, 'steps': 34234, 'loss/train': 0.8838863968849182} +03/05/2022 05:41:57 - INFO - codeparrot_training - Step 34235: {'lr': 0.00044372307811290425, 'samples': 17528832, 'steps': 34235, 'loss/train': 2.091601848602295} +03/05/2022 05:41:57 - INFO - codeparrot_training - Skipping example with length 706 (seq_length=1024) +03/05/2022 05:42:02 - INFO - codeparrot_training - Step 34236: {'lr': 0.00044371972371186374, 'samples': 17529344, 'steps': 34236, 'loss/train': 0.8373674750328064} +03/05/2022 05:42:05 - INFO - codeparrot_training - Step 34237: {'lr': 0.0004437163692235361, 'samples': 17529856, 'steps': 34237, 'loss/train': 1.7728911638259888} +03/05/2022 05:42:06 - INFO - codeparrot_training - Skipping example with length 500 (seq_length=1024) +03/05/2022 05:42:11 - INFO - codeparrot_training - Step 34238: {'lr': 0.0004437130146479229, 'samples': 17530368, 'steps': 34238, 'loss/train': 1.5088465213775635} +03/05/2022 05:42:14 - INFO - codeparrot_training - Step 34239: {'lr': 0.00044370965998502554, 'samples': 17530880, 'steps': 34239, 'loss/train': 1.45180082321167} +03/05/2022 05:42:14 - INFO - codeparrot_training - Skipping example with length 650 (seq_length=1024) +03/05/2022 05:42:19 - INFO - codeparrot_training - Step 34240: {'lr': 0.0004437063052348457, 'samples': 17531392, 'steps': 34240, 'loss/train': 1.8537890911102295} +03/05/2022 05:42:22 - INFO - codeparrot_training - Step 34241: {'lr': 0.0004437029503973847, 'samples': 17531904, 'steps': 34241, 'loss/train': 1.139745831489563} +03/05/2022 05:42:22 - INFO - codeparrot_training - Skipping example with length 973 (seq_length=1024) +03/05/2022 05:42:28 - INFO - codeparrot_training - Step 34242: {'lr': 0.00044369959547264416, 'samples': 17532416, 'steps': 34242, 'loss/train': 1.970870018005371} +03/05/2022 05:42:31 - INFO - codeparrot_training - Step 34243: {'lr': 0.0004436962404606255, 'samples': 17532928, 'steps': 34243, 'loss/train': 1.0133898258209229} +03/05/2022 05:42:31 - INFO - codeparrot_training - Skipping example with length 932 (seq_length=1024) +03/05/2022 05:42:36 - INFO - codeparrot_training - Step 34244: {'lr': 0.0004436928853613304, 'samples': 17533440, 'steps': 34244, 'loss/train': 1.857613205909729} +03/05/2022 05:42:39 - INFO - codeparrot_training - Step 34245: {'lr': 0.0004436895301747602, 'samples': 17533952, 'steps': 34245, 'loss/train': 1.3862278461456299} +03/05/2022 05:42:40 - INFO - codeparrot_training - Skipping example with length 109 (seq_length=1024) +03/05/2022 05:42:45 - INFO - codeparrot_training - Step 34246: {'lr': 0.00044368617490091655, 'samples': 17534464, 'steps': 34246, 'loss/train': 0.9862126708030701} +03/05/2022 05:42:48 - INFO - codeparrot_training - Step 34247: {'lr': 0.0004436828195398009, 'samples': 17534976, 'steps': 34247, 'loss/train': 1.0331921577453613} +03/05/2022 05:42:49 - INFO - codeparrot_training - Skipping example with length 252 (seq_length=1024) +03/05/2022 05:42:53 - INFO - codeparrot_training - Step 34248: {'lr': 0.0004436794640914148, 'samples': 17535488, 'steps': 34248, 'loss/train': 1.9212638139724731} +03/05/2022 05:42:56 - INFO - codeparrot_training - Step 34249: {'lr': 0.00044367610855575965, 'samples': 17536000, 'steps': 34249, 'loss/train': 2.0165295600891113} +03/05/2022 05:42:57 - INFO - codeparrot_training - Skipping example with length 331 (seq_length=1024) +03/05/2022 05:43:01 - INFO - codeparrot_training - Step 34250: {'lr': 0.00044367275293283705, 'samples': 17536512, 'steps': 34250, 'loss/train': 1.4806463718414307} +03/05/2022 05:43:05 - INFO - codeparrot_training - Step 34251: {'lr': 0.00044366939722264843, 'samples': 17537024, 'steps': 34251, 'loss/train': 1.6289920806884766} +03/05/2022 05:43:05 - INFO - codeparrot_training - Skipping example with length 192 (seq_length=1024) +03/05/2022 05:43:10 - INFO - codeparrot_training - Step 34252: {'lr': 0.00044366604142519547, 'samples': 17537536, 'steps': 34252, 'loss/train': 2.0826120376586914} +03/05/2022 05:43:13 - INFO - codeparrot_training - Step 34253: {'lr': 0.0004436626855404796, 'samples': 17538048, 'steps': 34253, 'loss/train': 2.0340754985809326} +03/05/2022 05:43:14 - INFO - codeparrot_training - Skipping example with length 657 (seq_length=1024) +03/05/2022 05:43:18 - INFO - codeparrot_training - Step 34254: {'lr': 0.0004436593295685022, 'samples': 17538560, 'steps': 34254, 'loss/train': 1.880374550819397} +03/05/2022 05:43:22 - INFO - codeparrot_training - Step 34255: {'lr': 0.00044365597350926495, 'samples': 17539072, 'steps': 34255, 'loss/train': 1.6729193925857544} +03/05/2022 05:43:22 - INFO - codeparrot_training - Skipping example with length 527 (seq_length=1024) +03/05/2022 05:43:27 - INFO - codeparrot_training - Step 34256: {'lr': 0.0004436526173627693, 'samples': 17539584, 'steps': 34256, 'loss/train': 1.50307297706604} +03/05/2022 05:43:30 - INFO - codeparrot_training - Step 34257: {'lr': 0.00044364926112901675, 'samples': 17540096, 'steps': 34257, 'loss/train': 1.5444446802139282} +03/05/2022 05:43:30 - INFO - codeparrot_training - Skipping example with length 893 (seq_length=1024) +03/05/2022 05:43:35 - INFO - codeparrot_training - Step 34258: {'lr': 0.0004436459048080089, 'samples': 17540608, 'steps': 34258, 'loss/train': 1.6453111171722412} +03/05/2022 05:43:38 - INFO - codeparrot_training - Step 34259: {'lr': 0.00044364254839974717, 'samples': 17541120, 'steps': 34259, 'loss/train': 1.885575771331787} +03/05/2022 05:43:39 - INFO - codeparrot_training - Skipping example with length 249 (seq_length=1024) +03/05/2022 05:43:44 - INFO - codeparrot_training - Step 34260: {'lr': 0.0004436391919042331, 'samples': 17541632, 'steps': 34260, 'loss/train': 2.1808481216430664} +03/05/2022 05:43:47 - INFO - codeparrot_training - Step 34261: {'lr': 0.00044363583532146814, 'samples': 17542144, 'steps': 34261, 'loss/train': 2.3671934604644775} +03/05/2022 05:43:47 - INFO - codeparrot_training - Skipping example with length 274 (seq_length=1024) +03/05/2022 05:43:52 - INFO - codeparrot_training - Step 34262: {'lr': 0.0004436324786514538, 'samples': 17542656, 'steps': 34262, 'loss/train': 2.110642194747925} +03/05/2022 05:43:55 - INFO - codeparrot_training - Step 34263: {'lr': 0.0004436291218941918, 'samples': 17543168, 'steps': 34263, 'loss/train': 1.900086760520935} +03/05/2022 05:43:55 - INFO - codeparrot_training - Skipping example with length 566 (seq_length=1024) +03/05/2022 05:44:01 - INFO - codeparrot_training - Step 34264: {'lr': 0.00044362576504968344, 'samples': 17543680, 'steps': 34264, 'loss/train': 2.3246779441833496} +03/05/2022 05:44:03 - INFO - codeparrot_training - Skipping example with length 197 (seq_length=1024) +03/05/2022 05:44:06 - INFO - codeparrot_training - Step 34265: {'lr': 0.0004436224081179303, 'samples': 17544192, 'steps': 34265, 'loss/train': 1.9526376724243164} +03/05/2022 05:44:09 - INFO - codeparrot_training - Step 34266: {'lr': 0.00044361905109893397, 'samples': 17544704, 'steps': 34266, 'loss/train': 1.129917025566101} +03/05/2022 05:44:12 - INFO - codeparrot_training - Step 34267: {'lr': 0.00044361569399269574, 'samples': 17545216, 'steps': 34267, 'loss/train': 0.5088042616844177} +03/05/2022 05:44:12 - INFO - codeparrot_training - Skipping example with length 470 (seq_length=1024) +03/05/2022 05:44:17 - INFO - codeparrot_training - Step 34268: {'lr': 0.0004436123367992174, 'samples': 17545728, 'steps': 34268, 'loss/train': 1.6535800695419312} +03/05/2022 05:44:21 - INFO - codeparrot_training - Step 34269: {'lr': 0.0004436089795185003, 'samples': 17546240, 'steps': 34269, 'loss/train': 1.4636188745498657} +03/05/2022 05:44:21 - INFO - codeparrot_training - Skipping example with length 732 (seq_length=1024) +03/05/2022 05:44:26 - INFO - codeparrot_training - Step 34270: {'lr': 0.0004436056221505459, 'samples': 17546752, 'steps': 34270, 'loss/train': 2.0245325565338135} +03/05/2022 05:44:29 - INFO - codeparrot_training - Step 34271: {'lr': 0.00044360226469535583, 'samples': 17547264, 'steps': 34271, 'loss/train': 2.298933744430542} +03/05/2022 05:44:29 - INFO - codeparrot_training - Skipping example with length 326 (seq_length=1024) +03/05/2022 05:44:34 - INFO - codeparrot_training - Step 34272: {'lr': 0.0004435989071529316, 'samples': 17547776, 'steps': 34272, 'loss/train': 1.7053426504135132} +03/05/2022 05:44:37 - INFO - codeparrot_training - Step 34273: {'lr': 0.0004435955495232746, 'samples': 17548288, 'steps': 34273, 'loss/train': 1.9695854187011719} +03/05/2022 05:44:38 - INFO - codeparrot_training - Skipping example with length 96 (seq_length=1024) +03/05/2022 05:44:43 - INFO - codeparrot_training - Step 34274: {'lr': 0.00044359219180638656, 'samples': 17548800, 'steps': 34274, 'loss/train': 1.5016789436340332} +03/05/2022 05:44:46 - INFO - codeparrot_training - Step 34275: {'lr': 0.0004435888340022688, 'samples': 17549312, 'steps': 34275, 'loss/train': 1.553998589515686} +03/05/2022 05:44:46 - INFO - codeparrot_training - Skipping example with length 358 (seq_length=1024) +03/05/2022 05:44:51 - INFO - codeparrot_training - Step 34276: {'lr': 0.0004435854761109229, 'samples': 17549824, 'steps': 34276, 'loss/train': 2.1069953441619873} +03/05/2022 05:44:54 - INFO - codeparrot_training - Step 34277: {'lr': 0.00044358211813235046, 'samples': 17550336, 'steps': 34277, 'loss/train': 1.1969993114471436} +03/05/2022 05:44:54 - INFO - codeparrot_training - Skipping example with length 129 (seq_length=1024) +03/05/2022 05:45:00 - INFO - codeparrot_training - Step 34278: {'lr': 0.0004435787600665528, 'samples': 17550848, 'steps': 34278, 'loss/train': 1.773040771484375} +03/05/2022 05:45:03 - INFO - codeparrot_training - Step 34279: {'lr': 0.0004435754019135315, 'samples': 17551360, 'steps': 34279, 'loss/train': 2.3009142875671387} +03/05/2022 05:45:03 - INFO - codeparrot_training - Skipping example with length 954 (seq_length=1024) +03/05/2022 05:45:08 - INFO - codeparrot_training - Step 34280: {'lr': 0.0004435720436732882, 'samples': 17551872, 'steps': 34280, 'loss/train': 1.7082451581954956} +03/05/2022 05:45:11 - INFO - codeparrot_training - Step 34281: {'lr': 0.0004435686853458243, 'samples': 17552384, 'steps': 34281, 'loss/train': 1.6464056968688965} +03/05/2022 05:45:12 - INFO - codeparrot_training - Skipping example with length 744 (seq_length=1024) +03/05/2022 05:45:17 - INFO - codeparrot_training - Step 34282: {'lr': 0.0004435653269311414, 'samples': 17552896, 'steps': 34282, 'loss/train': 2.080547332763672} +03/05/2022 05:45:20 - INFO - codeparrot_training - Step 34283: {'lr': 0.00044356196842924086, 'samples': 17553408, 'steps': 34283, 'loss/train': 1.6106858253479004} +03/05/2022 05:45:20 - INFO - codeparrot_training - Skipping example with length 183 (seq_length=1024) +03/05/2022 05:45:25 - INFO - codeparrot_training - Step 34284: {'lr': 0.0004435586098401243, 'samples': 17553920, 'steps': 34284, 'loss/train': 1.7904860973358154} +03/05/2022 05:45:28 - INFO - codeparrot_training - Step 34285: {'lr': 0.00044355525116379326, 'samples': 17554432, 'steps': 34285, 'loss/train': 1.9045751094818115} +03/05/2022 05:45:28 - INFO - codeparrot_training - Skipping example with length 379 (seq_length=1024) +03/05/2022 05:45:33 - INFO - codeparrot_training - Step 34286: {'lr': 0.00044355189240024917, 'samples': 17554944, 'steps': 34286, 'loss/train': 0.3161822557449341} +03/05/2022 05:45:37 - INFO - codeparrot_training - Step 34287: {'lr': 0.00044354853354949353, 'samples': 17555456, 'steps': 34287, 'loss/train': 0.8550520539283752} +03/05/2022 05:45:37 - INFO - codeparrot_training - Skipping example with length 614 (seq_length=1024) +03/05/2022 05:45:42 - INFO - codeparrot_training - Step 34288: {'lr': 0.000443545174611528, 'samples': 17555968, 'steps': 34288, 'loss/train': 1.2666447162628174} +03/05/2022 05:45:45 - INFO - codeparrot_training - Step 34289: {'lr': 0.000443541815586354, 'samples': 17556480, 'steps': 34289, 'loss/train': 1.4957973957061768} +03/05/2022 05:45:45 - INFO - codeparrot_training - Skipping example with length 632 (seq_length=1024) +03/05/2022 05:45:51 - INFO - codeparrot_training - Step 34290: {'lr': 0.0004435384564739729, 'samples': 17556992, 'steps': 34290, 'loss/train': 1.529710054397583} +03/05/2022 05:45:54 - INFO - codeparrot_training - Step 34291: {'lr': 0.00044353509727438657, 'samples': 17557504, 'steps': 34291, 'loss/train': 1.7087292671203613} +03/05/2022 05:45:54 - INFO - codeparrot_training - Skipping example with length 527 (seq_length=1024) +03/05/2022 05:45:59 - INFO - codeparrot_training - Step 34292: {'lr': 0.00044353173798759616, 'samples': 17558016, 'steps': 34292, 'loss/train': 1.639023780822754} +03/05/2022 05:46:02 - INFO - codeparrot_training - Skipping example with length 16 (seq_length=1024) +03/05/2022 05:46:04 - INFO - codeparrot_training - Step 34293: {'lr': 0.0004435283786136034, 'samples': 17558528, 'steps': 34293, 'loss/train': 1.2677940130233765} +03/05/2022 05:46:08 - INFO - codeparrot_training - Step 34294: {'lr': 0.0004435250191524097, 'samples': 17559040, 'steps': 34294, 'loss/train': 1.6011766195297241} +03/05/2022 05:46:11 - INFO - codeparrot_training - Step 34295: {'lr': 0.0004435216596040167, 'samples': 17559552, 'steps': 34295, 'loss/train': 1.6702256202697754} +03/05/2022 05:46:11 - INFO - codeparrot_training - Skipping example with length 72 (seq_length=1024) +03/05/2022 05:46:16 - INFO - codeparrot_training - Step 34296: {'lr': 0.00044351829996842575, 'samples': 17560064, 'steps': 34296, 'loss/train': 0.8600285053253174} +03/05/2022 05:46:19 - INFO - codeparrot_training - Step 34297: {'lr': 0.00044351494024563845, 'samples': 17560576, 'steps': 34297, 'loss/train': 1.9177359342575073} +03/05/2022 05:46:19 - INFO - codeparrot_training - Skipping example with length 66 (seq_length=1024) +03/05/2022 05:46:24 - INFO - codeparrot_training - Step 34298: {'lr': 0.0004435115804356563, 'samples': 17561088, 'steps': 34298, 'loss/train': 0.8987356424331665} +03/05/2022 05:46:28 - INFO - codeparrot_training - Step 34299: {'lr': 0.0004435082205384808, 'samples': 17561600, 'steps': 34299, 'loss/train': 1.7946609258651733} +03/05/2022 05:46:28 - INFO - codeparrot_training - Skipping example with length 88 (seq_length=1024) +03/05/2022 05:46:33 - INFO - codeparrot_training - Step 34300: {'lr': 0.00044350486055411354, 'samples': 17562112, 'steps': 34300, 'loss/train': 1.2640492916107178} +03/05/2022 05:46:36 - INFO - codeparrot_training - Step 34301: {'lr': 0.000443501500482556, 'samples': 17562624, 'steps': 34301, 'loss/train': 3.3504762649536133} +03/05/2022 05:46:37 - INFO - codeparrot_training - Skipping example with length 892 (seq_length=1024) +03/05/2022 05:46:41 - INFO - codeparrot_training - Step 34302: {'lr': 0.0004434981403238096, 'samples': 17563136, 'steps': 34302, 'loss/train': 1.7024686336517334} +03/05/2022 05:46:45 - INFO - codeparrot_training - Step 34303: {'lr': 0.0004434947800778759, 'samples': 17563648, 'steps': 34303, 'loss/train': 1.0958644151687622} +03/05/2022 05:46:45 - INFO - codeparrot_training - Skipping example with length 998 (seq_length=1024) +03/05/2022 05:46:50 - INFO - codeparrot_training - Step 34304: {'lr': 0.0004434914197447565, 'samples': 17564160, 'steps': 34304, 'loss/train': 1.7085331678390503} +03/05/2022 05:46:53 - INFO - codeparrot_training - Step 34305: {'lr': 0.0004434880593244528, 'samples': 17564672, 'steps': 34305, 'loss/train': 0.06464465707540512} +03/05/2022 05:46:53 - INFO - codeparrot_training - Skipping example with length 533 (seq_length=1024) +03/05/2022 05:46:58 - INFO - codeparrot_training - Step 34306: {'lr': 0.0004434846988169664, 'samples': 17565184, 'steps': 34306, 'loss/train': 1.4451203346252441} +03/05/2022 05:47:02 - INFO - codeparrot_training - Step 34307: {'lr': 0.0004434813382222989, 'samples': 17565696, 'steps': 34307, 'loss/train': 1.5405151844024658} +03/05/2022 05:47:02 - INFO - codeparrot_training - Skipping example with length 470 (seq_length=1024) +03/05/2022 05:47:07 - INFO - codeparrot_training - Step 34308: {'lr': 0.0004434779775404515, 'samples': 17566208, 'steps': 34308, 'loss/train': 1.9971555471420288} +03/05/2022 05:47:10 - INFO - codeparrot_training - Step 34309: {'lr': 0.000443474616771426, 'samples': 17566720, 'steps': 34309, 'loss/train': 2.0689680576324463} +03/05/2022 05:47:10 - INFO - codeparrot_training - Skipping example with length 247 (seq_length=1024) +03/05/2022 05:47:16 - INFO - codeparrot_training - Step 34310: {'lr': 0.00044347125591522377, 'samples': 17567232, 'steps': 34310, 'loss/train': 1.8060925006866455} +03/05/2022 05:47:19 - INFO - codeparrot_training - Step 34311: {'lr': 0.00044346789497184643, 'samples': 17567744, 'steps': 34311, 'loss/train': 1.0623342990875244} +03/05/2022 05:47:20 - INFO - codeparrot_training - Skipping example with length 411 (seq_length=1024) +03/05/2022 05:47:24 - INFO - codeparrot_training - Step 34312: {'lr': 0.0004434645339412954, 'samples': 17568256, 'steps': 34312, 'loss/train': 1.2388983964920044} +03/05/2022 05:47:27 - INFO - codeparrot_training - Step 34313: {'lr': 0.0004434611728235722, 'samples': 17568768, 'steps': 34313, 'loss/train': 2.177865505218506} +03/05/2022 05:47:28 - INFO - codeparrot_training - Skipping example with length 810 (seq_length=1024) +03/05/2022 05:47:33 - INFO - codeparrot_training - Step 34314: {'lr': 0.0004434578116186785, 'samples': 17569280, 'steps': 34314, 'loss/train': 1.789249300956726} +03/05/2022 05:47:36 - INFO - codeparrot_training - Step 34315: {'lr': 0.00044345445032661565, 'samples': 17569792, 'steps': 34315, 'loss/train': 1.8509910106658936} +03/05/2022 05:47:37 - INFO - codeparrot_training - Skipping example with length 871 (seq_length=1024) +03/05/2022 05:47:41 - INFO - codeparrot_training - Step 34316: {'lr': 0.0004434510889473852, 'samples': 17570304, 'steps': 34316, 'loss/train': 2.1319479942321777} +03/05/2022 05:47:44 - INFO - codeparrot_training - Step 34317: {'lr': 0.00044344772748098867, 'samples': 17570816, 'steps': 34317, 'loss/train': 1.7488441467285156} +03/05/2022 05:47:45 - INFO - codeparrot_training - Skipping example with length 965 (seq_length=1024) +03/05/2022 05:47:50 - INFO - codeparrot_training - Step 34318: {'lr': 0.00044344436592742755, 'samples': 17571328, 'steps': 34318, 'loss/train': 2.176799774169922} +03/05/2022 05:47:53 - INFO - codeparrot_training - Step 34319: {'lr': 0.0004434410042867034, 'samples': 17571840, 'steps': 34319, 'loss/train': 0.9293532967567444} +03/05/2022 05:47:53 - INFO - codeparrot_training - Skipping example with length 565 (seq_length=1024) +03/05/2022 05:47:58 - INFO - codeparrot_training - Step 34320: {'lr': 0.0004434376425588178, 'samples': 17572352, 'steps': 34320, 'loss/train': 1.8992440700531006} +03/05/2022 05:48:01 - INFO - codeparrot_training - Step 34321: {'lr': 0.00044343428074377207, 'samples': 17572864, 'steps': 34321, 'loss/train': 0.9902983903884888} +03/05/2022 05:48:02 - INFO - codeparrot_training - Skipping example with length 855 (seq_length=1024) +03/05/2022 05:48:06 - INFO - codeparrot_training - Step 34322: {'lr': 0.0004434309188415679, 'samples': 17573376, 'steps': 34322, 'loss/train': 1.4456440210342407} +03/05/2022 05:48:10 - INFO - codeparrot_training - Step 34323: {'lr': 0.0004434275568522067, 'samples': 17573888, 'steps': 34323, 'loss/train': 1.9827333688735962} +03/05/2022 05:48:10 - INFO - codeparrot_training - Skipping example with length 931 (seq_length=1024) +03/05/2022 05:48:15 - INFO - codeparrot_training - Step 34324: {'lr': 0.0004434241947756901, 'samples': 17574400, 'steps': 34324, 'loss/train': 1.8385484218597412} +03/05/2022 05:48:18 - INFO - codeparrot_training - Step 34325: {'lr': 0.0004434208326120195, 'samples': 17574912, 'steps': 34325, 'loss/train': 2.059199333190918} +03/05/2022 05:48:19 - INFO - codeparrot_training - Skipping example with length 566 (seq_length=1024) +03/05/2022 05:48:23 - INFO - codeparrot_training - Step 34326: {'lr': 0.0004434174703611964, 'samples': 17575424, 'steps': 34326, 'loss/train': 1.24283766746521} +03/05/2022 05:48:27 - INFO - codeparrot_training - Step 34327: {'lr': 0.00044341410802322247, 'samples': 17575936, 'steps': 34327, 'loss/train': 1.4816592931747437} +03/05/2022 05:48:27 - INFO - codeparrot_training - Skipping example with length 828 (seq_length=1024) +03/05/2022 05:48:32 - INFO - codeparrot_training - Step 34328: {'lr': 0.00044341074559809903, 'samples': 17576448, 'steps': 34328, 'loss/train': 1.7746317386627197} +03/05/2022 05:48:35 - INFO - codeparrot_training - Step 34329: {'lr': 0.00044340738308582775, 'samples': 17576960, 'steps': 34329, 'loss/train': 2.00506591796875} +03/05/2022 05:48:36 - INFO - codeparrot_training - Skipping example with length 233 (seq_length=1024) +03/05/2022 05:48:40 - INFO - codeparrot_training - Step 34330: {'lr': 0.0004434040204864101, 'samples': 17577472, 'steps': 34330, 'loss/train': 1.7405996322631836} +03/05/2022 05:48:43 - INFO - codeparrot_training - Step 34331: {'lr': 0.00044340065779984757, 'samples': 17577984, 'steps': 34331, 'loss/train': 2.0547502040863037} +03/05/2022 05:48:44 - INFO - codeparrot_training - Skipping example with length 185 (seq_length=1024) +03/05/2022 05:48:49 - INFO - codeparrot_training - Step 34332: {'lr': 0.0004433972950261417, 'samples': 17578496, 'steps': 34332, 'loss/train': 1.6941430568695068} +03/05/2022 05:48:52 - INFO - codeparrot_training - Step 34333: {'lr': 0.00044339393216529394, 'samples': 17579008, 'steps': 34333, 'loss/train': 1.4666920900344849} +03/05/2022 05:48:52 - INFO - codeparrot_training - Skipping example with length 318 (seq_length=1024) +03/05/2022 05:48:57 - INFO - codeparrot_training - Step 34334: {'lr': 0.00044339056921730593, 'samples': 17579520, 'steps': 34334, 'loss/train': 0.9629276990890503} +03/05/2022 05:49:00 - INFO - codeparrot_training - Step 34335: {'lr': 0.000443387206182179, 'samples': 17580032, 'steps': 34335, 'loss/train': 1.7317924499511719} +03/05/2022 05:49:01 - INFO - codeparrot_training - Skipping example with length 69 (seq_length=1024) +03/05/2022 05:49:06 - INFO - codeparrot_training - Step 34336: {'lr': 0.0004433838430599149, 'samples': 17580544, 'steps': 34336, 'loss/train': 1.4611281156539917} +03/05/2022 05:49:09 - INFO - codeparrot_training - Step 34337: {'lr': 0.000443380479850515, 'samples': 17581056, 'steps': 34337, 'loss/train': 1.758908987045288} +03/05/2022 05:49:09 - INFO - codeparrot_training - Skipping example with length 586 (seq_length=1024) +03/05/2022 05:49:14 - INFO - codeparrot_training - Step 34338: {'lr': 0.00044337711655398083, 'samples': 17581568, 'steps': 34338, 'loss/train': 1.1988584995269775} +03/05/2022 05:49:17 - INFO - codeparrot_training - Step 34339: {'lr': 0.00044337375317031393, 'samples': 17582080, 'steps': 34339, 'loss/train': 1.847428798675537} +03/05/2022 05:49:17 - INFO - codeparrot_training - Skipping example with length 814 (seq_length=1024) +03/05/2022 05:49:22 - INFO - codeparrot_training - Step 34340: {'lr': 0.0004433703896995157, 'samples': 17582592, 'steps': 34340, 'loss/train': 1.344567894935608} +03/05/2022 05:49:25 - INFO - codeparrot_training - Step 34341: {'lr': 0.0004433670261415879, 'samples': 17583104, 'steps': 34341, 'loss/train': 1.682849645614624} +03/05/2022 05:49:26 - INFO - codeparrot_training - Skipping example with length 879 (seq_length=1024) +03/05/2022 05:49:31 - INFO - codeparrot_training - Step 34342: {'lr': 0.0004433636624965318, 'samples': 17583616, 'steps': 34342, 'loss/train': 2.6633098125457764} +03/05/2022 05:49:34 - INFO - codeparrot_training - Step 34343: {'lr': 0.0004433602987643491, 'samples': 17584128, 'steps': 34343, 'loss/train': 0.10058866441249847} +03/05/2022 05:49:35 - INFO - codeparrot_training - Skipping example with length 1003 (seq_length=1024) +03/05/2022 05:49:39 - INFO - codeparrot_training - Step 34344: {'lr': 0.00044335693494504115, 'samples': 17584640, 'steps': 34344, 'loss/train': 1.789832592010498} +03/05/2022 05:49:43 - INFO - codeparrot_training - Step 34345: {'lr': 0.00044335357103860964, 'samples': 17585152, 'steps': 34345, 'loss/train': 2.1360182762145996} +03/05/2022 05:49:44 - INFO - codeparrot_training - Skipping example with length 871 (seq_length=1024) +03/05/2022 05:49:48 - INFO - codeparrot_training - Step 34346: {'lr': 0.0004433502070450559, 'samples': 17585664, 'steps': 34346, 'loss/train': 2.0114269256591797} +03/05/2022 05:49:51 - INFO - codeparrot_training - Step 34347: {'lr': 0.0004433468429643816, 'samples': 17586176, 'steps': 34347, 'loss/train': 1.6056681871414185} +03/05/2022 05:49:52 - INFO - codeparrot_training - Skipping example with length 479 (seq_length=1024) +03/05/2022 05:49:56 - INFO - codeparrot_training - Step 34348: {'lr': 0.00044334347879658817, 'samples': 17586688, 'steps': 34348, 'loss/train': 1.8490829467773438} +03/05/2022 05:50:00 - INFO - codeparrot_training - Step 34349: {'lr': 0.0004433401145416771, 'samples': 17587200, 'steps': 34349, 'loss/train': 1.1431628465652466} +03/05/2022 05:50:01 - INFO - codeparrot_training - Skipping example with length 28 (seq_length=1024) +03/05/2022 05:50:05 - INFO - codeparrot_training - Step 34350: {'lr': 0.00044333675019965, 'samples': 17587712, 'steps': 34350, 'loss/train': 1.0035871267318726} +03/05/2022 05:50:08 - INFO - codeparrot_training - Step 34351: {'lr': 0.00044333338577050844, 'samples': 17588224, 'steps': 34351, 'loss/train': 3.328921318054199} +03/05/2022 05:50:10 - INFO - codeparrot_training - Skipping example with length 168 (seq_length=1024) +03/05/2022 05:50:14 - INFO - codeparrot_training - Step 34352: {'lr': 0.0004433300212542537, 'samples': 17588736, 'steps': 34352, 'loss/train': 0.7708403468132019} +03/05/2022 05:50:17 - INFO - codeparrot_training - Step 34353: {'lr': 0.00044332665665088755, 'samples': 17589248, 'steps': 34353, 'loss/train': 1.471516728401184} +03/05/2022 05:50:19 - INFO - codeparrot_training - Skipping example with length 527 (seq_length=1024) +03/05/2022 05:50:22 - INFO - codeparrot_training - Step 34354: {'lr': 0.00044332329196041133, 'samples': 17589760, 'steps': 34354, 'loss/train': 0.1122208759188652} +03/05/2022 05:50:25 - INFO - codeparrot_training - Step 34355: {'lr': 0.0004433199271828267, 'samples': 17590272, 'steps': 34355, 'loss/train': 1.0844810009002686} +03/05/2022 05:50:27 - INFO - codeparrot_training - Skipping example with length 459 (seq_length=1024) +03/05/2022 05:50:31 - INFO - codeparrot_training - Step 34356: {'lr': 0.0004433165623181349, 'samples': 17590784, 'steps': 34356, 'loss/train': 1.5952184200286865} +03/05/2022 05:50:34 - INFO - codeparrot_training - Step 34357: {'lr': 0.0004433131973663378, 'samples': 17591296, 'steps': 34357, 'loss/train': 1.9786046743392944} +03/05/2022 05:50:35 - INFO - codeparrot_training - Skipping example with length 371 (seq_length=1024) +03/05/2022 05:50:39 - INFO - codeparrot_training - Step 34358: {'lr': 0.0004433098323274367, 'samples': 17591808, 'steps': 34358, 'loss/train': 0.9796678423881531} +03/05/2022 05:50:42 - INFO - codeparrot_training - Step 34359: {'lr': 0.00044330646720143317, 'samples': 17592320, 'steps': 34359, 'loss/train': 1.2841209173202515} +03/05/2022 05:50:44 - INFO - codeparrot_training - Skipping example with length 934 (seq_length=1024) +03/05/2022 05:50:47 - INFO - codeparrot_training - Step 34360: {'lr': 0.0004433031019883288, 'samples': 17592832, 'steps': 34360, 'loss/train': 2.4441580772399902} +03/05/2022 05:50:51 - INFO - codeparrot_training - Step 34361: {'lr': 0.00044329973668812497, 'samples': 17593344, 'steps': 34361, 'loss/train': 2.3340935707092285} +03/05/2022 05:50:52 - INFO - codeparrot_training - Skipping example with length 1018 (seq_length=1024) +03/05/2022 05:50:56 - INFO - codeparrot_training - Step 34362: {'lr': 0.00044329637130082324, 'samples': 17593856, 'steps': 34362, 'loss/train': 1.3810921907424927} +03/05/2022 05:50:59 - INFO - codeparrot_training - Step 34363: {'lr': 0.00044329300582642516, 'samples': 17594368, 'steps': 34363, 'loss/train': 1.4531831741333008} +03/05/2022 05:51:00 - INFO - codeparrot_training - Skipping example with length 346 (seq_length=1024) +03/05/2022 05:51:04 - INFO - codeparrot_training - Step 34364: {'lr': 0.0004432896402649323, 'samples': 17594880, 'steps': 34364, 'loss/train': 1.7095104455947876} +03/05/2022 05:51:07 - INFO - codeparrot_training - Step 34365: {'lr': 0.0004432862746163461, 'samples': 17595392, 'steps': 34365, 'loss/train': 1.4555608034133911} +03/05/2022 05:51:09 - INFO - codeparrot_training - Skipping example with length 80 (seq_length=1024) +03/05/2022 05:51:13 - INFO - codeparrot_training - Step 34366: {'lr': 0.000443282908880668, 'samples': 17595904, 'steps': 34366, 'loss/train': 1.9329689741134644} +03/05/2022 05:51:16 - INFO - codeparrot_training - Step 34367: {'lr': 0.00044327954305789963, 'samples': 17596416, 'steps': 34367, 'loss/train': 1.521092414855957} +03/05/2022 05:51:17 - INFO - codeparrot_training - Skipping example with length 5 (seq_length=1024) +03/05/2022 05:51:21 - INFO - codeparrot_training - Step 34368: {'lr': 0.0004432761771480426, 'samples': 17596928, 'steps': 34368, 'loss/train': 0.47753584384918213} +03/05/2022 05:51:24 - INFO - codeparrot_training - Step 34369: {'lr': 0.0004432728111510982, 'samples': 17597440, 'steps': 34369, 'loss/train': 1.56006920337677} +03/05/2022 05:51:25 - INFO - codeparrot_training - Skipping example with length 812 (seq_length=1024) +03/05/2022 05:51:29 - INFO - codeparrot_training - Step 34370: {'lr': 0.000443269445067068, 'samples': 17597952, 'steps': 34370, 'loss/train': 1.8805415630340576} +03/05/2022 05:51:33 - INFO - codeparrot_training - Step 34371: {'lr': 0.0004432660788959537, 'samples': 17598464, 'steps': 34371, 'loss/train': 2.6906087398529053} +03/05/2022 05:51:34 - INFO - codeparrot_training - Skipping example with length 580 (seq_length=1024) +03/05/2022 05:51:38 - INFO - codeparrot_training - Step 34372: {'lr': 0.00044326271263775657, 'samples': 17598976, 'steps': 34372, 'loss/train': 1.870263695716858} +03/05/2022 05:51:41 - INFO - codeparrot_training - Step 34373: {'lr': 0.0004432593462924783, 'samples': 17599488, 'steps': 34373, 'loss/train': 2.1580281257629395} +03/05/2022 05:51:42 - INFO - codeparrot_training - Skipping example with length 1016 (seq_length=1024) +03/05/2022 05:51:46 - INFO - codeparrot_training - Step 34374: {'lr': 0.0004432559798601203, 'samples': 17600000, 'steps': 34374, 'loss/train': 1.7139902114868164} +03/05/2022 05:51:49 - INFO - codeparrot_training - Step 34375: {'lr': 0.0004432526133406842, 'samples': 17600512, 'steps': 34375, 'loss/train': 1.9820737838745117} +03/05/2022 05:51:50 - INFO - codeparrot_training - Skipping example with length 997 (seq_length=1024) +03/05/2022 05:51:55 - INFO - codeparrot_training - Step 34376: {'lr': 0.0004432492467341715, 'samples': 17601024, 'steps': 34376, 'loss/train': 1.0611504316329956} +03/05/2022 05:51:58 - INFO - codeparrot_training - Step 34377: {'lr': 0.00044324588004058364, 'samples': 17601536, 'steps': 34377, 'loss/train': 0.07836358994245529} +03/05/2022 05:51:59 - INFO - codeparrot_training - Skipping example with length 906 (seq_length=1024) +03/05/2022 05:52:03 - INFO - codeparrot_training - Step 34378: {'lr': 0.00044324251325992214, 'samples': 17602048, 'steps': 34378, 'loss/train': 1.802234172821045} +03/05/2022 05:52:06 - INFO - codeparrot_training - Step 34379: {'lr': 0.0004432391463921885, 'samples': 17602560, 'steps': 34379, 'loss/train': 0.8240492939949036} +03/05/2022 05:52:07 - INFO - codeparrot_training - Skipping example with length 72 (seq_length=1024) +03/05/2022 05:52:12 - INFO - codeparrot_training - Step 34380: {'lr': 0.00044323577943738437, 'samples': 17603072, 'steps': 34380, 'loss/train': 2.1280899047851562} +03/05/2022 05:52:15 - INFO - codeparrot_training - Step 34381: {'lr': 0.00044323241239551113, 'samples': 17603584, 'steps': 34381, 'loss/train': 1.7750048637390137} +03/05/2022 05:52:16 - INFO - codeparrot_training - Skipping example with length 366 (seq_length=1024) +03/05/2022 05:52:20 - INFO - codeparrot_training - Step 34382: {'lr': 0.0004432290452665704, 'samples': 17604096, 'steps': 34382, 'loss/train': 1.799130916595459} +03/05/2022 05:52:23 - INFO - codeparrot_training - Step 34383: {'lr': 0.00044322567805056356, 'samples': 17604608, 'steps': 34383, 'loss/train': 1.7529054880142212} +03/05/2022 05:52:24 - INFO - codeparrot_training - Skipping example with length 440 (seq_length=1024) +03/05/2022 05:52:29 - INFO - codeparrot_training - Step 34384: {'lr': 0.00044322231074749225, 'samples': 17605120, 'steps': 34384, 'loss/train': 1.4071407318115234} +03/05/2022 05:52:32 - INFO - codeparrot_training - Step 34385: {'lr': 0.0004432189433573579, 'samples': 17605632, 'steps': 34385, 'loss/train': 0.5387511849403381} +03/05/2022 05:52:33 - INFO - codeparrot_training - Skipping example with length 841 (seq_length=1024) +03/05/2022 05:52:37 - INFO - codeparrot_training - Step 34386: {'lr': 0.00044321557588016214, 'samples': 17606144, 'steps': 34386, 'loss/train': 1.0450592041015625} +03/05/2022 05:52:40 - INFO - codeparrot_training - Step 34387: {'lr': 0.0004432122083159065, 'samples': 17606656, 'steps': 34387, 'loss/train': 1.3318291902542114} +03/05/2022 05:52:41 - INFO - codeparrot_training - Skipping example with length 795 (seq_length=1024) +03/05/2022 05:52:45 - INFO - codeparrot_training - Step 34388: {'lr': 0.0004432088406645922, 'samples': 17607168, 'steps': 34388, 'loss/train': 1.5386408567428589} +03/05/2022 05:52:48 - INFO - codeparrot_training - Step 34389: {'lr': 0.00044320547292622114, 'samples': 17607680, 'steps': 34389, 'loss/train': 1.052255630493164} +03/05/2022 05:52:49 - INFO - codeparrot_training - Skipping example with length 903 (seq_length=1024) +03/05/2022 05:52:54 - INFO - codeparrot_training - Step 34390: {'lr': 0.0004432021051007946, 'samples': 17608192, 'steps': 34390, 'loss/train': 2.951464891433716} +03/05/2022 05:52:57 - INFO - codeparrot_training - Step 34391: {'lr': 0.00044319873718831425, 'samples': 17608704, 'steps': 34391, 'loss/train': 2.170942544937134} +03/05/2022 05:52:58 - INFO - codeparrot_training - Skipping example with length 89 (seq_length=1024) +03/05/2022 05:53:02 - INFO - codeparrot_training - Step 34392: {'lr': 0.00044319536918878156, 'samples': 17609216, 'steps': 34392, 'loss/train': 2.1667444705963135} +03/05/2022 05:53:05 - INFO - codeparrot_training - Step 34393: {'lr': 0.00044319200110219794, 'samples': 17609728, 'steps': 34393, 'loss/train': 1.8097416162490845} +03/05/2022 05:53:07 - INFO - codeparrot_training - Skipping example with length 497 (seq_length=1024) +03/05/2022 05:53:11 - INFO - codeparrot_training - Step 34394: {'lr': 0.000443188632928565, 'samples': 17610240, 'steps': 34394, 'loss/train': 1.1077992916107178} +03/05/2022 05:53:14 - INFO - codeparrot_training - Step 34395: {'lr': 0.0004431852646678842, 'samples': 17610752, 'steps': 34395, 'loss/train': 2.0320076942443848} +03/05/2022 05:53:15 - INFO - codeparrot_training - Skipping example with length 867 (seq_length=1024) +03/05/2022 05:53:19 - INFO - codeparrot_training - Step 34396: {'lr': 0.00044318189632015716, 'samples': 17611264, 'steps': 34396, 'loss/train': 1.2975411415100098} +03/05/2022 05:53:22 - INFO - codeparrot_training - Step 34397: {'lr': 0.0004431785278853853, 'samples': 17611776, 'steps': 34397, 'loss/train': 2.9047763347625732} +03/05/2022 05:53:23 - INFO - codeparrot_training - Skipping example with length 451 (seq_length=1024) +03/05/2022 05:53:27 - INFO - codeparrot_training - Step 34398: {'lr': 0.0004431751593635702, 'samples': 17612288, 'steps': 34398, 'loss/train': 1.077797770500183} +03/05/2022 05:53:31 - INFO - codeparrot_training - Step 34399: {'lr': 0.00044317179075471335, 'samples': 17612800, 'steps': 34399, 'loss/train': 0.564679741859436} +03/05/2022 05:53:31 - INFO - codeparrot_training - Skipping example with length 219 (seq_length=1024) +03/05/2022 05:53:36 - INFO - codeparrot_training - Step 34400: {'lr': 0.00044316842205881625, 'samples': 17613312, 'steps': 34400, 'loss/train': 1.935970425605774} +03/05/2022 05:53:39 - INFO - codeparrot_training - Step 34401: {'lr': 0.00044316505327588054, 'samples': 17613824, 'steps': 34401, 'loss/train': 2.5713207721710205} +03/05/2022 05:53:39 - INFO - codeparrot_training - Skipping example with length 931 (seq_length=1024) +03/05/2022 05:53:44 - INFO - codeparrot_training - Step 34402: {'lr': 0.00044316168440590757, 'samples': 17614336, 'steps': 34402, 'loss/train': 1.9616584777832031} +03/05/2022 05:53:47 - INFO - codeparrot_training - Step 34403: {'lr': 0.00044315831544889886, 'samples': 17614848, 'steps': 34403, 'loss/train': 0.3963319957256317} +03/05/2022 05:53:48 - INFO - codeparrot_training - Skipping example with length 184 (seq_length=1024) +03/05/2022 05:53:53 - INFO - codeparrot_training - Step 34404: {'lr': 0.0004431549464048561, 'samples': 17615360, 'steps': 34404, 'loss/train': 2.0712599754333496} +03/05/2022 05:53:56 - INFO - codeparrot_training - Step 34405: {'lr': 0.0004431515772737806, 'samples': 17615872, 'steps': 34405, 'loss/train': 1.9355063438415527} +03/05/2022 05:53:57 - INFO - codeparrot_training - Skipping example with length 139 (seq_length=1024) +03/05/2022 05:54:01 - INFO - codeparrot_training - Step 34406: {'lr': 0.000443148208055674, 'samples': 17616384, 'steps': 34406, 'loss/train': 1.78676438331604} +03/05/2022 05:54:04 - INFO - codeparrot_training - Step 34407: {'lr': 0.0004431448387505379, 'samples': 17616896, 'steps': 34407, 'loss/train': 1.5852714776992798} +03/05/2022 05:54:05 - INFO - codeparrot_training - Skipping example with length 652 (seq_length=1024) +03/05/2022 05:54:10 - INFO - codeparrot_training - Step 34408: {'lr': 0.00044314146935837365, 'samples': 17617408, 'steps': 34408, 'loss/train': 2.192098617553711} +03/05/2022 05:54:13 - INFO - codeparrot_training - Step 34409: {'lr': 0.0004431380998791828, 'samples': 17617920, 'steps': 34409, 'loss/train': 1.824895977973938} +03/05/2022 05:54:14 - INFO - codeparrot_training - Skipping example with length 329 (seq_length=1024) +03/05/2022 05:54:18 - INFO - codeparrot_training - Step 34410: {'lr': 0.0004431347303129669, 'samples': 17618432, 'steps': 34410, 'loss/train': 1.9701175689697266} +03/05/2022 05:54:21 - INFO - codeparrot_training - Step 34411: {'lr': 0.00044313136065972754, 'samples': 17618944, 'steps': 34411, 'loss/train': 0.8751137852668762} +03/05/2022 05:54:22 - INFO - codeparrot_training - Skipping example with length 761 (seq_length=1024) +03/05/2022 05:54:27 - INFO - codeparrot_training - Step 34412: {'lr': 0.0004431279909194661, 'samples': 17619456, 'steps': 34412, 'loss/train': 1.698349118232727} +03/05/2022 05:54:30 - INFO - codeparrot_training - Step 34413: {'lr': 0.00044312462109218423, 'samples': 17619968, 'steps': 34413, 'loss/train': 1.0718051195144653} +03/05/2022 05:54:31 - INFO - codeparrot_training - Skipping example with length 234 (seq_length=1024) +03/05/2022 05:54:35 - INFO - codeparrot_training - Step 34414: {'lr': 0.0004431212511778834, 'samples': 17620480, 'steps': 34414, 'loss/train': 1.3571727275848389} +03/05/2022 05:54:38 - INFO - codeparrot_training - Step 34415: {'lr': 0.000443117881176565, 'samples': 17620992, 'steps': 34415, 'loss/train': 1.6778255701065063} +03/05/2022 05:54:39 - INFO - codeparrot_training - Skipping example with length 677 (seq_length=1024) +03/05/2022 05:54:43 - INFO - codeparrot_training - Step 34416: {'lr': 0.00044311451108823075, 'samples': 17621504, 'steps': 34416, 'loss/train': 0.9632115364074707} +03/05/2022 05:54:47 - INFO - codeparrot_training - Step 34417: {'lr': 0.00044311114091288205, 'samples': 17622016, 'steps': 34417, 'loss/train': 1.2326486110687256} +03/05/2022 05:54:47 - INFO - codeparrot_training - Skipping example with length 116 (seq_length=1024) +03/05/2022 05:54:52 - INFO - codeparrot_training - Step 34418: {'lr': 0.0004431077706505205, 'samples': 17622528, 'steps': 34418, 'loss/train': 1.995125412940979} +03/05/2022 05:54:55 - INFO - codeparrot_training - Step 34419: {'lr': 0.0004431044003011475, 'samples': 17623040, 'steps': 34419, 'loss/train': 1.4261152744293213} +03/05/2022 05:54:55 - INFO - codeparrot_training - Skipping example with length 191 (seq_length=1024) +03/05/2022 05:55:00 - INFO - codeparrot_training - Step 34420: {'lr': 0.00044310102986476463, 'samples': 17623552, 'steps': 34420, 'loss/train': 1.9545880556106567} +03/05/2022 05:55:03 - INFO - codeparrot_training - Step 34421: {'lr': 0.0004430976593413735, 'samples': 17624064, 'steps': 34421, 'loss/train': 1.7602641582489014} +03/05/2022 05:55:04 - INFO - codeparrot_training - Skipping example with length 418 (seq_length=1024) +03/05/2022 05:55:09 - INFO - codeparrot_training - Step 34422: {'lr': 0.0004430942887309755, 'samples': 17624576, 'steps': 34422, 'loss/train': 1.4113630056381226} +03/05/2022 05:55:12 - INFO - codeparrot_training - Step 34423: {'lr': 0.00044309091803357216, 'samples': 17625088, 'steps': 34423, 'loss/train': 1.584171175956726} +03/05/2022 05:55:12 - INFO - codeparrot_training - Skipping example with length 760 (seq_length=1024) +03/05/2022 05:55:17 - INFO - codeparrot_training - Step 34424: {'lr': 0.0004430875472491651, 'samples': 17625600, 'steps': 34424, 'loss/train': 1.815016746520996} +03/05/2022 05:55:20 - INFO - codeparrot_training - Step 34425: {'lr': 0.0004430841763777557, 'samples': 17626112, 'steps': 34425, 'loss/train': 2.3161253929138184} +03/05/2022 05:55:20 - INFO - codeparrot_training - Skipping example with length 938 (seq_length=1024) +03/05/2022 05:55:25 - INFO - codeparrot_training - Step 34426: {'lr': 0.0004430808054193456, 'samples': 17626624, 'steps': 34426, 'loss/train': 1.9756784439086914} +03/05/2022 05:55:28 - INFO - codeparrot_training - Skipping example with length 625 (seq_length=1024) +03/05/2022 05:55:31 - INFO - codeparrot_training - Step 34427: {'lr': 0.00044307743437393623, 'samples': 17627136, 'steps': 34427, 'loss/train': 1.6235538721084595} +03/05/2022 05:55:34 - INFO - codeparrot_training - Step 34428: {'lr': 0.0004430740632415292, 'samples': 17627648, 'steps': 34428, 'loss/train': 1.426363468170166} +03/05/2022 05:55:37 - INFO - codeparrot_training - Skipping example with length 710 (seq_length=1024) +03/05/2022 05:55:39 - INFO - codeparrot_training - Step 34429: {'lr': 0.0004430706920221259, 'samples': 17628160, 'steps': 34429, 'loss/train': 1.7427458763122559} +03/05/2022 05:55:42 - INFO - codeparrot_training - Step 34430: {'lr': 0.00044306732071572796, 'samples': 17628672, 'steps': 34430, 'loss/train': 2.6821250915527344} +03/05/2022 05:55:45 - INFO - codeparrot_training - Skipping example with length 174 (seq_length=1024) +03/05/2022 05:55:48 - INFO - codeparrot_training - Step 34431: {'lr': 0.00044306394932233694, 'samples': 17629184, 'steps': 34431, 'loss/train': 1.5240299701690674} +03/05/2022 05:55:51 - INFO - codeparrot_training - Step 34432: {'lr': 0.0004430605778419542, 'samples': 17629696, 'steps': 34432, 'loss/train': 1.8086680173873901} +03/05/2022 05:55:53 - INFO - codeparrot_training - Skipping example with length 993 (seq_length=1024) +03/05/2022 05:55:56 - INFO - codeparrot_training - Step 34433: {'lr': 0.00044305720627458136, 'samples': 17630208, 'steps': 34433, 'loss/train': 1.9986445903778076} +03/05/2022 05:55:59 - INFO - codeparrot_training - Step 34434: {'lr': 0.00044305383462022, 'samples': 17630720, 'steps': 34434, 'loss/train': 1.1556581258773804} +03/05/2022 05:56:02 - INFO - codeparrot_training - Skipping example with length 965 (seq_length=1024) +03/05/2022 05:56:04 - INFO - codeparrot_training - Step 34435: {'lr': 0.0004430504628788714, 'samples': 17631232, 'steps': 34435, 'loss/train': 1.813632845878601} +03/05/2022 05:56:08 - INFO - codeparrot_training - Step 34436: {'lr': 0.0004430470910505373, 'samples': 17631744, 'steps': 34436, 'loss/train': 1.6379098892211914} +03/05/2022 05:56:10 - INFO - codeparrot_training - Skipping example with length 96 (seq_length=1024) +03/05/2022 05:56:13 - INFO - codeparrot_training - Step 34437: {'lr': 0.00044304371913521926, 'samples': 17632256, 'steps': 34437, 'loss/train': 1.3613522052764893} +03/05/2022 05:56:16 - INFO - codeparrot_training - Step 34438: {'lr': 0.0004430403471329186, 'samples': 17632768, 'steps': 34438, 'loss/train': 1.427315592765808} +03/05/2022 05:56:19 - INFO - codeparrot_training - Skipping example with length 266 (seq_length=1024) +03/05/2022 05:56:21 - INFO - codeparrot_training - Step 34439: {'lr': 0.0004430369750436369, 'samples': 17633280, 'steps': 34439, 'loss/train': 1.2265994548797607} +03/05/2022 05:56:24 - INFO - codeparrot_training - Step 34440: {'lr': 0.0004430336028673758, 'samples': 17633792, 'steps': 34440, 'loss/train': 1.8094308376312256} +03/05/2022 05:56:27 - INFO - codeparrot_training - Skipping example with length 560 (seq_length=1024) +03/05/2022 05:56:30 - INFO - codeparrot_training - Step 34441: {'lr': 0.00044303023060413677, 'samples': 17634304, 'steps': 34441, 'loss/train': 1.7392663955688477} +03/05/2022 05:56:33 - INFO - codeparrot_training - Step 34442: {'lr': 0.0004430268582539212, 'samples': 17634816, 'steps': 34442, 'loss/train': 0.80379718542099} +03/05/2022 05:56:35 - INFO - codeparrot_training - Skipping example with length 740 (seq_length=1024) +03/05/2022 05:56:38 - INFO - codeparrot_training - Step 34443: {'lr': 0.0004430234858167308, 'samples': 17635328, 'steps': 34443, 'loss/train': 0.9262971878051758} +03/05/2022 05:56:41 - INFO - codeparrot_training - Step 34444: {'lr': 0.000443020113292567, 'samples': 17635840, 'steps': 34444, 'loss/train': 0.8795902132987976} +03/05/2022 05:56:44 - INFO - codeparrot_training - Skipping example with length 240 (seq_length=1024) +03/05/2022 05:56:47 - INFO - codeparrot_training - Step 34445: {'lr': 0.0004430167406814312, 'samples': 17636352, 'steps': 34445, 'loss/train': 1.2451926469802856} +03/05/2022 05:56:50 - INFO - codeparrot_training - Step 34446: {'lr': 0.0004430133679833251, 'samples': 17636864, 'steps': 34446, 'loss/train': 1.6805188655853271} +03/05/2022 05:56:52 - INFO - codeparrot_training - Skipping example with length 659 (seq_length=1024) +03/05/2022 05:56:55 - INFO - codeparrot_training - Step 34447: {'lr': 0.00044300999519825016, 'samples': 17637376, 'steps': 34447, 'loss/train': 1.478570580482483} +03/05/2022 05:56:58 - INFO - codeparrot_training - Step 34448: {'lr': 0.00044300662232620784, 'samples': 17637888, 'steps': 34448, 'loss/train': 2.1637840270996094} +03/05/2022 05:57:00 - INFO - codeparrot_training - Skipping example with length 505 (seq_length=1024) +03/05/2022 05:57:03 - INFO - codeparrot_training - Step 34449: {'lr': 0.0004430032493671998, 'samples': 17638400, 'steps': 34449, 'loss/train': 2.482656478881836} +03/05/2022 05:57:07 - INFO - codeparrot_training - Step 34450: {'lr': 0.0004429998763212274, 'samples': 17638912, 'steps': 34450, 'loss/train': 1.4891188144683838} +03/05/2022 05:57:08 - INFO - codeparrot_training - Skipping example with length 494 (seq_length=1024) +03/05/2022 05:57:12 - INFO - codeparrot_training - Step 34451: {'lr': 0.00044299650318829233, 'samples': 17639424, 'steps': 34451, 'loss/train': 1.8637944459915161} +03/05/2022 05:57:15 - INFO - codeparrot_training - Step 34452: {'lr': 0.0004429931299683959, 'samples': 17639936, 'steps': 34452, 'loss/train': 1.5967692136764526} +03/05/2022 05:57:17 - INFO - codeparrot_training - Skipping example with length 427 (seq_length=1024) +03/05/2022 05:57:20 - INFO - codeparrot_training - Step 34453: {'lr': 0.0004429897566615398, 'samples': 17640448, 'steps': 34453, 'loss/train': 1.0530067682266235} +03/05/2022 05:57:24 - INFO - codeparrot_training - Step 34454: {'lr': 0.0004429863832677255, 'samples': 17640960, 'steps': 34454, 'loss/train': 2.082125186920166} +03/05/2022 05:57:26 - INFO - codeparrot_training - Skipping example with length 616 (seq_length=1024) +03/05/2022 05:57:29 - INFO - codeparrot_training - Step 34455: {'lr': 0.0004429830097869545, 'samples': 17641472, 'steps': 34455, 'loss/train': 0.6839268207550049} +03/05/2022 05:57:32 - INFO - codeparrot_training - Step 34456: {'lr': 0.0004429796362192283, 'samples': 17641984, 'steps': 34456, 'loss/train': 1.8771288394927979} +03/05/2022 05:57:34 - INFO - codeparrot_training - Skipping example with length 575 (seq_length=1024) +03/05/2022 05:57:38 - INFO - codeparrot_training - Step 34457: {'lr': 0.0004429762625645485, 'samples': 17642496, 'steps': 34457, 'loss/train': 2.4734363555908203} +03/05/2022 05:57:41 - INFO - codeparrot_training - Step 34458: {'lr': 0.0004429728888229166, 'samples': 17643008, 'steps': 34458, 'loss/train': 2.0212860107421875} +03/05/2022 05:57:43 - INFO - codeparrot_training - Skipping example with length 300 (seq_length=1024) +03/05/2022 05:57:46 - INFO - codeparrot_training - Step 34459: {'lr': 0.000442969514994334, 'samples': 17643520, 'steps': 34459, 'loss/train': 2.442194938659668} +03/05/2022 05:57:49 - INFO - codeparrot_training - Step 34460: {'lr': 0.0004429661410788024, 'samples': 17644032, 'steps': 34460, 'loss/train': 1.4718222618103027} +03/05/2022 05:57:51 - INFO - codeparrot_training - Skipping example with length 638 (seq_length=1024) +03/05/2022 05:57:54 - INFO - codeparrot_training - Step 34461: {'lr': 0.00044296276707632323, 'samples': 17644544, 'steps': 34461, 'loss/train': 1.0123987197875977} +03/05/2022 05:57:58 - INFO - codeparrot_training - Step 34462: {'lr': 0.000442959392986898, 'samples': 17645056, 'steps': 34462, 'loss/train': 1.391916275024414} +03/05/2022 05:57:59 - INFO - codeparrot_training - Skipping example with length 85 (seq_length=1024) +03/05/2022 05:58:03 - INFO - codeparrot_training - Step 34463: {'lr': 0.0004429560188105282, 'samples': 17645568, 'steps': 34463, 'loss/train': 1.7734508514404297} +03/05/2022 05:58:06 - INFO - codeparrot_training - Step 34464: {'lr': 0.00044295264454721544, 'samples': 17646080, 'steps': 34464, 'loss/train': 1.8301419019699097} +03/05/2022 05:58:09 - INFO - codeparrot_training - Skipping example with length 34 (seq_length=1024) +03/05/2022 05:58:11 - INFO - codeparrot_training - Step 34465: {'lr': 0.0004429492701969612, 'samples': 17646592, 'steps': 34465, 'loss/train': 1.7986633777618408} +03/05/2022 05:58:15 - INFO - codeparrot_training - Step 34466: {'lr': 0.00044294589575976696, 'samples': 17647104, 'steps': 34466, 'loss/train': 1.6322604417800903} +03/05/2022 05:58:17 - INFO - codeparrot_training - Skipping example with length 900 (seq_length=1024) +03/05/2022 05:58:20 - INFO - codeparrot_training - Step 34467: {'lr': 0.00044294252123563434, 'samples': 17647616, 'steps': 34467, 'loss/train': 1.8993381261825562} +03/05/2022 05:58:23 - INFO - codeparrot_training - Step 34468: {'lr': 0.00044293914662456475, 'samples': 17648128, 'steps': 34468, 'loss/train': 2.0840775966644287} +03/05/2022 05:58:25 - INFO - codeparrot_training - Skipping example with length 978 (seq_length=1024) +03/05/2022 05:58:28 - INFO - codeparrot_training - Step 34469: {'lr': 0.00044293577192655977, 'samples': 17648640, 'steps': 34469, 'loss/train': 1.587438702583313} +03/05/2022 05:58:32 - INFO - codeparrot_training - Step 34470: {'lr': 0.0004429323971416209, 'samples': 17649152, 'steps': 34470, 'loss/train': 1.7007900476455688} +03/05/2022 05:58:34 - INFO - codeparrot_training - Skipping example with length 920 (seq_length=1024) +03/05/2022 05:58:37 - INFO - codeparrot_training - Step 34471: {'lr': 0.0004429290222697497, 'samples': 17649664, 'steps': 34471, 'loss/train': 1.5698492527008057} +03/05/2022 05:58:40 - INFO - codeparrot_training - Step 34472: {'lr': 0.0004429256473109476, 'samples': 17650176, 'steps': 34472, 'loss/train': 1.1360188722610474} +03/05/2022 05:58:42 - INFO - codeparrot_training - Skipping example with length 126 (seq_length=1024) +03/05/2022 05:58:45 - INFO - codeparrot_training - Step 34473: {'lr': 0.0004429222722652162, 'samples': 17650688, 'steps': 34473, 'loss/train': 2.3210785388946533} +03/05/2022 05:58:48 - INFO - codeparrot_training - Step 34474: {'lr': 0.0004429188971325571, 'samples': 17651200, 'steps': 34474, 'loss/train': 1.236336350440979} +03/05/2022 05:58:51 - INFO - codeparrot_training - Skipping example with length 617 (seq_length=1024) +03/05/2022 05:58:54 - INFO - codeparrot_training - Step 34475: {'lr': 0.00044291552191297155, 'samples': 17651712, 'steps': 34475, 'loss/train': 2.191598415374756} +03/05/2022 05:58:57 - INFO - codeparrot_training - Step 34476: {'lr': 0.0004429121466064614, 'samples': 17652224, 'steps': 34476, 'loss/train': 1.911533236503601} +03/05/2022 05:58:59 - INFO - codeparrot_training - Skipping example with length 230 (seq_length=1024) +03/05/2022 05:59:02 - INFO - codeparrot_training - Step 34477: {'lr': 0.0004429087712130279, 'samples': 17652736, 'steps': 34477, 'loss/train': 2.01478910446167} +03/05/2022 05:59:05 - INFO - codeparrot_training - Step 34478: {'lr': 0.00044290539573267276, 'samples': 17653248, 'steps': 34478, 'loss/train': 2.3136849403381348} +03/05/2022 05:59:07 - INFO - codeparrot_training - Skipping example with length 773 (seq_length=1024) +03/05/2022 05:59:11 - INFO - codeparrot_training - Step 34479: {'lr': 0.00044290202016539736, 'samples': 17653760, 'steps': 34479, 'loss/train': 2.9014499187469482} +03/05/2022 05:59:14 - INFO - codeparrot_training - Step 34480: {'lr': 0.0004428986445112033, 'samples': 17654272, 'steps': 34480, 'loss/train': 1.076346516609192} +03/05/2022 05:59:16 - INFO - codeparrot_training - Skipping example with length 58 (seq_length=1024) +03/05/2022 05:59:19 - INFO - codeparrot_training - Step 34481: {'lr': 0.00044289526877009213, 'samples': 17654784, 'steps': 34481, 'loss/train': 1.359923005104065} +03/05/2022 05:59:22 - INFO - codeparrot_training - Step 34482: {'lr': 0.00044289189294206534, 'samples': 17655296, 'steps': 34482, 'loss/train': 1.3713167905807495} +03/05/2022 05:59:25 - INFO - codeparrot_training - Skipping example with length 617 (seq_length=1024) +03/05/2022 05:59:28 - INFO - codeparrot_training - Step 34483: {'lr': 0.0004428885170271244, 'samples': 17655808, 'steps': 34483, 'loss/train': 2.030492067337036} +03/05/2022 05:59:31 - INFO - codeparrot_training - Step 34484: {'lr': 0.0004428851410252709, 'samples': 17656320, 'steps': 34484, 'loss/train': 2.152890205383301} +03/05/2022 05:59:33 - INFO - codeparrot_training - Skipping example with length 641 (seq_length=1024) +03/05/2022 05:59:36 - INFO - codeparrot_training - Step 34485: {'lr': 0.0004428817649365063, 'samples': 17656832, 'steps': 34485, 'loss/train': 2.473890542984009} +03/05/2022 05:59:39 - INFO - codeparrot_training - Step 34486: {'lr': 0.0004428783887608321, 'samples': 17657344, 'steps': 34486, 'loss/train': 1.3030574321746826} +03/05/2022 05:59:42 - INFO - codeparrot_training - Skipping example with length 704 (seq_length=1024) +03/05/2022 05:59:44 - INFO - codeparrot_training - Step 34487: {'lr': 0.00044287501249824996, 'samples': 17657856, 'steps': 34487, 'loss/train': 1.1493401527404785} +03/05/2022 05:59:48 - INFO - codeparrot_training - Step 34488: {'lr': 0.0004428716361487613, 'samples': 17658368, 'steps': 34488, 'loss/train': 1.7590959072113037} +03/05/2022 05:59:50 - INFO - codeparrot_training - Skipping example with length 640 (seq_length=1024) +03/05/2022 05:59:53 - INFO - codeparrot_training - Step 34489: {'lr': 0.0004428682597123677, 'samples': 17658880, 'steps': 34489, 'loss/train': 0.6687783002853394} +03/05/2022 05:59:56 - INFO - codeparrot_training - Step 34490: {'lr': 0.0004428648831890705, 'samples': 17659392, 'steps': 34490, 'loss/train': 1.8729727268218994} +03/05/2022 05:59:59 - INFO - codeparrot_training - Step 34491: {'lr': 0.0004428615065788715, 'samples': 17659904, 'steps': 34491, 'loss/train': 1.6569838523864746} +03/05/2022 06:00:00 - INFO - codeparrot_training - Skipping example with length 340 (seq_length=1024) +03/05/2022 06:00:05 - INFO - codeparrot_training - Step 34492: {'lr': 0.00044285812988177197, 'samples': 17660416, 'steps': 34492, 'loss/train': 1.2252579927444458} +03/05/2022 06:00:08 - INFO - codeparrot_training - Step 34493: {'lr': 0.0004428547530977736, 'samples': 17660928, 'steps': 34493, 'loss/train': 1.933573842048645} +03/05/2022 06:00:08 - INFO - codeparrot_training - Skipping example with length 345 (seq_length=1024) +03/05/2022 06:00:13 - INFO - codeparrot_training - Step 34494: {'lr': 0.0004428513762268779, 'samples': 17661440, 'steps': 34494, 'loss/train': 1.1966859102249146} +03/05/2022 06:00:16 - INFO - codeparrot_training - Step 34495: {'lr': 0.00044284799926908627, 'samples': 17661952, 'steps': 34495, 'loss/train': 1.6820588111877441} +03/05/2022 06:00:17 - INFO - codeparrot_training - Skipping example with length 395 (seq_length=1024) +03/05/2022 06:00:22 - INFO - codeparrot_training - Step 34496: {'lr': 0.0004428446222244004, 'samples': 17662464, 'steps': 34496, 'loss/train': 1.6945387125015259} +03/05/2022 06:00:25 - INFO - codeparrot_training - Step 34497: {'lr': 0.0004428412450928216, 'samples': 17662976, 'steps': 34497, 'loss/train': 1.37456476688385} +03/05/2022 06:00:25 - INFO - codeparrot_training - Skipping example with length 119 (seq_length=1024) +03/05/2022 06:00:30 - INFO - codeparrot_training - Step 34498: {'lr': 0.00044283786787435156, 'samples': 17663488, 'steps': 34498, 'loss/train': 1.9964081048965454} +03/05/2022 06:00:33 - INFO - codeparrot_training - Step 34499: {'lr': 0.0004428344905689917, 'samples': 17664000, 'steps': 34499, 'loss/train': 1.551255464553833} +03/05/2022 06:00:34 - INFO - codeparrot_training - Skipping example with length 833 (seq_length=1024) +03/05/2022 06:00:38 - INFO - codeparrot_training - Step 34500: {'lr': 0.0004428311131767437, 'samples': 17664512, 'steps': 34500, 'loss/train': 1.8067249059677124} +03/05/2022 06:00:42 - INFO - codeparrot_training - Step 34501: {'lr': 0.0004428277356976089, 'samples': 17665024, 'steps': 34501, 'loss/train': 2.3206627368927} +03/05/2022 06:00:42 - INFO - codeparrot_training - Skipping example with length 212 (seq_length=1024) +03/05/2022 06:00:47 - INFO - codeparrot_training - Step 34502: {'lr': 0.0004428243581315889, 'samples': 17665536, 'steps': 34502, 'loss/train': 1.9363330602645874} +03/05/2022 06:00:50 - INFO - codeparrot_training - Step 34503: {'lr': 0.0004428209804786853, 'samples': 17666048, 'steps': 34503, 'loss/train': 1.4331533908843994} +03/05/2022 06:00:51 - INFO - codeparrot_training - Skipping example with length 609 (seq_length=1024) +03/05/2022 06:00:55 - INFO - codeparrot_training - Step 34504: {'lr': 0.0004428176027388995, 'samples': 17666560, 'steps': 34504, 'loss/train': 1.2737483978271484} +03/05/2022 06:00:58 - INFO - codeparrot_training - Step 34505: {'lr': 0.0004428142249122331, 'samples': 17667072, 'steps': 34505, 'loss/train': 1.9564390182495117} +03/05/2022 06:00:59 - INFO - codeparrot_training - Skipping example with length 36 (seq_length=1024) +03/05/2022 06:01:04 - INFO - codeparrot_training - Step 34506: {'lr': 0.00044281084699868747, 'samples': 17667584, 'steps': 34506, 'loss/train': 2.270721435546875} +03/05/2022 06:01:07 - INFO - codeparrot_training - Step 34507: {'lr': 0.0004428074689982643, 'samples': 17668096, 'steps': 34507, 'loss/train': 1.6944383382797241} +03/05/2022 06:01:08 - INFO - codeparrot_training - Skipping example with length 143 (seq_length=1024) +03/05/2022 06:01:12 - INFO - codeparrot_training - Step 34508: {'lr': 0.0004428040909109651, 'samples': 17668608, 'steps': 34508, 'loss/train': 1.8433403968811035} +03/05/2022 06:01:15 - INFO - codeparrot_training - Step 34509: {'lr': 0.00044280071273679133, 'samples': 17669120, 'steps': 34509, 'loss/train': 0.9025130867958069} +03/05/2022 06:01:16 - INFO - codeparrot_training - Skipping example with length 281 (seq_length=1024) +03/05/2022 06:01:21 - INFO - codeparrot_training - Step 34510: {'lr': 0.00044279733447574456, 'samples': 17669632, 'steps': 34510, 'loss/train': 1.6995915174484253} +03/05/2022 06:01:24 - INFO - codeparrot_training - Step 34511: {'lr': 0.00044279395612782625, 'samples': 17670144, 'steps': 34511, 'loss/train': 1.9385913610458374} +03/05/2022 06:01:24 - INFO - codeparrot_training - Skipping example with length 1021 (seq_length=1024) +03/05/2022 06:01:29 - INFO - codeparrot_training - Step 34512: {'lr': 0.0004427905776930379, 'samples': 17670656, 'steps': 34512, 'loss/train': 2.012213945388794} +03/05/2022 06:01:32 - INFO - codeparrot_training - Step 34513: {'lr': 0.0004427871991713812, 'samples': 17671168, 'steps': 34513, 'loss/train': 2.0768423080444336} +03/05/2022 06:01:32 - INFO - codeparrot_training - Skipping example with length 355 (seq_length=1024) +03/05/2022 06:01:37 - INFO - codeparrot_training - Step 34514: {'lr': 0.0004427838205628575, 'samples': 17671680, 'steps': 34514, 'loss/train': 0.9320793747901917} +03/05/2022 06:01:41 - INFO - codeparrot_training - Step 34515: {'lr': 0.0004427804418674684, 'samples': 17672192, 'steps': 34515, 'loss/train': 1.0418295860290527} +03/05/2022 06:01:41 - INFO - codeparrot_training - Skipping example with length 823 (seq_length=1024) +03/05/2022 06:01:46 - INFO - codeparrot_training - Step 34516: {'lr': 0.00044277706308521543, 'samples': 17672704, 'steps': 34516, 'loss/train': 2.046491861343384} +03/05/2022 06:01:49 - INFO - codeparrot_training - Step 34517: {'lr': 0.0004427736842161001, 'samples': 17673216, 'steps': 34517, 'loss/train': 0.33359941840171814} +03/05/2022 06:01:49 - INFO - codeparrot_training - Skipping example with length 868 (seq_length=1024) +03/05/2022 06:01:55 - INFO - codeparrot_training - Step 34518: {'lr': 0.00044277030526012386, 'samples': 17673728, 'steps': 34518, 'loss/train': 2.0205187797546387} +03/05/2022 06:01:58 - INFO - codeparrot_training - Step 34519: {'lr': 0.0004427669262172883, 'samples': 17674240, 'steps': 34519, 'loss/train': 2.1777687072753906} +03/05/2022 06:02:00 - INFO - codeparrot_training - Skipping example with length 98 (seq_length=1024) +03/05/2022 06:02:03 - INFO - codeparrot_training - Step 34520: {'lr': 0.000442763547087595, 'samples': 17674752, 'steps': 34520, 'loss/train': 1.5915614366531372} +03/05/2022 06:02:06 - INFO - codeparrot_training - Step 34521: {'lr': 0.00044276016787104535, 'samples': 17675264, 'steps': 34521, 'loss/train': 2.315542221069336} +03/05/2022 06:02:09 - INFO - codeparrot_training - Skipping example with length 579 (seq_length=1024) +03/05/2022 06:02:12 - INFO - codeparrot_training - Step 34522: {'lr': 0.000442756788567641, 'samples': 17675776, 'steps': 34522, 'loss/train': 1.3581876754760742} +03/05/2022 06:02:15 - INFO - codeparrot_training - Step 34523: {'lr': 0.0004427534091773834, 'samples': 17676288, 'steps': 34523, 'loss/train': 1.4427965879440308} +03/05/2022 06:02:17 - INFO - codeparrot_training - Skipping example with length 673 (seq_length=1024) +03/05/2022 06:02:20 - INFO - codeparrot_training - Step 34524: {'lr': 0.00044275002970027403, 'samples': 17676800, 'steps': 34524, 'loss/train': 0.5988059043884277} +03/05/2022 06:02:23 - INFO - codeparrot_training - Step 34525: {'lr': 0.00044274665013631457, 'samples': 17677312, 'steps': 34525, 'loss/train': 2.2581124305725098} +03/05/2022 06:02:26 - INFO - codeparrot_training - Skipping example with length 714 (seq_length=1024) +03/05/2022 06:02:29 - INFO - codeparrot_training - Step 34526: {'lr': 0.0004427432704855064, 'samples': 17677824, 'steps': 34526, 'loss/train': 2.050006151199341} +03/05/2022 06:02:32 - INFO - codeparrot_training - Step 34527: {'lr': 0.000442739890747851, 'samples': 17678336, 'steps': 34527, 'loss/train': 1.5434801578521729} +03/05/2022 06:02:34 - INFO - codeparrot_training - Skipping example with length 1017 (seq_length=1024) +03/05/2022 06:02:37 - INFO - codeparrot_training - Step 34528: {'lr': 0.0004427365109233502, 'samples': 17678848, 'steps': 34528, 'loss/train': 1.1500861644744873} +03/05/2022 06:02:40 - INFO - codeparrot_training - Step 34529: {'lr': 0.00044273313101200507, 'samples': 17679360, 'steps': 34529, 'loss/train': 1.921228289604187} +03/05/2022 06:02:42 - INFO - codeparrot_training - Skipping example with length 179 (seq_length=1024) +03/05/2022 06:02:45 - INFO - codeparrot_training - Step 34530: {'lr': 0.00044272975101381754, 'samples': 17679872, 'steps': 34530, 'loss/train': 1.23170006275177} +03/05/2022 06:02:49 - INFO - codeparrot_training - Step 34531: {'lr': 0.0004427263709287889, 'samples': 17680384, 'steps': 34531, 'loss/train': 1.8685948848724365} +03/05/2022 06:02:51 - INFO - codeparrot_training - Skipping example with length 799 (seq_length=1024) +03/05/2022 06:02:54 - INFO - codeparrot_training - Step 34532: {'lr': 0.00044272299075692067, 'samples': 17680896, 'steps': 34532, 'loss/train': 1.5906106233596802} +03/05/2022 06:02:57 - INFO - codeparrot_training - Step 34533: {'lr': 0.0004427196104982145, 'samples': 17681408, 'steps': 34533, 'loss/train': 0.545563280582428} +03/05/2022 06:02:59 - INFO - codeparrot_training - Skipping example with length 591 (seq_length=1024) +03/05/2022 06:03:02 - INFO - codeparrot_training - Step 34534: {'lr': 0.0004427162301526718, 'samples': 17681920, 'steps': 34534, 'loss/train': 1.0510560274124146} +03/05/2022 06:03:06 - INFO - codeparrot_training - Step 34535: {'lr': 0.0004427128497202941, 'samples': 17682432, 'steps': 34535, 'loss/train': 1.3369512557983398} +03/05/2022 06:03:08 - INFO - codeparrot_training - Skipping example with length 339 (seq_length=1024) +03/05/2022 06:03:11 - INFO - codeparrot_training - Step 34536: {'lr': 0.00044270946920108305, 'samples': 17682944, 'steps': 34536, 'loss/train': 1.617935299873352} +03/05/2022 06:03:14 - INFO - codeparrot_training - Step 34537: {'lr': 0.00044270608859504006, 'samples': 17683456, 'steps': 34537, 'loss/train': 0.6327489614486694} +03/05/2022 06:03:16 - INFO - codeparrot_training - Skipping example with length 445 (seq_length=1024) +03/05/2022 06:03:19 - INFO - codeparrot_training - Step 34538: {'lr': 0.0004427027079021667, 'samples': 17683968, 'steps': 34538, 'loss/train': 0.8658568263053894} +03/05/2022 06:03:22 - INFO - codeparrot_training - Step 34539: {'lr': 0.0004426993271224645, 'samples': 17684480, 'steps': 34539, 'loss/train': 1.9620453119277954} +03/05/2022 06:03:24 - INFO - codeparrot_training - Skipping example with length 156 (seq_length=1024) +03/05/2022 06:03:28 - INFO - codeparrot_training - Step 34540: {'lr': 0.0004426959462559349, 'samples': 17684992, 'steps': 34540, 'loss/train': 1.5879038572311401} +03/05/2022 06:03:31 - INFO - codeparrot_training - Step 34541: {'lr': 0.0004426925653025795, 'samples': 17685504, 'steps': 34541, 'loss/train': 2.1064929962158203} +03/05/2022 06:03:33 - INFO - codeparrot_training - Skipping example with length 979 (seq_length=1024) +03/05/2022 06:03:36 - INFO - codeparrot_training - Step 34542: {'lr': 0.0004426891842623998, 'samples': 17686016, 'steps': 34542, 'loss/train': 1.9624521732330322} +03/05/2022 06:03:39 - INFO - codeparrot_training - Step 34543: {'lr': 0.0004426858031353973, 'samples': 17686528, 'steps': 34543, 'loss/train': 2.1045734882354736} +03/05/2022 06:03:41 - INFO - codeparrot_training - Skipping example with length 861 (seq_length=1024) +03/05/2022 06:03:44 - INFO - codeparrot_training - Step 34544: {'lr': 0.0004426824219215736, 'samples': 17687040, 'steps': 34544, 'loss/train': 1.2236227989196777} +03/05/2022 06:03:48 - INFO - codeparrot_training - Step 34545: {'lr': 0.00044267904062093014, 'samples': 17687552, 'steps': 34545, 'loss/train': 1.5783729553222656} +03/05/2022 06:03:49 - INFO - codeparrot_training - Skipping example with length 694 (seq_length=1024) +03/05/2022 06:03:53 - INFO - codeparrot_training - Step 34546: {'lr': 0.0004426756592334685, 'samples': 17688064, 'steps': 34546, 'loss/train': 1.6775139570236206} +03/05/2022 06:03:56 - INFO - codeparrot_training - Step 34547: {'lr': 0.0004426722777591902, 'samples': 17688576, 'steps': 34547, 'loss/train': 1.333911657333374} +03/05/2022 06:03:58 - INFO - codeparrot_training - Skipping example with length 136 (seq_length=1024) +03/05/2022 06:04:01 - INFO - codeparrot_training - Step 34548: {'lr': 0.00044266889619809665, 'samples': 17689088, 'steps': 34548, 'loss/train': 1.4337565898895264} +03/05/2022 06:04:05 - INFO - codeparrot_training - Step 34549: {'lr': 0.00044266551455018953, 'samples': 17689600, 'steps': 34549, 'loss/train': 1.3708990812301636} +03/05/2022 06:04:06 - INFO - codeparrot_training - Skipping example with length 1005 (seq_length=1024) +03/05/2022 06:04:10 - INFO - codeparrot_training - Step 34550: {'lr': 0.0004426621328154703, 'samples': 17690112, 'steps': 34550, 'loss/train': 1.552330493927002} +03/05/2022 06:04:13 - INFO - codeparrot_training - Step 34551: {'lr': 0.0004426587509939405, 'samples': 17690624, 'steps': 34551, 'loss/train': 1.8199992179870605} +03/05/2022 06:04:14 - INFO - codeparrot_training - Skipping example with length 400 (seq_length=1024) +03/05/2022 06:04:18 - INFO - codeparrot_training - Step 34552: {'lr': 0.0004426553690856016, 'samples': 17691136, 'steps': 34552, 'loss/train': 0.3973861336708069} +03/05/2022 06:04:22 - INFO - codeparrot_training - Step 34553: {'lr': 0.0004426519870904552, 'samples': 17691648, 'steps': 34553, 'loss/train': 1.7761049270629883} +03/05/2022 06:04:23 - INFO - codeparrot_training - Skipping example with length 405 (seq_length=1024) +03/05/2022 06:04:27 - INFO - codeparrot_training - Step 34554: {'lr': 0.0004426486050085028, 'samples': 17692160, 'steps': 34554, 'loss/train': 1.829074740409851} +03/05/2022 06:04:30 - INFO - codeparrot_training - Step 34555: {'lr': 0.0004426452228397458, 'samples': 17692672, 'steps': 34555, 'loss/train': 0.055017683655023575} +03/05/2022 06:04:31 - INFO - codeparrot_training - Skipping example with length 568 (seq_length=1024) +03/05/2022 06:04:35 - INFO - codeparrot_training - Step 34556: {'lr': 0.000442641840584186, 'samples': 17693184, 'steps': 34556, 'loss/train': 1.1627459526062012} +03/05/2022 06:04:38 - INFO - codeparrot_training - Step 34557: {'lr': 0.00044263845824182467, 'samples': 17693696, 'steps': 34557, 'loss/train': 2.321988582611084} +03/05/2022 06:04:40 - INFO - codeparrot_training - Skipping example with length 44 (seq_length=1024) +03/05/2022 06:04:44 - INFO - codeparrot_training - Step 34558: {'lr': 0.0004426350758126634, 'samples': 17694208, 'steps': 34558, 'loss/train': 1.952880859375} +03/05/2022 06:04:47 - INFO - codeparrot_training - Step 34559: {'lr': 0.0004426316932967038, 'samples': 17694720, 'steps': 34559, 'loss/train': 1.6647371053695679} +03/05/2022 06:04:48 - INFO - codeparrot_training - Skipping example with length 946 (seq_length=1024) +03/05/2022 06:04:52 - INFO - codeparrot_training - Step 34560: {'lr': 0.0004426283106939473, 'samples': 17695232, 'steps': 34560, 'loss/train': 0.7882624864578247} +03/05/2022 06:04:55 - INFO - codeparrot_training - Step 34561: {'lr': 0.00044262492800439547, 'samples': 17695744, 'steps': 34561, 'loss/train': 1.3706730604171753} +03/05/2022 06:04:56 - INFO - codeparrot_training - Skipping example with length 744 (seq_length=1024) +03/05/2022 06:05:01 - INFO - codeparrot_training - Step 34562: {'lr': 0.00044262154522804986, 'samples': 17696256, 'steps': 34562, 'loss/train': 0.4932713806629181} +03/05/2022 06:05:04 - INFO - codeparrot_training - Step 34563: {'lr': 0.00044261816236491186, 'samples': 17696768, 'steps': 34563, 'loss/train': 1.73300039768219} +03/05/2022 06:05:05 - INFO - codeparrot_training - Skipping example with length 530 (seq_length=1024) +03/05/2022 06:05:09 - INFO - codeparrot_training - Step 34564: {'lr': 0.00044261477941498316, 'samples': 17697280, 'steps': 34564, 'loss/train': 1.480662226676941} +03/05/2022 06:05:12 - INFO - codeparrot_training - Step 34565: {'lr': 0.0004426113963782652, 'samples': 17697792, 'steps': 34565, 'loss/train': 1.805383324623108} +03/05/2022 06:05:14 - INFO - codeparrot_training - Skipping example with length 303 (seq_length=1024) +03/05/2022 06:05:18 - INFO - codeparrot_training - Step 34566: {'lr': 0.00044260801325475953, 'samples': 17698304, 'steps': 34566, 'loss/train': 2.316495180130005} +03/05/2022 06:05:21 - INFO - codeparrot_training - Step 34567: {'lr': 0.0004426046300444676, 'samples': 17698816, 'steps': 34567, 'loss/train': 1.5681407451629639} +03/05/2022 06:05:22 - INFO - codeparrot_training - Skipping example with length 96 (seq_length=1024) +03/05/2022 06:05:26 - INFO - codeparrot_training - Step 34568: {'lr': 0.000442601246747391, 'samples': 17699328, 'steps': 34568, 'loss/train': 1.744669795036316} +03/05/2022 06:05:29 - INFO - codeparrot_training - Step 34569: {'lr': 0.0004425978633635313, 'samples': 17699840, 'steps': 34569, 'loss/train': 1.7447888851165771} +03/05/2022 06:05:31 - INFO - codeparrot_training - Skipping example with length 769 (seq_length=1024) +03/05/2022 06:05:34 - INFO - codeparrot_training - Step 34570: {'lr': 0.0004425944798928899, 'samples': 17700352, 'steps': 34570, 'loss/train': 1.3900948762893677} +03/05/2022 06:05:38 - INFO - codeparrot_training - Step 34571: {'lr': 0.0004425910963354685, 'samples': 17700864, 'steps': 34571, 'loss/train': 1.8431289196014404} +03/05/2022 06:05:39 - INFO - codeparrot_training - Skipping example with length 843 (seq_length=1024) +03/05/2022 06:05:43 - INFO - codeparrot_training - Step 34572: {'lr': 0.0004425877126912685, 'samples': 17701376, 'steps': 34572, 'loss/train': 1.8359674215316772} +03/05/2022 06:05:46 - INFO - codeparrot_training - Step 34573: {'lr': 0.00044258432896029145, 'samples': 17701888, 'steps': 34573, 'loss/train': 1.255735993385315} +03/05/2022 06:05:48 - INFO - codeparrot_training - Skipping example with length 52 (seq_length=1024) +03/05/2022 06:05:52 - INFO - codeparrot_training - Step 34574: {'lr': 0.00044258094514253876, 'samples': 17702400, 'steps': 34574, 'loss/train': 1.9837300777435303} +03/05/2022 06:05:55 - INFO - codeparrot_training - Step 34575: {'lr': 0.00044257756123801216, 'samples': 17702912, 'steps': 34575, 'loss/train': 0.6697525382041931} +03/05/2022 06:05:56 - INFO - codeparrot_training - Skipping example with length 264 (seq_length=1024) +03/05/2022 06:06:00 - INFO - codeparrot_training - Step 34576: {'lr': 0.0004425741772467131, 'samples': 17703424, 'steps': 34576, 'loss/train': 1.7515296936035156} +03/05/2022 06:06:03 - INFO - codeparrot_training - Step 34577: {'lr': 0.0004425707931686431, 'samples': 17703936, 'steps': 34577, 'loss/train': 1.8513121604919434} +03/05/2022 06:06:05 - INFO - codeparrot_training - Skipping example with length 434 (seq_length=1024) +03/05/2022 06:06:09 - INFO - codeparrot_training - Step 34578: {'lr': 0.00044256740900380364, 'samples': 17704448, 'steps': 34578, 'loss/train': 1.9542770385742188} +03/05/2022 06:06:12 - INFO - codeparrot_training - Step 34579: {'lr': 0.0004425640247521963, 'samples': 17704960, 'steps': 34579, 'loss/train': 1.866998314857483} +03/05/2022 06:06:14 - INFO - codeparrot_training - Skipping example with length 255 (seq_length=1024) +03/05/2022 06:06:17 - INFO - codeparrot_training - Step 34580: {'lr': 0.00044256064041382255, 'samples': 17705472, 'steps': 34580, 'loss/train': 1.4035999774932861} +03/05/2022 06:06:20 - INFO - codeparrot_training - Step 34581: {'lr': 0.0004425572559886839, 'samples': 17705984, 'steps': 34581, 'loss/train': 2.0088398456573486} +03/05/2022 06:06:23 - INFO - codeparrot_training - Skipping example with length 547 (seq_length=1024) +03/05/2022 06:06:26 - INFO - codeparrot_training - Step 34582: {'lr': 0.00044255387147678206, 'samples': 17706496, 'steps': 34582, 'loss/train': 1.5861475467681885} +03/05/2022 06:06:29 - INFO - codeparrot_training - Step 34583: {'lr': 0.0004425504868781183, 'samples': 17707008, 'steps': 34583, 'loss/train': 1.9714163541793823} +03/05/2022 06:06:31 - INFO - codeparrot_training - Skipping example with length 599 (seq_length=1024) +03/05/2022 06:06:34 - INFO - codeparrot_training - Step 34584: {'lr': 0.0004425471021926943, 'samples': 17707520, 'steps': 34584, 'loss/train': 2.1568093299865723} +03/05/2022 06:06:37 - INFO - codeparrot_training - Step 34585: {'lr': 0.0004425437174205115, 'samples': 17708032, 'steps': 34585, 'loss/train': 1.5789313316345215} +03/05/2022 06:06:40 - INFO - codeparrot_training - Skipping example with length 618 (seq_length=1024) +03/05/2022 06:06:43 - INFO - codeparrot_training - Step 34586: {'lr': 0.00044254033256157154, 'samples': 17708544, 'steps': 34586, 'loss/train': 1.2729425430297852} +03/05/2022 06:06:46 - INFO - codeparrot_training - Step 34587: {'lr': 0.0004425369476158759, 'samples': 17709056, 'steps': 34587, 'loss/train': 1.4998366832733154} +03/05/2022 06:06:48 - INFO - codeparrot_training - Skipping example with length 470 (seq_length=1024) +03/05/2022 06:06:51 - INFO - codeparrot_training - Step 34588: {'lr': 0.000442533562583426, 'samples': 17709568, 'steps': 34588, 'loss/train': 1.6784372329711914} +03/05/2022 06:06:54 - INFO - codeparrot_training - Step 34589: {'lr': 0.00044253017746422355, 'samples': 17710080, 'steps': 34589, 'loss/train': 2.341175079345703} +03/05/2022 06:06:56 - INFO - codeparrot_training - Skipping example with length 159 (seq_length=1024) +03/05/2022 06:07:00 - INFO - codeparrot_training - Step 34590: {'lr': 0.00044252679225826984, 'samples': 17710592, 'steps': 34590, 'loss/train': 1.6452728509902954} +03/05/2022 06:07:03 - INFO - codeparrot_training - Step 34591: {'lr': 0.0004425234069655666, 'samples': 17711104, 'steps': 34591, 'loss/train': 1.3519376516342163} +03/05/2022 06:07:05 - INFO - codeparrot_training - Skipping example with length 756 (seq_length=1024) +03/05/2022 06:07:08 - INFO - codeparrot_training - Step 34592: {'lr': 0.0004425200215861153, 'samples': 17711616, 'steps': 34592, 'loss/train': 0.897087037563324} +03/05/2022 06:07:11 - INFO - codeparrot_training - Step 34593: {'lr': 0.00044251663611991743, 'samples': 17712128, 'steps': 34593, 'loss/train': 0.7061640620231628} +03/05/2022 06:07:13 - INFO - codeparrot_training - Skipping example with length 92 (seq_length=1024) +03/05/2022 06:07:16 - INFO - codeparrot_training - Step 34594: {'lr': 0.0004425132505669745, 'samples': 17712640, 'steps': 34594, 'loss/train': 1.88649320602417} +03/05/2022 06:07:19 - INFO - codeparrot_training - Step 34595: {'lr': 0.00044250986492728805, 'samples': 17713152, 'steps': 34595, 'loss/train': 1.4049944877624512} +03/05/2022 06:07:22 - INFO - codeparrot_training - Skipping example with length 1015 (seq_length=1024) +03/05/2022 06:07:25 - INFO - codeparrot_training - Step 34596: {'lr': 0.0004425064792008597, 'samples': 17713664, 'steps': 34596, 'loss/train': 0.05822386220097542} +03/05/2022 06:07:28 - INFO - codeparrot_training - Step 34597: {'lr': 0.0004425030933876909, 'samples': 17714176, 'steps': 34597, 'loss/train': 1.9433174133300781} +03/05/2022 06:07:30 - INFO - codeparrot_training - Skipping example with length 722 (seq_length=1024) +03/05/2022 06:07:33 - INFO - codeparrot_training - Step 34598: {'lr': 0.0004424997074877831, 'samples': 17714688, 'steps': 34598, 'loss/train': 1.0996251106262207} +03/05/2022 06:07:36 - INFO - codeparrot_training - Step 34599: {'lr': 0.00044249632150113806, 'samples': 17715200, 'steps': 34599, 'loss/train': 2.2290470600128174} +03/05/2022 06:07:38 - INFO - codeparrot_training - Skipping example with length 305 (seq_length=1024) +03/05/2022 06:07:42 - INFO - codeparrot_training - Step 34600: {'lr': 0.000442492935427757, 'samples': 17715712, 'steps': 34600, 'loss/train': 1.7642180919647217} +03/05/2022 06:07:45 - INFO - codeparrot_training - Step 34601: {'lr': 0.00044248954926764164, 'samples': 17716224, 'steps': 34601, 'loss/train': 1.7567397356033325} +03/05/2022 06:07:47 - INFO - codeparrot_training - Skipping example with length 347 (seq_length=1024) +03/05/2022 06:07:50 - INFO - codeparrot_training - Step 34602: {'lr': 0.0004424861630207935, 'samples': 17716736, 'steps': 34602, 'loss/train': 2.0870018005371094} +03/05/2022 06:07:53 - INFO - codeparrot_training - Step 34603: {'lr': 0.00044248277668721396, 'samples': 17717248, 'steps': 34603, 'loss/train': 1.5389583110809326} +03/05/2022 06:07:55 - INFO - codeparrot_training - Skipping example with length 994 (seq_length=1024) +03/05/2022 06:07:59 - INFO - codeparrot_training - Step 34604: {'lr': 0.00044247939026690475, 'samples': 17717760, 'steps': 34604, 'loss/train': 1.2625257968902588} +03/05/2022 06:08:02 - INFO - codeparrot_training - Step 34605: {'lr': 0.0004424760037598673, 'samples': 17718272, 'steps': 34605, 'loss/train': 1.3623377084732056} +03/05/2022 06:08:04 - INFO - codeparrot_training - Skipping example with length 121 (seq_length=1024) +03/05/2022 06:08:07 - INFO - codeparrot_training - Step 34606: {'lr': 0.00044247261716610307, 'samples': 17718784, 'steps': 34606, 'loss/train': 1.6758027076721191} +03/05/2022 06:08:11 - INFO - codeparrot_training - Step 34607: {'lr': 0.0004424692304856136, 'samples': 17719296, 'steps': 34607, 'loss/train': 2.121821403503418} +03/05/2022 06:08:13 - INFO - codeparrot_training - Skipping example with length 614 (seq_length=1024) +03/05/2022 06:08:16 - INFO - codeparrot_training - Step 34608: {'lr': 0.0004424658437184006, 'samples': 17719808, 'steps': 34608, 'loss/train': 6.4753804206848145} +03/05/2022 06:08:19 - INFO - codeparrot_training - Step 34609: {'lr': 0.0004424624568644654, 'samples': 17720320, 'steps': 34609, 'loss/train': 2.092836856842041} +03/05/2022 06:08:22 - INFO - codeparrot_training - Skipping example with length 176 (seq_length=1024) +03/05/2022 06:08:24 - INFO - codeparrot_training - Step 34610: {'lr': 0.00044245906992380955, 'samples': 17720832, 'steps': 34610, 'loss/train': 2.1099298000335693} +03/05/2022 06:08:27 - INFO - codeparrot_training - Step 34611: {'lr': 0.0004424556828964347, 'samples': 17721344, 'steps': 34611, 'loss/train': 0.7350862622261047} +03/05/2022 06:08:30 - INFO - codeparrot_training - Skipping example with length 211 (seq_length=1024) +03/05/2022 06:08:33 - INFO - codeparrot_training - Step 34612: {'lr': 0.0004424522957823422, 'samples': 17721856, 'steps': 34612, 'loss/train': 1.220876932144165} +03/05/2022 06:08:36 - INFO - codeparrot_training - Step 34613: {'lr': 0.00044244890858153376, 'samples': 17722368, 'steps': 34613, 'loss/train': 1.487913966178894} +03/05/2022 06:08:38 - INFO - codeparrot_training - Skipping example with length 279 (seq_length=1024) +03/05/2022 06:08:41 - INFO - codeparrot_training - Step 34614: {'lr': 0.00044244552129401075, 'samples': 17722880, 'steps': 34614, 'loss/train': 0.24374724924564362} +03/05/2022 06:08:44 - INFO - codeparrot_training - Step 34615: {'lr': 0.0004424421339197747, 'samples': 17723392, 'steps': 34615, 'loss/train': 1.81853187084198} +03/05/2022 06:08:47 - INFO - codeparrot_training - Skipping example with length 891 (seq_length=1024) +03/05/2022 06:08:49 - INFO - codeparrot_training - Step 34616: {'lr': 0.00044243874645882733, 'samples': 17723904, 'steps': 34616, 'loss/train': 1.776626706123352} +03/05/2022 06:08:53 - INFO - codeparrot_training - Step 34617: {'lr': 0.0004424353589111699, 'samples': 17724416, 'steps': 34617, 'loss/train': 2.194687843322754} +03/05/2022 06:08:55 - INFO - codeparrot_training - Skipping example with length 725 (seq_length=1024) +03/05/2022 06:08:58 - INFO - codeparrot_training - Step 34618: {'lr': 0.0004424319712768041, 'samples': 17724928, 'steps': 34618, 'loss/train': 1.2187559604644775} +03/05/2022 06:09:01 - INFO - codeparrot_training - Step 34619: {'lr': 0.00044242858355573143, 'samples': 17725440, 'steps': 34619, 'loss/train': 2.320472002029419} +03/05/2022 06:09:05 - INFO - codeparrot_training - Step 34620: {'lr': 0.00044242519574795347, 'samples': 17725952, 'steps': 34620, 'loss/train': 1.5902724266052246} +03/05/2022 06:09:06 - INFO - codeparrot_training - Skipping example with length 414 (seq_length=1024) +03/05/2022 06:09:10 - INFO - codeparrot_training - Step 34621: {'lr': 0.00044242180785347164, 'samples': 17726464, 'steps': 34621, 'loss/train': 1.8483232259750366} +03/05/2022 06:09:13 - INFO - codeparrot_training - Step 34622: {'lr': 0.00044241841987228747, 'samples': 17726976, 'steps': 34622, 'loss/train': 2.2183682918548584} +03/05/2022 06:09:14 - INFO - codeparrot_training - Skipping example with length 686 (seq_length=1024) +03/05/2022 06:09:18 - INFO - codeparrot_training - Step 34623: {'lr': 0.00044241503180440263, 'samples': 17727488, 'steps': 34623, 'loss/train': 1.461199164390564} +03/05/2022 06:09:22 - INFO - codeparrot_training - Step 34624: {'lr': 0.0004424116436498185, 'samples': 17728000, 'steps': 34624, 'loss/train': 1.8575831651687622} +03/05/2022 06:09:23 - INFO - codeparrot_training - Skipping example with length 169 (seq_length=1024) +03/05/2022 06:09:27 - INFO - codeparrot_training - Step 34625: {'lr': 0.0004424082554085366, 'samples': 17728512, 'steps': 34625, 'loss/train': 2.330263376235962} +03/05/2022 06:09:30 - INFO - codeparrot_training - Step 34626: {'lr': 0.0004424048670805586, 'samples': 17729024, 'steps': 34626, 'loss/train': 0.7419248819351196} +03/05/2022 06:09:31 - INFO - codeparrot_training - Skipping example with length 209 (seq_length=1024) +03/05/2022 06:09:35 - INFO - codeparrot_training - Step 34627: {'lr': 0.0004424014786658859, 'samples': 17729536, 'steps': 34627, 'loss/train': 0.8694044351577759} +03/05/2022 06:09:38 - INFO - codeparrot_training - Step 34628: {'lr': 0.00044239809016452, 'samples': 17730048, 'steps': 34628, 'loss/train': 1.6624994277954102} +03/05/2022 06:09:40 - INFO - codeparrot_training - Skipping example with length 781 (seq_length=1024) +03/05/2022 06:09:44 - INFO - codeparrot_training - Step 34629: {'lr': 0.00044239470157646254, 'samples': 17730560, 'steps': 34629, 'loss/train': 1.5681383609771729} +03/05/2022 06:09:47 - INFO - codeparrot_training - Step 34630: {'lr': 0.000442391312901715, 'samples': 17731072, 'steps': 34630, 'loss/train': 1.7738909721374512} +03/05/2022 06:09:48 - INFO - codeparrot_training - Skipping example with length 816 (seq_length=1024) +03/05/2022 06:09:52 - INFO - codeparrot_training - Step 34631: {'lr': 0.0004423879241402788, 'samples': 17731584, 'steps': 34631, 'loss/train': 1.7575047016143799} +03/05/2022 06:09:55 - INFO - codeparrot_training - Step 34632: {'lr': 0.00044238453529215575, 'samples': 17732096, 'steps': 34632, 'loss/train': 0.6281212568283081} +03/05/2022 06:09:57 - INFO - codeparrot_training - Skipping example with length 327 (seq_length=1024) +03/05/2022 06:10:01 - INFO - codeparrot_training - Step 34633: {'lr': 0.00044238114635734713, 'samples': 17732608, 'steps': 34633, 'loss/train': 1.2663601636886597} +03/05/2022 06:10:04 - INFO - codeparrot_training - Step 34634: {'lr': 0.0004423777573358545, 'samples': 17733120, 'steps': 34634, 'loss/train': 0.7107919454574585} +03/05/2022 06:10:05 - INFO - codeparrot_training - Skipping example with length 260 (seq_length=1024) +03/05/2022 06:10:09 - INFO - codeparrot_training - Step 34635: {'lr': 0.0004423743682276794, 'samples': 17733632, 'steps': 34635, 'loss/train': 0.693023681640625} +03/05/2022 06:10:12 - INFO - codeparrot_training - Step 34636: {'lr': 0.0004423709790328235, 'samples': 17734144, 'steps': 34636, 'loss/train': 2.307650327682495} +03/05/2022 06:10:14 - INFO - codeparrot_training - Skipping example with length 571 (seq_length=1024) +03/05/2022 06:10:18 - INFO - codeparrot_training - Step 34637: {'lr': 0.0004423675897512881, 'samples': 17734656, 'steps': 34637, 'loss/train': 0.9209141731262207} +03/05/2022 06:10:21 - INFO - codeparrot_training - Step 34638: {'lr': 0.0004423642003830748, 'samples': 17735168, 'steps': 34638, 'loss/train': 1.7870094776153564} +03/05/2022 06:10:22 - INFO - codeparrot_training - Skipping example with length 854 (seq_length=1024) +03/05/2022 06:10:26 - INFO - codeparrot_training - Step 34639: {'lr': 0.00044236081092818527, 'samples': 17735680, 'steps': 34639, 'loss/train': 1.7178212404251099} +03/05/2022 06:10:29 - INFO - codeparrot_training - Step 34640: {'lr': 0.00044235742138662085, 'samples': 17736192, 'steps': 34640, 'loss/train': 1.360457420349121} +03/05/2022 06:10:31 - INFO - codeparrot_training - Skipping example with length 701 (seq_length=1024) +03/05/2022 06:10:35 - INFO - codeparrot_training - Step 34641: {'lr': 0.0004423540317583832, 'samples': 17736704, 'steps': 34641, 'loss/train': 1.5048810243606567} +03/05/2022 06:10:38 - INFO - codeparrot_training - Step 34642: {'lr': 0.00044235064204347377, 'samples': 17737216, 'steps': 34642, 'loss/train': 1.6018308401107788} +03/05/2022 06:10:40 - INFO - codeparrot_training - Skipping example with length 858 (seq_length=1024) +03/05/2022 06:10:43 - INFO - codeparrot_training - Step 34643: {'lr': 0.0004423472522418941, 'samples': 17737728, 'steps': 34643, 'loss/train': 1.799862265586853} +03/05/2022 06:10:46 - INFO - codeparrot_training - Step 34644: {'lr': 0.0004423438623536457, 'samples': 17738240, 'steps': 34644, 'loss/train': 1.9152681827545166} +03/05/2022 06:10:48 - INFO - codeparrot_training - Skipping example with length 588 (seq_length=1024) +03/05/2022 06:10:51 - INFO - codeparrot_training - Step 34645: {'lr': 0.0004423404723787301, 'samples': 17738752, 'steps': 34645, 'loss/train': 1.3875528573989868} +03/05/2022 06:10:55 - INFO - codeparrot_training - Step 34646: {'lr': 0.000442337082317149, 'samples': 17739264, 'steps': 34646, 'loss/train': 2.1265366077423096} +03/05/2022 06:10:57 - INFO - codeparrot_training - Skipping example with length 175 (seq_length=1024) +03/05/2022 06:11:00 - INFO - codeparrot_training - Step 34647: {'lr': 0.0004423336921689036, 'samples': 17739776, 'steps': 34647, 'loss/train': 0.784816324710846} +03/05/2022 06:11:03 - INFO - codeparrot_training - Step 34648: {'lr': 0.0004423303019339957, 'samples': 17740288, 'steps': 34648, 'loss/train': 0.8291152715682983} +03/05/2022 06:11:05 - INFO - codeparrot_training - Skipping example with length 395 (seq_length=1024) +03/05/2022 06:11:08 - INFO - codeparrot_training - Step 34649: {'lr': 0.0004423269116124267, 'samples': 17740800, 'steps': 34649, 'loss/train': 1.6914132833480835} +03/05/2022 06:11:11 - INFO - codeparrot_training - Step 34650: {'lr': 0.0004423235212041982, 'samples': 17741312, 'steps': 34650, 'loss/train': 1.378540277481079} +03/05/2022 06:11:13 - INFO - codeparrot_training - Skipping example with length 197 (seq_length=1024) +03/05/2022 06:11:17 - INFO - codeparrot_training - Step 34651: {'lr': 0.00044232013070931165, 'samples': 17741824, 'steps': 34651, 'loss/train': 0.6377180814743042} +03/05/2022 06:11:20 - INFO - codeparrot_training - Step 34652: {'lr': 0.00044231674012776864, 'samples': 17742336, 'steps': 34652, 'loss/train': 1.2246763706207275} +03/05/2022 06:11:22 - INFO - codeparrot_training - Skipping example with length 205 (seq_length=1024) +03/05/2022 06:11:25 - INFO - codeparrot_training - Step 34653: {'lr': 0.0004423133494595707, 'samples': 17742848, 'steps': 34653, 'loss/train': 2.167185068130493} +03/05/2022 06:11:28 - INFO - codeparrot_training - Step 34654: {'lr': 0.00044230995870471923, 'samples': 17743360, 'steps': 34654, 'loss/train': 0.6286876201629639} +03/05/2022 06:11:30 - INFO - codeparrot_training - Skipping example with length 901 (seq_length=1024) +03/05/2022 06:11:34 - INFO - codeparrot_training - Step 34655: {'lr': 0.000442306567863216, 'samples': 17743872, 'steps': 34655, 'loss/train': 1.2910902500152588} +03/05/2022 06:11:37 - INFO - codeparrot_training - Step 34656: {'lr': 0.00044230317693506226, 'samples': 17744384, 'steps': 34656, 'loss/train': 1.2925772666931152} +03/05/2022 06:11:39 - INFO - codeparrot_training - Skipping example with length 358 (seq_length=1024) +03/05/2022 06:11:42 - INFO - codeparrot_training - Step 34657: {'lr': 0.00044229978592025975, 'samples': 17744896, 'steps': 34657, 'loss/train': 2.401838779449463} +03/05/2022 06:11:46 - INFO - codeparrot_training - Step 34658: {'lr': 0.00044229639481881, 'samples': 17745408, 'steps': 34658, 'loss/train': 1.6781604290008545} +03/05/2022 06:11:47 - INFO - codeparrot_training - Skipping example with length 453 (seq_length=1024) +03/05/2022 06:11:51 - INFO - codeparrot_training - Step 34659: {'lr': 0.00044229300363071434, 'samples': 17745920, 'steps': 34659, 'loss/train': 1.4354958534240723} +03/05/2022 06:11:54 - INFO - codeparrot_training - Step 34660: {'lr': 0.0004422896123559744, 'samples': 17746432, 'steps': 34660, 'loss/train': 1.2898335456848145} +03/05/2022 06:11:56 - INFO - codeparrot_training - Skipping example with length 283 (seq_length=1024) +03/05/2022 06:11:59 - INFO - codeparrot_training - Step 34661: {'lr': 0.00044228622099459183, 'samples': 17746944, 'steps': 34661, 'loss/train': 2.530094623565674} +03/05/2022 06:12:03 - INFO - codeparrot_training - Step 34662: {'lr': 0.000442282829546568, 'samples': 17747456, 'steps': 34662, 'loss/train': 1.5053707361221313} +03/05/2022 06:12:04 - INFO - codeparrot_training - Skipping example with length 341 (seq_length=1024) +03/05/2022 06:12:08 - INFO - codeparrot_training - Step 34663: {'lr': 0.00044227943801190454, 'samples': 17747968, 'steps': 34663, 'loss/train': 1.0806703567504883} +03/05/2022 06:12:11 - INFO - codeparrot_training - Step 34664: {'lr': 0.0004422760463906029, 'samples': 17748480, 'steps': 34664, 'loss/train': 1.530690312385559} +03/05/2022 06:12:13 - INFO - codeparrot_training - Skipping example with length 11 (seq_length=1024) +03/05/2022 06:12:16 - INFO - codeparrot_training - Step 34665: {'lr': 0.00044227265468266464, 'samples': 17748992, 'steps': 34665, 'loss/train': 1.824294924736023} +03/05/2022 06:12:20 - INFO - codeparrot_training - Step 34666: {'lr': 0.0004422692628880913, 'samples': 17749504, 'steps': 34666, 'loss/train': 1.8913726806640625} +03/05/2022 06:12:21 - INFO - codeparrot_training - Skipping example with length 689 (seq_length=1024) +03/05/2022 06:12:25 - INFO - codeparrot_training - Step 34667: {'lr': 0.00044226587100688436, 'samples': 17750016, 'steps': 34667, 'loss/train': 0.0817064642906189} +03/05/2022 06:12:28 - INFO - codeparrot_training - Step 34668: {'lr': 0.0004422624790390454, 'samples': 17750528, 'steps': 34668, 'loss/train': 1.9480189085006714} +03/05/2022 06:12:29 - INFO - codeparrot_training - Skipping example with length 483 (seq_length=1024) +03/05/2022 06:12:33 - INFO - codeparrot_training - Step 34669: {'lr': 0.000442259086984576, 'samples': 17751040, 'steps': 34669, 'loss/train': 2.4002320766448975} +03/05/2022 06:12:37 - INFO - codeparrot_training - Step 34670: {'lr': 0.00044225569484347753, 'samples': 17751552, 'steps': 34670, 'loss/train': 0.9600015878677368} +03/05/2022 06:12:42 - INFO - codeparrot_training - Step 34671: {'lr': 0.00044225230261575165, 'samples': 17752064, 'steps': 34671, 'loss/train': 1.6734172105789185} +03/05/2022 06:12:45 - INFO - codeparrot_training - Step 34672: {'lr': 0.00044224891030139986, 'samples': 17752576, 'steps': 34672, 'loss/train': 1.072651982307434} +03/05/2022 06:12:50 - INFO - codeparrot_training - Step 34673: {'lr': 0.0004422455179004237, 'samples': 17753088, 'steps': 34673, 'loss/train': 1.556174397468567} +03/05/2022 06:12:53 - INFO - codeparrot_training - Step 34674: {'lr': 0.00044224212541282463, 'samples': 17753600, 'steps': 34674, 'loss/train': 0.7710404992103577} +03/05/2022 06:12:55 - INFO - codeparrot_training - Skipping example with length 169 (seq_length=1024) +03/05/2022 06:12:59 - INFO - codeparrot_training - Step 34675: {'lr': 0.0004422387328386042, 'samples': 17754112, 'steps': 34675, 'loss/train': 1.2669563293457031} +03/05/2022 06:13:02 - INFO - codeparrot_training - Step 34676: {'lr': 0.000442235340177764, 'samples': 17754624, 'steps': 34676, 'loss/train': 2.039918899536133} +03/05/2022 06:13:03 - INFO - codeparrot_training - Skipping example with length 339 (seq_length=1024) +03/05/2022 06:13:07 - INFO - codeparrot_training - Step 34677: {'lr': 0.00044223194743030556, 'samples': 17755136, 'steps': 34677, 'loss/train': 1.0990524291992188} +03/05/2022 06:13:10 - INFO - codeparrot_training - Step 34678: {'lr': 0.00044222855459623034, 'samples': 17755648, 'steps': 34678, 'loss/train': 1.5621976852416992} +03/05/2022 06:13:11 - INFO - codeparrot_training - Skipping example with length 869 (seq_length=1024) +03/05/2022 06:13:15 - INFO - codeparrot_training - Step 34679: {'lr': 0.00044222516167553985, 'samples': 17756160, 'steps': 34679, 'loss/train': 1.59064781665802} +03/05/2022 06:13:19 - INFO - codeparrot_training - Step 34680: {'lr': 0.0004422217686682357, 'samples': 17756672, 'steps': 34680, 'loss/train': 1.2528200149536133} +03/05/2022 06:13:24 - INFO - codeparrot_training - Step 34681: {'lr': 0.00044221837557431945, 'samples': 17757184, 'steps': 34681, 'loss/train': 0.7929532527923584} +03/05/2022 06:13:27 - INFO - codeparrot_training - Step 34682: {'lr': 0.00044221498239379247, 'samples': 17757696, 'steps': 34682, 'loss/train': 1.9037834405899048} +03/05/2022 06:13:28 - INFO - codeparrot_training - Skipping example with length 837 (seq_length=1024) +03/05/2022 06:13:32 - INFO - codeparrot_training - Step 34683: {'lr': 0.0004422115891266565, 'samples': 17758208, 'steps': 34683, 'loss/train': 2.475658416748047} +03/05/2022 06:13:36 - INFO - codeparrot_training - Step 34684: {'lr': 0.00044220819577291283, 'samples': 17758720, 'steps': 34684, 'loss/train': 2.007002115249634} +03/05/2022 06:13:37 - INFO - codeparrot_training - Skipping example with length 680 (seq_length=1024) +03/05/2022 06:13:41 - INFO - codeparrot_training - Step 34685: {'lr': 0.00044220480233256315, 'samples': 17759232, 'steps': 34685, 'loss/train': 1.4666168689727783} +03/05/2022 06:13:44 - INFO - codeparrot_training - Step 34686: {'lr': 0.00044220140880560897, 'samples': 17759744, 'steps': 34686, 'loss/train': 1.1131591796875} +03/05/2022 06:13:45 - INFO - codeparrot_training - Skipping example with length 251 (seq_length=1024) +03/05/2022 06:13:49 - INFO - codeparrot_training - Step 34687: {'lr': 0.0004421980151920518, 'samples': 17760256, 'steps': 34687, 'loss/train': 2.0053248405456543} +03/05/2022 06:13:53 - INFO - codeparrot_training - Step 34688: {'lr': 0.00044219462149189313, 'samples': 17760768, 'steps': 34688, 'loss/train': 1.8689898252487183} +03/05/2022 06:13:53 - INFO - codeparrot_training - Skipping example with length 831 (seq_length=1024) +03/05/2022 06:13:58 - INFO - codeparrot_training - Step 34689: {'lr': 0.0004421912277051346, 'samples': 17761280, 'steps': 34689, 'loss/train': 1.8633910417556763} +03/05/2022 06:14:01 - INFO - codeparrot_training - Step 34690: {'lr': 0.00044218783383177763, 'samples': 17761792, 'steps': 34690, 'loss/train': 1.4913395643234253} +03/05/2022 06:14:02 - INFO - codeparrot_training - Skipping example with length 446 (seq_length=1024) +03/05/2022 06:14:06 - INFO - codeparrot_training - Step 34691: {'lr': 0.00044218443987182384, 'samples': 17762304, 'steps': 34691, 'loss/train': 1.578671932220459} +03/05/2022 06:14:09 - INFO - codeparrot_training - Step 34692: {'lr': 0.0004421810458252746, 'samples': 17762816, 'steps': 34692, 'loss/train': 1.354146122932434} +03/05/2022 06:14:10 - INFO - codeparrot_training - Skipping example with length 966 (seq_length=1024) +03/05/2022 06:14:15 - INFO - codeparrot_training - Step 34693: {'lr': 0.00044217765169213166, 'samples': 17763328, 'steps': 34693, 'loss/train': 1.4421546459197998} +03/05/2022 06:14:18 - INFO - codeparrot_training - Step 34694: {'lr': 0.00044217425747239636, 'samples': 17763840, 'steps': 34694, 'loss/train': 1.170554757118225} +03/05/2022 06:14:18 - INFO - codeparrot_training - Skipping example with length 37 (seq_length=1024) +03/05/2022 06:14:23 - INFO - codeparrot_training - Step 34695: {'lr': 0.00044217086316607033, 'samples': 17764352, 'steps': 34695, 'loss/train': 1.7306098937988281} +03/05/2022 06:14:26 - INFO - codeparrot_training - Step 34696: {'lr': 0.00044216746877315504, 'samples': 17764864, 'steps': 34696, 'loss/train': 1.713168740272522} +03/05/2022 06:14:27 - INFO - codeparrot_training - Skipping example with length 753 (seq_length=1024) +03/05/2022 06:14:32 - INFO - codeparrot_training - Step 34697: {'lr': 0.0004421640742936521, 'samples': 17765376, 'steps': 34697, 'loss/train': 3.4272780418395996} +03/05/2022 06:14:35 - INFO - codeparrot_training - Step 34698: {'lr': 0.000442160679727563, 'samples': 17765888, 'steps': 34698, 'loss/train': 2.222865581512451} +03/05/2022 06:14:35 - INFO - codeparrot_training - Skipping example with length 47 (seq_length=1024) +03/05/2022 06:14:40 - INFO - codeparrot_training - Step 34699: {'lr': 0.0004421572850748893, 'samples': 17766400, 'steps': 34699, 'loss/train': 1.9602172374725342} +03/05/2022 06:14:43 - INFO - codeparrot_training - Step 34700: {'lr': 0.00044215389033563235, 'samples': 17766912, 'steps': 34700, 'loss/train': 1.9322041273117065} +03/05/2022 06:14:45 - INFO - codeparrot_training - Skipping example with length 660 (seq_length=1024) +03/05/2022 06:14:49 - INFO - codeparrot_training - Step 34701: {'lr': 0.00044215049550979394, 'samples': 17767424, 'steps': 34701, 'loss/train': 1.4731426239013672} +03/05/2022 06:14:52 - INFO - codeparrot_training - Step 34702: {'lr': 0.0004421471005973755, 'samples': 17767936, 'steps': 34702, 'loss/train': 1.500730037689209} +03/05/2022 06:14:53 - INFO - codeparrot_training - Skipping example with length 409 (seq_length=1024) +03/05/2022 06:14:57 - INFO - codeparrot_training - Step 34703: {'lr': 0.0004421437055983785, 'samples': 17768448, 'steps': 34703, 'loss/train': 1.727432131767273} +03/05/2022 06:15:00 - INFO - codeparrot_training - Step 34704: {'lr': 0.0004421403105128045, 'samples': 17768960, 'steps': 34704, 'loss/train': 2.3604538440704346} +03/05/2022 06:15:01 - INFO - codeparrot_training - Skipping example with length 59 (seq_length=1024) +03/05/2022 06:15:05 - INFO - codeparrot_training - Step 34705: {'lr': 0.00044213691534065503, 'samples': 17769472, 'steps': 34705, 'loss/train': 1.733148455619812} +03/05/2022 06:15:09 - INFO - codeparrot_training - Step 34706: {'lr': 0.0004421335200819316, 'samples': 17769984, 'steps': 34706, 'loss/train': 2.107748031616211} +03/05/2022 06:15:10 - INFO - codeparrot_training - Skipping example with length 164 (seq_length=1024) +03/05/2022 06:15:14 - INFO - codeparrot_training - Step 34707: {'lr': 0.00044213012473663584, 'samples': 17770496, 'steps': 34707, 'loss/train': 2.013026237487793} +03/05/2022 06:15:17 - INFO - codeparrot_training - Step 34708: {'lr': 0.0004421267293047692, 'samples': 17771008, 'steps': 34708, 'loss/train': 2.3180277347564697} +03/05/2022 06:15:18 - INFO - codeparrot_training - Skipping example with length 13 (seq_length=1024) +03/05/2022 06:15:23 - INFO - codeparrot_training - Step 34709: {'lr': 0.0004421233337863332, 'samples': 17771520, 'steps': 34709, 'loss/train': 1.822326421737671} +03/05/2022 06:15:26 - INFO - codeparrot_training - Step 34710: {'lr': 0.0004421199381813293, 'samples': 17772032, 'steps': 34710, 'loss/train': 1.1826245784759521} +03/05/2022 06:15:27 - INFO - codeparrot_training - Skipping example with length 307 (seq_length=1024) +03/05/2022 06:15:31 - INFO - codeparrot_training - Step 34711: {'lr': 0.0004421165424897593, 'samples': 17772544, 'steps': 34711, 'loss/train': 2.132946491241455} +03/05/2022 06:15:34 - INFO - codeparrot_training - Step 34712: {'lr': 0.00044211314671162446, 'samples': 17773056, 'steps': 34712, 'loss/train': 1.8319579362869263} +03/05/2022 06:15:35 - INFO - codeparrot_training - Skipping example with length 661 (seq_length=1024) +03/05/2022 06:15:39 - INFO - codeparrot_training - Step 34713: {'lr': 0.0004421097508469264, 'samples': 17773568, 'steps': 34713, 'loss/train': 1.5415055751800537} +03/05/2022 06:15:43 - INFO - codeparrot_training - Step 34714: {'lr': 0.0004421063548956666, 'samples': 17774080, 'steps': 34714, 'loss/train': 1.4501134157180786} +03/05/2022 06:15:43 - INFO - codeparrot_training - Skipping example with length 598 (seq_length=1024) +03/05/2022 06:15:48 - INFO - codeparrot_training - Step 34715: {'lr': 0.0004421029588578468, 'samples': 17774592, 'steps': 34715, 'loss/train': 1.2714436054229736} +03/05/2022 06:15:51 - INFO - codeparrot_training - Step 34716: {'lr': 0.00044209956273346816, 'samples': 17775104, 'steps': 34716, 'loss/train': 1.5021438598632812} +03/05/2022 06:15:52 - INFO - codeparrot_training - Skipping example with length 863 (seq_length=1024) +03/05/2022 06:15:56 - INFO - codeparrot_training - Step 34717: {'lr': 0.0004420961665225326, 'samples': 17775616, 'steps': 34717, 'loss/train': 1.8067482709884644} +03/05/2022 06:15:59 - INFO - codeparrot_training - Step 34718: {'lr': 0.0004420927702250414, 'samples': 17776128, 'steps': 34718, 'loss/train': 2.017714738845825} +03/05/2022 06:16:00 - INFO - codeparrot_training - Skipping example with length 702 (seq_length=1024) +03/05/2022 06:16:05 - INFO - codeparrot_training - Step 34719: {'lr': 0.00044208937384099614, 'samples': 17776640, 'steps': 34719, 'loss/train': 1.4139554500579834} +03/05/2022 06:16:08 - INFO - codeparrot_training - Step 34720: {'lr': 0.0004420859773703985, 'samples': 17777152, 'steps': 34720, 'loss/train': 1.0347590446472168} +03/05/2022 06:16:08 - INFO - codeparrot_training - Skipping example with length 314 (seq_length=1024) +03/05/2022 06:16:13 - INFO - codeparrot_training - Step 34721: {'lr': 0.0004420825808132497, 'samples': 17777664, 'steps': 34721, 'loss/train': 0.8553276658058167} +03/05/2022 06:16:16 - INFO - codeparrot_training - Step 34722: {'lr': 0.0004420791841695515, 'samples': 17778176, 'steps': 34722, 'loss/train': 1.979260802268982} +03/05/2022 06:16:18 - INFO - codeparrot_training - Skipping example with length 840 (seq_length=1024) +03/05/2022 06:16:22 - INFO - codeparrot_training - Step 34723: {'lr': 0.00044207578743930544, 'samples': 17778688, 'steps': 34723, 'loss/train': 1.5269734859466553} +03/05/2022 06:16:25 - INFO - codeparrot_training - Step 34724: {'lr': 0.00044207239062251297, 'samples': 17779200, 'steps': 34724, 'loss/train': 1.002009630203247} +03/05/2022 06:16:26 - INFO - codeparrot_training - Skipping example with length 380 (seq_length=1024) +03/05/2022 06:16:30 - INFO - codeparrot_training - Step 34725: {'lr': 0.00044206899371917563, 'samples': 17779712, 'steps': 34725, 'loss/train': 1.8381508588790894} +03/05/2022 06:16:33 - INFO - codeparrot_training - Step 34726: {'lr': 0.00044206559672929505, 'samples': 17780224, 'steps': 34726, 'loss/train': 0.971093475818634} +03/05/2022 06:16:34 - INFO - codeparrot_training - Skipping example with length 27 (seq_length=1024) +03/05/2022 06:16:38 - INFO - codeparrot_training - Step 34727: {'lr': 0.00044206219965287253, 'samples': 17780736, 'steps': 34727, 'loss/train': 1.3300241231918335} +03/05/2022 06:16:42 - INFO - codeparrot_training - Step 34728: {'lr': 0.0004420588024899098, 'samples': 17781248, 'steps': 34728, 'loss/train': 1.9163177013397217} +03/05/2022 06:16:42 - INFO - codeparrot_training - Skipping example with length 821 (seq_length=1024) +03/05/2022 06:16:47 - INFO - codeparrot_training - Step 34729: {'lr': 0.00044205540524040846, 'samples': 17781760, 'steps': 34729, 'loss/train': 2.20051646232605} +03/05/2022 06:16:50 - INFO - codeparrot_training - Step 34730: {'lr': 0.0004420520079043698, 'samples': 17782272, 'steps': 34730, 'loss/train': 1.244758129119873} +03/05/2022 06:16:51 - INFO - codeparrot_training - Skipping example with length 338 (seq_length=1024) +03/05/2022 06:16:55 - INFO - codeparrot_training - Step 34731: {'lr': 0.00044204861048179544, 'samples': 17782784, 'steps': 34731, 'loss/train': 2.03043532371521} +03/05/2022 06:16:58 - INFO - codeparrot_training - Step 34732: {'lr': 0.000442045212972687, 'samples': 17783296, 'steps': 34732, 'loss/train': 2.111168622970581} +03/05/2022 06:16:59 - INFO - codeparrot_training - Skipping example with length 194 (seq_length=1024) +03/05/2022 06:17:04 - INFO - codeparrot_training - Step 34733: {'lr': 0.00044204181537704594, 'samples': 17783808, 'steps': 34733, 'loss/train': 2.1760730743408203} +03/05/2022 06:17:07 - INFO - codeparrot_training - Step 34734: {'lr': 0.0004420384176948738, 'samples': 17784320, 'steps': 34734, 'loss/train': 1.9002472162246704} +03/05/2022 06:17:08 - INFO - codeparrot_training - Skipping example with length 844 (seq_length=1024) +03/05/2022 06:17:12 - INFO - codeparrot_training - Step 34735: {'lr': 0.0004420350199261721, 'samples': 17784832, 'steps': 34735, 'loss/train': 1.3317527770996094} +03/05/2022 06:17:15 - INFO - codeparrot_training - Step 34736: {'lr': 0.0004420316220709424, 'samples': 17785344, 'steps': 34736, 'loss/train': 2.1146278381347656} +03/05/2022 06:17:17 - INFO - codeparrot_training - Skipping example with length 446 (seq_length=1024) +03/05/2022 06:17:21 - INFO - codeparrot_training - Step 34737: {'lr': 0.0004420282241291862, 'samples': 17785856, 'steps': 34737, 'loss/train': 2.235307455062866} +03/05/2022 06:17:24 - INFO - codeparrot_training - Step 34738: {'lr': 0.0004420248261009051, 'samples': 17786368, 'steps': 34738, 'loss/train': 2.1142139434814453} +03/05/2022 06:17:25 - INFO - codeparrot_training - Skipping example with length 440 (seq_length=1024) +03/05/2022 06:17:29 - INFO - codeparrot_training - Step 34739: {'lr': 0.0004420214279861005, 'samples': 17786880, 'steps': 34739, 'loss/train': 1.6127471923828125} +03/05/2022 06:17:32 - INFO - codeparrot_training - Step 34740: {'lr': 0.000442018029784774, 'samples': 17787392, 'steps': 34740, 'loss/train': 1.2814568281173706} +03/05/2022 06:17:33 - INFO - codeparrot_training - Skipping example with length 1003 (seq_length=1024) +03/05/2022 06:17:37 - INFO - codeparrot_training - Step 34741: {'lr': 0.00044201463149692725, 'samples': 17787904, 'steps': 34741, 'loss/train': 2.0485661029815674} +03/05/2022 06:17:41 - INFO - codeparrot_training - Step 34742: {'lr': 0.0004420112331225616, 'samples': 17788416, 'steps': 34742, 'loss/train': 0.7049129009246826} +03/05/2022 06:17:42 - INFO - codeparrot_training - Skipping example with length 324 (seq_length=1024) +03/05/2022 06:17:46 - INFO - codeparrot_training - Step 34743: {'lr': 0.0004420078346616786, 'samples': 17788928, 'steps': 34743, 'loss/train': 2.3652329444885254} +03/05/2022 06:17:49 - INFO - codeparrot_training - Step 34744: {'lr': 0.00044200443611427985, 'samples': 17789440, 'steps': 34744, 'loss/train': 1.6950198411941528} +03/05/2022 06:17:50 - INFO - codeparrot_training - Skipping example with length 629 (seq_length=1024) +03/05/2022 06:17:54 - INFO - codeparrot_training - Step 34745: {'lr': 0.000442001037480367, 'samples': 17789952, 'steps': 34745, 'loss/train': 1.8679709434509277} +03/05/2022 06:17:57 - INFO - codeparrot_training - Step 34746: {'lr': 0.0004419976387599413, 'samples': 17790464, 'steps': 34746, 'loss/train': 2.327646493911743} +03/05/2022 06:17:58 - INFO - codeparrot_training - Skipping example with length 227 (seq_length=1024) +03/05/2022 06:18:03 - INFO - codeparrot_training - Step 34747: {'lr': 0.0004419942399530045, 'samples': 17790976, 'steps': 34747, 'loss/train': 1.438119649887085} +03/05/2022 06:18:06 - INFO - codeparrot_training - Step 34748: {'lr': 0.000441990841059558, 'samples': 17791488, 'steps': 34748, 'loss/train': 1.0234674215316772} +03/05/2022 06:18:06 - INFO - codeparrot_training - Skipping example with length 740 (seq_length=1024) +03/05/2022 06:18:11 - INFO - codeparrot_training - Step 34749: {'lr': 0.0004419874420796034, 'samples': 17792000, 'steps': 34749, 'loss/train': 1.802757978439331} +03/05/2022 06:18:14 - INFO - codeparrot_training - Step 34750: {'lr': 0.00044198404301314223, 'samples': 17792512, 'steps': 34750, 'loss/train': 1.5785678625106812} +03/05/2022 06:18:14 - INFO - codeparrot_training - Skipping example with length 603 (seq_length=1024) +03/05/2022 06:18:19 - INFO - codeparrot_training - Step 34751: {'lr': 0.000441980643860176, 'samples': 17793024, 'steps': 34751, 'loss/train': 0.638883650302887} +03/05/2022 06:18:23 - INFO - codeparrot_training - Step 34752: {'lr': 0.0004419772446207063, 'samples': 17793536, 'steps': 34752, 'loss/train': 2.0817904472351074} +03/05/2022 06:18:23 - INFO - codeparrot_training - Skipping example with length 925 (seq_length=1024) +03/05/2022 06:18:28 - INFO - codeparrot_training - Step 34753: {'lr': 0.0004419738452947346, 'samples': 17794048, 'steps': 34753, 'loss/train': 1.991413950920105} +03/05/2022 06:18:31 - INFO - codeparrot_training - Step 34754: {'lr': 0.00044197044588226245, 'samples': 17794560, 'steps': 34754, 'loss/train': 1.5427950620651245} +03/05/2022 06:18:32 - INFO - codeparrot_training - Skipping example with length 188 (seq_length=1024) +03/05/2022 06:18:36 - INFO - codeparrot_training - Step 34755: {'lr': 0.00044196704638329134, 'samples': 17795072, 'steps': 34755, 'loss/train': 1.6483997106552124} +03/05/2022 06:18:40 - INFO - codeparrot_training - Step 34756: {'lr': 0.00044196364679782284, 'samples': 17795584, 'steps': 34756, 'loss/train': 1.0142407417297363} +03/05/2022 06:18:40 - INFO - codeparrot_training - Skipping example with length 441 (seq_length=1024) +03/05/2022 06:18:45 - INFO - codeparrot_training - Step 34757: {'lr': 0.00044196024712585854, 'samples': 17796096, 'steps': 34757, 'loss/train': 1.6757601499557495} +03/05/2022 06:18:48 - INFO - codeparrot_training - Step 34758: {'lr': 0.0004419568473673999, 'samples': 17796608, 'steps': 34758, 'loss/train': 2.249492645263672} +03/05/2022 06:18:49 - INFO - codeparrot_training - Skipping example with length 733 (seq_length=1024) +03/05/2022 06:18:53 - INFO - codeparrot_training - Step 34759: {'lr': 0.00044195344752244844, 'samples': 17797120, 'steps': 34759, 'loss/train': 2.4136264324188232} +03/05/2022 06:18:57 - INFO - codeparrot_training - Step 34760: {'lr': 0.0004419500475910057, 'samples': 17797632, 'steps': 34760, 'loss/train': 1.2814266681671143} +03/05/2022 06:18:58 - INFO - codeparrot_training - Skipping example with length 470 (seq_length=1024) +03/05/2022 06:19:02 - INFO - codeparrot_training - Step 34761: {'lr': 0.0004419466475730732, 'samples': 17798144, 'steps': 34761, 'loss/train': 1.8868883848190308} +03/05/2022 06:19:05 - INFO - codeparrot_training - Step 34762: {'lr': 0.00044194324746865265, 'samples': 17798656, 'steps': 34762, 'loss/train': 1.704897403717041} +03/05/2022 06:19:06 - INFO - codeparrot_training - Skipping example with length 141 (seq_length=1024) +03/05/2022 06:19:10 - INFO - codeparrot_training - Step 34763: {'lr': 0.00044193984727774533, 'samples': 17799168, 'steps': 34763, 'loss/train': 1.2163739204406738} +03/05/2022 06:19:13 - INFO - codeparrot_training - Step 34764: {'lr': 0.0004419364470003529, 'samples': 17799680, 'steps': 34764, 'loss/train': 1.9033769369125366} +03/05/2022 06:19:14 - INFO - codeparrot_training - Skipping example with length 348 (seq_length=1024) +03/05/2022 06:19:19 - INFO - codeparrot_training - Step 34765: {'lr': 0.00044193304663647684, 'samples': 17800192, 'steps': 34765, 'loss/train': 1.9086840152740479} +03/05/2022 06:19:22 - INFO - codeparrot_training - Step 34766: {'lr': 0.00044192964618611875, 'samples': 17800704, 'steps': 34766, 'loss/train': 2.563309907913208} +03/05/2022 06:19:22 - INFO - codeparrot_training - Skipping example with length 165 (seq_length=1024) +03/05/2022 06:19:27 - INFO - codeparrot_training - Step 34767: {'lr': 0.0004419262456492801, 'samples': 17801216, 'steps': 34767, 'loss/train': 1.6083649396896362} +03/05/2022 06:19:31 - INFO - codeparrot_training - Step 34768: {'lr': 0.0004419228450259625, 'samples': 17801728, 'steps': 34768, 'loss/train': 0.8915947675704956} +03/05/2022 06:19:32 - INFO - codeparrot_training - Skipping example with length 618 (seq_length=1024) +03/05/2022 06:19:36 - INFO - codeparrot_training - Step 34769: {'lr': 0.00044191944431616734, 'samples': 17802240, 'steps': 34769, 'loss/train': 1.388028860092163} +03/05/2022 06:19:39 - INFO - codeparrot_training - Step 34770: {'lr': 0.0004419160435198963, 'samples': 17802752, 'steps': 34770, 'loss/train': 1.617478370666504} +03/05/2022 06:19:40 - INFO - codeparrot_training - Skipping example with length 942 (seq_length=1024) +03/05/2022 06:19:45 - INFO - codeparrot_training - Step 34771: {'lr': 0.00044191264263715083, 'samples': 17803264, 'steps': 34771, 'loss/train': 1.431685209274292} +03/05/2022 06:19:48 - INFO - codeparrot_training - Step 34772: {'lr': 0.00044190924166793245, 'samples': 17803776, 'steps': 34772, 'loss/train': 1.5003126859664917} +03/05/2022 06:19:49 - INFO - codeparrot_training - Skipping example with length 647 (seq_length=1024) +03/05/2022 06:19:53 - INFO - codeparrot_training - Step 34773: {'lr': 0.00044190584061224277, 'samples': 17804288, 'steps': 34773, 'loss/train': 6.4721550941467285} +03/05/2022 06:19:56 - INFO - codeparrot_training - Step 34774: {'lr': 0.0004419024394700833, 'samples': 17804800, 'steps': 34774, 'loss/train': 1.7067549228668213} +03/05/2022 06:19:59 - INFO - codeparrot_training - Skipping example with length 714 (seq_length=1024) +03/05/2022 06:20:01 - INFO - codeparrot_training - Step 34775: {'lr': 0.0004418990382414555, 'samples': 17805312, 'steps': 34775, 'loss/train': 2.051708698272705} +03/05/2022 06:20:05 - INFO - codeparrot_training - Step 34776: {'lr': 0.000441895636926361, 'samples': 17805824, 'steps': 34776, 'loss/train': 1.4361144304275513} +03/05/2022 06:20:07 - INFO - codeparrot_training - Skipping example with length 265 (seq_length=1024) +03/05/2022 06:20:10 - INFO - codeparrot_training - Step 34777: {'lr': 0.0004418922355248013, 'samples': 17806336, 'steps': 34777, 'loss/train': 1.7085236310958862} +03/05/2022 06:20:13 - INFO - codeparrot_training - Step 34778: {'lr': 0.00044188883403677783, 'samples': 17806848, 'steps': 34778, 'loss/train': 2.1923513412475586} +03/05/2022 06:20:15 - INFO - codeparrot_training - Skipping example with length 226 (seq_length=1024) +03/05/2022 06:20:18 - INFO - codeparrot_training - Step 34779: {'lr': 0.0004418854324622923, 'samples': 17807360, 'steps': 34779, 'loss/train': 1.9976255893707275} +03/05/2022 06:20:21 - INFO - codeparrot_training - Step 34780: {'lr': 0.0004418820308013461, 'samples': 17807872, 'steps': 34780, 'loss/train': 2.2966229915618896} +03/05/2022 06:20:23 - INFO - codeparrot_training - Skipping example with length 563 (seq_length=1024) +03/05/2022 06:20:27 - INFO - codeparrot_training - Step 34781: {'lr': 0.0004418786290539408, 'samples': 17808384, 'steps': 34781, 'loss/train': 0.49917879700660706} +03/05/2022 06:20:30 - INFO - codeparrot_training - Step 34782: {'lr': 0.000441875227220078, 'samples': 17808896, 'steps': 34782, 'loss/train': 1.8395239114761353} +03/05/2022 06:20:32 - INFO - codeparrot_training - Skipping example with length 1020 (seq_length=1024) +03/05/2022 06:20:35 - INFO - codeparrot_training - Step 34783: {'lr': 0.00044187182529975924, 'samples': 17809408, 'steps': 34783, 'loss/train': 1.547330617904663} +03/05/2022 06:20:39 - INFO - codeparrot_training - Step 34784: {'lr': 0.00044186842329298594, 'samples': 17809920, 'steps': 34784, 'loss/train': 2.057607412338257} +03/05/2022 06:20:41 - INFO - codeparrot_training - Skipping example with length 559 (seq_length=1024) +03/05/2022 06:20:44 - INFO - codeparrot_training - Step 34785: {'lr': 0.0004418650211997596, 'samples': 17810432, 'steps': 34785, 'loss/train': 2.403320550918579} +03/05/2022 06:20:47 - INFO - codeparrot_training - Step 34786: {'lr': 0.00044186161902008193, 'samples': 17810944, 'steps': 34786, 'loss/train': 1.6032514572143555} +03/05/2022 06:20:49 - INFO - codeparrot_training - Skipping example with length 816 (seq_length=1024) +03/05/2022 06:20:52 - INFO - codeparrot_training - Step 34787: {'lr': 0.0004418582167539544, 'samples': 17811456, 'steps': 34787, 'loss/train': 2.04004168510437} +03/05/2022 06:20:55 - INFO - codeparrot_training - Step 34788: {'lr': 0.00044185481440137846, 'samples': 17811968, 'steps': 34788, 'loss/train': 1.5111654996871948} +03/05/2022 06:20:58 - INFO - codeparrot_training - Skipping example with length 177 (seq_length=1024) +03/05/2022 06:21:01 - INFO - codeparrot_training - Step 34789: {'lr': 0.0004418514119623557, 'samples': 17812480, 'steps': 34789, 'loss/train': 1.140149712562561} +03/05/2022 06:21:04 - INFO - codeparrot_training - Step 34790: {'lr': 0.00044184800943688774, 'samples': 17812992, 'steps': 34790, 'loss/train': 3.132916212081909} +03/05/2022 06:21:06 - INFO - codeparrot_training - Skipping example with length 289 (seq_length=1024) +03/05/2022 06:21:09 - INFO - codeparrot_training - Step 34791: {'lr': 0.00044184460682497595, 'samples': 17813504, 'steps': 34791, 'loss/train': 2.01381778717041} +03/05/2022 06:21:12 - INFO - codeparrot_training - Step 34792: {'lr': 0.00044184120412662196, 'samples': 17814016, 'steps': 34792, 'loss/train': 2.316624402999878} +03/05/2022 06:21:15 - INFO - codeparrot_training - Skipping example with length 636 (seq_length=1024) +03/05/2022 06:21:18 - INFO - codeparrot_training - Step 34793: {'lr': 0.00044183780134182725, 'samples': 17814528, 'steps': 34793, 'loss/train': 1.9853283166885376} +03/05/2022 06:21:21 - INFO - codeparrot_training - Step 34794: {'lr': 0.0004418343984705935, 'samples': 17815040, 'steps': 34794, 'loss/train': 1.3579590320587158} +03/05/2022 06:21:23 - INFO - codeparrot_training - Skipping example with length 490 (seq_length=1024) +03/05/2022 06:21:26 - INFO - codeparrot_training - Step 34795: {'lr': 0.000441830995512922, 'samples': 17815552, 'steps': 34795, 'loss/train': 2.7011172771453857} +03/05/2022 06:21:29 - INFO - codeparrot_training - Step 34796: {'lr': 0.00044182759246881446, 'samples': 17816064, 'steps': 34796, 'loss/train': 0.963615894317627} +03/05/2022 06:21:31 - INFO - codeparrot_training - Skipping example with length 31 (seq_length=1024) +03/05/2022 06:21:34 - INFO - codeparrot_training - Step 34797: {'lr': 0.0004418241893382724, 'samples': 17816576, 'steps': 34797, 'loss/train': 1.7839312553405762} +03/05/2022 06:21:38 - INFO - codeparrot_training - Step 34798: {'lr': 0.0004418207861212973, 'samples': 17817088, 'steps': 34798, 'loss/train': 2.1674461364746094} +03/05/2022 06:21:39 - INFO - codeparrot_training - Skipping example with length 822 (seq_length=1024) +03/05/2022 06:21:43 - INFO - codeparrot_training - Step 34799: {'lr': 0.0004418173828178906, 'samples': 17817600, 'steps': 34799, 'loss/train': 1.9776021242141724} +03/05/2022 06:21:46 - INFO - codeparrot_training - Step 34800: {'lr': 0.0004418139794280541, 'samples': 17818112, 'steps': 34800, 'loss/train': 1.7851351499557495} +03/05/2022 06:21:48 - INFO - codeparrot_training - Skipping example with length 805 (seq_length=1024) +03/05/2022 06:21:51 - INFO - codeparrot_training - Step 34801: {'lr': 0.0004418105759517892, 'samples': 17818624, 'steps': 34801, 'loss/train': 1.4928101301193237} +03/05/2022 06:21:55 - INFO - codeparrot_training - Step 34802: {'lr': 0.0004418071723890973, 'samples': 17819136, 'steps': 34802, 'loss/train': 1.4727814197540283} +03/05/2022 06:21:57 - INFO - codeparrot_training - Skipping example with length 810 (seq_length=1024) +03/05/2022 06:22:00 - INFO - codeparrot_training - Step 34803: {'lr': 0.0004418037687399801, 'samples': 17819648, 'steps': 34803, 'loss/train': 1.5155882835388184} +03/05/2022 06:22:03 - INFO - codeparrot_training - Step 34804: {'lr': 0.0004418003650044391, 'samples': 17820160, 'steps': 34804, 'loss/train': 0.5956745743751526} +03/05/2022 06:22:05 - INFO - codeparrot_training - Skipping example with length 927 (seq_length=1024) +03/05/2022 06:22:08 - INFO - codeparrot_training - Step 34805: {'lr': 0.0004417969611824758, 'samples': 17820672, 'steps': 34805, 'loss/train': 0.6937854290008545} +03/05/2022 06:22:11 - INFO - codeparrot_training - Step 34806: {'lr': 0.00044179355727409173, 'samples': 17821184, 'steps': 34806, 'loss/train': 1.4317811727523804} +03/05/2022 06:22:13 - INFO - codeparrot_training - Skipping example with length 537 (seq_length=1024) +03/05/2022 06:22:17 - INFO - codeparrot_training - Step 34807: {'lr': 0.00044179015327928847, 'samples': 17821696, 'steps': 34807, 'loss/train': 1.8110909461975098} +03/05/2022 06:22:20 - INFO - codeparrot_training - Step 34808: {'lr': 0.0004417867491980675, 'samples': 17822208, 'steps': 34808, 'loss/train': 1.2459276914596558} +03/05/2022 06:22:21 - INFO - codeparrot_training - Skipping example with length 451 (seq_length=1024) +03/05/2022 06:22:25 - INFO - codeparrot_training - Step 34809: {'lr': 0.0004417833450304304, 'samples': 17822720, 'steps': 34809, 'loss/train': 1.4649474620819092} +03/05/2022 06:22:28 - INFO - codeparrot_training - Step 34810: {'lr': 0.0004417799407763786, 'samples': 17823232, 'steps': 34810, 'loss/train': 1.9763818979263306} +03/05/2022 06:22:30 - INFO - codeparrot_training - Skipping example with length 87 (seq_length=1024) +03/05/2022 06:22:33 - INFO - codeparrot_training - Step 34811: {'lr': 0.00044177653643591387, 'samples': 17823744, 'steps': 34811, 'loss/train': 2.1348869800567627} +03/05/2022 06:22:37 - INFO - codeparrot_training - Step 34812: {'lr': 0.00044177313200903745, 'samples': 17824256, 'steps': 34812, 'loss/train': 1.6223477125167847} +03/05/2022 06:22:38 - INFO - codeparrot_training - Skipping example with length 1017 (seq_length=1024) +03/05/2022 06:22:42 - INFO - codeparrot_training - Step 34813: {'lr': 0.0004417697274957511, 'samples': 17824768, 'steps': 34813, 'loss/train': 1.8909236192703247} +03/05/2022 06:22:45 - INFO - codeparrot_training - Step 34814: {'lr': 0.0004417663228960562, 'samples': 17825280, 'steps': 34814, 'loss/train': 1.661768913269043} +03/05/2022 06:22:46 - INFO - codeparrot_training - Skipping example with length 616 (seq_length=1024) +03/05/2022 06:22:50 - INFO - codeparrot_training - Step 34815: {'lr': 0.0004417629182099545, 'samples': 17825792, 'steps': 34815, 'loss/train': 0.7484272122383118} +03/05/2022 06:22:53 - INFO - codeparrot_training - Step 34816: {'lr': 0.00044175951343744725, 'samples': 17826304, 'steps': 34816, 'loss/train': 2.1084091663360596} +03/05/2022 06:22:55 - INFO - codeparrot_training - Skipping example with length 57 (seq_length=1024) +03/05/2022 06:22:59 - INFO - codeparrot_training - Step 34817: {'lr': 0.0004417561085785362, 'samples': 17826816, 'steps': 34817, 'loss/train': 1.6282190084457397} +03/05/2022 06:23:02 - INFO - codeparrot_training - Step 34818: {'lr': 0.0004417527036332227, 'samples': 17827328, 'steps': 34818, 'loss/train': 1.4261828660964966} +03/05/2022 06:23:04 - INFO - codeparrot_training - Skipping example with length 943 (seq_length=1024) +03/05/2022 06:23:07 - INFO - codeparrot_training - Step 34819: {'lr': 0.0004417492986015085, 'samples': 17827840, 'steps': 34819, 'loss/train': 1.8855311870574951} +03/05/2022 06:23:10 - INFO - codeparrot_training - Step 34820: {'lr': 0.000441745893483395, 'samples': 17828352, 'steps': 34820, 'loss/train': 1.7528315782546997} +03/05/2022 06:23:12 - INFO - codeparrot_training - Skipping example with length 38 (seq_length=1024) +03/05/2022 06:23:16 - INFO - codeparrot_training - Step 34821: {'lr': 0.00044174248827888376, 'samples': 17828864, 'steps': 34821, 'loss/train': 2.0814781188964844} +03/05/2022 06:23:19 - INFO - codeparrot_training - Step 34822: {'lr': 0.00044173908298797627, 'samples': 17829376, 'steps': 34822, 'loss/train': 1.948156476020813} +03/05/2022 06:23:21 - INFO - codeparrot_training - Skipping example with length 522 (seq_length=1024) +03/05/2022 06:23:24 - INFO - codeparrot_training - Step 34823: {'lr': 0.0004417356776106741, 'samples': 17829888, 'steps': 34823, 'loss/train': 2.0892181396484375} +03/05/2022 06:23:27 - INFO - codeparrot_training - Step 34824: {'lr': 0.00044173227214697885, 'samples': 17830400, 'steps': 34824, 'loss/train': 2.120286703109741} +03/05/2022 06:23:30 - INFO - codeparrot_training - Skipping example with length 996 (seq_length=1024) +03/05/2022 06:23:32 - INFO - codeparrot_training - Step 34825: {'lr': 0.000441728866596892, 'samples': 17830912, 'steps': 34825, 'loss/train': 1.2275387048721313} +03/05/2022 06:23:36 - INFO - codeparrot_training - Step 34826: {'lr': 0.00044172546096041504, 'samples': 17831424, 'steps': 34826, 'loss/train': 1.0015193223953247} +03/05/2022 06:23:38 - INFO - codeparrot_training - Skipping example with length 475 (seq_length=1024) +03/05/2022 06:23:41 - INFO - codeparrot_training - Step 34827: {'lr': 0.0004417220552375496, 'samples': 17831936, 'steps': 34827, 'loss/train': 0.7252134680747986} +03/05/2022 06:23:44 - INFO - codeparrot_training - Step 34828: {'lr': 0.00044171864942829707, 'samples': 17832448, 'steps': 34828, 'loss/train': 1.033115267753601} +03/05/2022 06:23:46 - INFO - codeparrot_training - Skipping example with length 286 (seq_length=1024) +03/05/2022 06:23:49 - INFO - codeparrot_training - Step 34829: {'lr': 0.0004417152435326591, 'samples': 17832960, 'steps': 34829, 'loss/train': 1.0243782997131348} +03/05/2022 06:23:53 - INFO - codeparrot_training - Step 34830: {'lr': 0.00044171183755063726, 'samples': 17833472, 'steps': 34830, 'loss/train': 2.412767171859741} +03/05/2022 06:23:55 - INFO - codeparrot_training - Skipping example with length 652 (seq_length=1024) +03/05/2022 06:23:58 - INFO - codeparrot_training - Step 34831: {'lr': 0.00044170843148223305, 'samples': 17833984, 'steps': 34831, 'loss/train': 2.0161173343658447} +03/05/2022 06:24:01 - INFO - codeparrot_training - Step 34832: {'lr': 0.0004417050253274479, 'samples': 17834496, 'steps': 34832, 'loss/train': 1.3677895069122314} +03/05/2022 06:24:03 - INFO - codeparrot_training - Skipping example with length 967 (seq_length=1024) +03/05/2022 06:24:06 - INFO - codeparrot_training - Step 34833: {'lr': 0.00044170161908628345, 'samples': 17835008, 'steps': 34833, 'loss/train': 2.1176159381866455} +03/05/2022 06:24:09 - INFO - codeparrot_training - Step 34834: {'lr': 0.0004416982127587412, 'samples': 17835520, 'steps': 34834, 'loss/train': 2.0389223098754883} +03/05/2022 06:24:11 - INFO - codeparrot_training - Skipping example with length 532 (seq_length=1024) +03/05/2022 06:24:15 - INFO - codeparrot_training - Step 34835: {'lr': 0.00044169480634482274, 'samples': 17836032, 'steps': 34835, 'loss/train': 1.626057744026184} +03/05/2022 06:24:18 - INFO - codeparrot_training - Step 34836: {'lr': 0.0004416913998445294, 'samples': 17836544, 'steps': 34836, 'loss/train': 1.3532754182815552} +03/05/2022 06:24:20 - INFO - codeparrot_training - Skipping example with length 774 (seq_length=1024) +03/05/2022 06:24:23 - INFO - codeparrot_training - Step 34837: {'lr': 0.000441687993257863, 'samples': 17837056, 'steps': 34837, 'loss/train': 1.734352469444275} +03/05/2022 06:24:27 - INFO - codeparrot_training - Step 34838: {'lr': 0.000441684586584825, 'samples': 17837568, 'steps': 34838, 'loss/train': 1.7379499673843384} +03/05/2022 06:24:28 - INFO - codeparrot_training - Skipping example with length 290 (seq_length=1024) +03/05/2022 06:24:32 - INFO - codeparrot_training - Step 34839: {'lr': 0.0004416811798254168, 'samples': 17838080, 'steps': 34839, 'loss/train': 1.6498956680297852} +03/05/2022 06:24:35 - INFO - codeparrot_training - Step 34840: {'lr': 0.00044167777297964006, 'samples': 17838592, 'steps': 34840, 'loss/train': 2.126178026199341} +03/05/2022 06:24:37 - INFO - codeparrot_training - Skipping example with length 808 (seq_length=1024) +03/05/2022 06:24:40 - INFO - codeparrot_training - Step 34841: {'lr': 0.0004416743660474962, 'samples': 17839104, 'steps': 34841, 'loss/train': 2.112391948699951} +03/05/2022 06:24:44 - INFO - codeparrot_training - Step 34842: {'lr': 0.0004416709590289869, 'samples': 17839616, 'steps': 34842, 'loss/train': 1.608580231666565} +03/05/2022 06:24:46 - INFO - codeparrot_training - Skipping example with length 810 (seq_length=1024) +03/05/2022 06:24:49 - INFO - codeparrot_training - Step 34843: {'lr': 0.00044166755192411364, 'samples': 17840128, 'steps': 34843, 'loss/train': 1.6516684293746948} +03/05/2022 06:24:52 - INFO - codeparrot_training - Step 34844: {'lr': 0.00044166414473287784, 'samples': 17840640, 'steps': 34844, 'loss/train': 1.9520206451416016} +03/05/2022 06:24:54 - INFO - codeparrot_training - Skipping example with length 44 (seq_length=1024) +03/05/2022 06:24:57 - INFO - codeparrot_training - Step 34845: {'lr': 0.0004416607374552812, 'samples': 17841152, 'steps': 34845, 'loss/train': 0.8440061807632446} +03/05/2022 06:25:01 - INFO - codeparrot_training - Step 34846: {'lr': 0.00044165733009132524, 'samples': 17841664, 'steps': 34846, 'loss/train': 0.5976382493972778} +03/05/2022 06:25:03 - INFO - codeparrot_training - Skipping example with length 241 (seq_length=1024) +03/05/2022 06:25:06 - INFO - codeparrot_training - Step 34847: {'lr': 0.00044165392264101136, 'samples': 17842176, 'steps': 34847, 'loss/train': 1.5502822399139404} +03/05/2022 06:25:09 - INFO - codeparrot_training - Step 34848: {'lr': 0.0004416505151043412, 'samples': 17842688, 'steps': 34848, 'loss/train': 1.9006861448287964} +03/05/2022 06:25:11 - INFO - codeparrot_training - Skipping example with length 985 (seq_length=1024) +03/05/2022 06:25:14 - INFO - codeparrot_training - Step 34849: {'lr': 0.0004416471074813163, 'samples': 17843200, 'steps': 34849, 'loss/train': 1.16095769405365} +03/05/2022 06:25:17 - INFO - codeparrot_training - Step 34850: {'lr': 0.0004416436997719382, 'samples': 17843712, 'steps': 34850, 'loss/train': 0.833154559135437} +03/05/2022 06:25:19 - INFO - codeparrot_training - Skipping example with length 1001 (seq_length=1024) +03/05/2022 06:25:22 - INFO - codeparrot_training - Step 34851: {'lr': 0.0004416402919762084, 'samples': 17844224, 'steps': 34851, 'loss/train': 2.4870381355285645} +03/05/2022 06:25:26 - INFO - codeparrot_training - Step 34852: {'lr': 0.00044163688409412833, 'samples': 17844736, 'steps': 34852, 'loss/train': 2.227492570877075} +03/05/2022 06:25:27 - INFO - codeparrot_training - Skipping example with length 432 (seq_length=1024) +03/05/2022 06:25:31 - INFO - codeparrot_training - Step 34853: {'lr': 0.0004416334761256997, 'samples': 17845248, 'steps': 34853, 'loss/train': 1.3923370838165283} +03/05/2022 06:25:34 - INFO - codeparrot_training - Step 34854: {'lr': 0.000441630068070924, 'samples': 17845760, 'steps': 34854, 'loss/train': 0.9838761687278748} +03/05/2022 06:25:37 - INFO - codeparrot_training - Step 34855: {'lr': 0.0004416266599298028, 'samples': 17846272, 'steps': 34855, 'loss/train': 1.393255591392517} +03/05/2022 06:25:37 - INFO - codeparrot_training - Skipping example with length 236 (seq_length=1024) +03/05/2022 06:25:43 - INFO - codeparrot_training - Step 34856: {'lr': 0.00044162325170233745, 'samples': 17846784, 'steps': 34856, 'loss/train': 1.5085633993148804} +03/05/2022 06:25:46 - INFO - codeparrot_training - Step 34857: {'lr': 0.00044161984338852967, 'samples': 17847296, 'steps': 34857, 'loss/train': 1.5105082988739014} +03/05/2022 06:25:47 - INFO - codeparrot_training - Skipping example with length 599 (seq_length=1024) +03/05/2022 06:25:52 - INFO - codeparrot_training - Step 34858: {'lr': 0.000441616434988381, 'samples': 17847808, 'steps': 34858, 'loss/train': 1.9892284870147705} +03/05/2022 06:25:55 - INFO - codeparrot_training - Step 34859: {'lr': 0.00044161302650189295, 'samples': 17848320, 'steps': 34859, 'loss/train': 1.1708277463912964} +03/05/2022 06:25:56 - INFO - codeparrot_training - Skipping example with length 638 (seq_length=1024) +03/05/2022 06:26:00 - INFO - codeparrot_training - Step 34860: {'lr': 0.00044160961792906694, 'samples': 17848832, 'steps': 34860, 'loss/train': 0.7018491625785828} +03/05/2022 06:26:03 - INFO - codeparrot_training - Step 34861: {'lr': 0.00044160620926990456, 'samples': 17849344, 'steps': 34861, 'loss/train': 2.1297495365142822} +03/05/2022 06:26:04 - INFO - codeparrot_training - Skipping example with length 803 (seq_length=1024) +03/05/2022 06:26:09 - INFO - codeparrot_training - Step 34862: {'lr': 0.0004416028005244075, 'samples': 17849856, 'steps': 34862, 'loss/train': 2.461374282836914} +03/05/2022 06:26:12 - INFO - codeparrot_training - Step 34863: {'lr': 0.0004415993916925771, 'samples': 17850368, 'steps': 34863, 'loss/train': 1.8185118436813354} +03/05/2022 06:26:13 - INFO - codeparrot_training - Skipping example with length 172 (seq_length=1024) +03/05/2022 06:26:17 - INFO - codeparrot_training - Step 34864: {'lr': 0.000441595982774415, 'samples': 17850880, 'steps': 34864, 'loss/train': 1.9066054821014404} +03/05/2022 06:26:20 - INFO - codeparrot_training - Step 34865: {'lr': 0.00044159257376992267, 'samples': 17851392, 'steps': 34865, 'loss/train': 0.8716073632240295} +03/05/2022 06:26:21 - INFO - codeparrot_training - Skipping example with length 880 (seq_length=1024) +03/05/2022 06:26:25 - INFO - codeparrot_training - Step 34866: {'lr': 0.0004415891646791017, 'samples': 17851904, 'steps': 34866, 'loss/train': 2.6436846256256104} +03/05/2022 06:26:29 - INFO - codeparrot_training - Step 34867: {'lr': 0.0004415857555019536, 'samples': 17852416, 'steps': 34867, 'loss/train': 1.5450636148452759} +03/05/2022 06:26:30 - INFO - codeparrot_training - Skipping example with length 927 (seq_length=1024) +03/05/2022 06:26:34 - INFO - codeparrot_training - Step 34868: {'lr': 0.00044158234623847993, 'samples': 17852928, 'steps': 34868, 'loss/train': 0.5596045851707458} +03/05/2022 06:26:37 - INFO - codeparrot_training - Step 34869: {'lr': 0.00044157893688868223, 'samples': 17853440, 'steps': 34869, 'loss/train': 1.8349541425704956} +03/05/2022 06:26:38 - INFO - codeparrot_training - Skipping example with length 534 (seq_length=1024) +03/05/2022 06:26:42 - INFO - codeparrot_training - Step 34870: {'lr': 0.00044157552745256203, 'samples': 17853952, 'steps': 34870, 'loss/train': 1.8813645839691162} +03/05/2022 06:26:46 - INFO - codeparrot_training - Step 34871: {'lr': 0.0004415721179301208, 'samples': 17854464, 'steps': 34871, 'loss/train': 2.0009145736694336} +03/05/2022 06:26:47 - INFO - codeparrot_training - Skipping example with length 224 (seq_length=1024) +03/05/2022 06:26:51 - INFO - codeparrot_training - Step 34872: {'lr': 0.00044156870832136015, 'samples': 17854976, 'steps': 34872, 'loss/train': 1.7372632026672363} +03/05/2022 06:26:54 - INFO - codeparrot_training - Step 34873: {'lr': 0.00044156529862628157, 'samples': 17855488, 'steps': 34873, 'loss/train': 2.6415295600891113} +03/05/2022 06:26:55 - INFO - codeparrot_training - Skipping example with length 238 (seq_length=1024) +03/05/2022 06:26:59 - INFO - codeparrot_training - Step 34874: {'lr': 0.00044156188884488667, 'samples': 17856000, 'steps': 34874, 'loss/train': 1.8939578533172607} +03/05/2022 06:27:02 - INFO - codeparrot_training - Step 34875: {'lr': 0.0004415584789771769, 'samples': 17856512, 'steps': 34875, 'loss/train': 2.014019012451172} +03/05/2022 06:27:03 - INFO - codeparrot_training - Skipping example with length 490 (seq_length=1024) +03/05/2022 06:27:08 - INFO - codeparrot_training - Step 34876: {'lr': 0.0004415550690231539, 'samples': 17857024, 'steps': 34876, 'loss/train': 1.6249971389770508} +03/05/2022 06:27:11 - INFO - codeparrot_training - Step 34877: {'lr': 0.0004415516589828191, 'samples': 17857536, 'steps': 34877, 'loss/train': 1.6736602783203125} +03/05/2022 06:27:12 - INFO - codeparrot_training - Skipping example with length 612 (seq_length=1024) +03/05/2022 06:27:16 - INFO - codeparrot_training - Step 34878: {'lr': 0.00044154824885617405, 'samples': 17858048, 'steps': 34878, 'loss/train': 1.391919732093811} +03/05/2022 06:27:19 - INFO - codeparrot_training - Step 34879: {'lr': 0.0004415448386432204, 'samples': 17858560, 'steps': 34879, 'loss/train': 1.7402628660202026} +03/05/2022 06:27:20 - INFO - codeparrot_training - Skipping example with length 1008 (seq_length=1024) +03/05/2022 06:27:24 - INFO - codeparrot_training - Step 34880: {'lr': 0.00044154142834395947, 'samples': 17859072, 'steps': 34880, 'loss/train': 1.3522852659225464} +03/05/2022 06:27:28 - INFO - codeparrot_training - Step 34881: {'lr': 0.00044153801795839296, 'samples': 17859584, 'steps': 34881, 'loss/train': 1.4678255319595337} +03/05/2022 06:27:29 - INFO - codeparrot_training - Skipping example with length 148 (seq_length=1024) +03/05/2022 06:27:33 - INFO - codeparrot_training - Step 34882: {'lr': 0.00044153460748652245, 'samples': 17860096, 'steps': 34882, 'loss/train': 2.2553961277008057} +03/05/2022 06:27:36 - INFO - codeparrot_training - Step 34883: {'lr': 0.00044153119692834944, 'samples': 17860608, 'steps': 34883, 'loss/train': 1.4326810836791992} +03/05/2022 06:27:37 - INFO - codeparrot_training - Skipping example with length 374 (seq_length=1024) +03/05/2022 06:27:41 - INFO - codeparrot_training - Step 34884: {'lr': 0.0004415277862838753, 'samples': 17861120, 'steps': 34884, 'loss/train': 1.4568833112716675} +03/05/2022 06:27:44 - INFO - codeparrot_training - Step 34885: {'lr': 0.00044152437555310174, 'samples': 17861632, 'steps': 34885, 'loss/train': 1.6534831523895264} +03/05/2022 06:27:45 - INFO - codeparrot_training - Skipping example with length 44 (seq_length=1024) +03/05/2022 06:27:50 - INFO - codeparrot_training - Step 34886: {'lr': 0.00044152096473603025, 'samples': 17862144, 'steps': 34886, 'loss/train': 2.23323655128479} +03/05/2022 06:27:53 - INFO - codeparrot_training - Step 34887: {'lr': 0.00044151755383266234, 'samples': 17862656, 'steps': 34887, 'loss/train': 1.913790225982666} +03/05/2022 06:27:53 - INFO - codeparrot_training - Skipping example with length 458 (seq_length=1024) +03/05/2022 06:27:58 - INFO - codeparrot_training - Step 34888: {'lr': 0.0004415141428429997, 'samples': 17863168, 'steps': 34888, 'loss/train': 1.3857903480529785} +03/05/2022 06:28:01 - INFO - codeparrot_training - Step 34889: {'lr': 0.0004415107317670436, 'samples': 17863680, 'steps': 34889, 'loss/train': 2.1948859691619873} +03/05/2022 06:28:02 - INFO - codeparrot_training - Skipping example with length 33 (seq_length=1024) +03/05/2022 06:28:07 - INFO - codeparrot_training - Step 34890: {'lr': 0.0004415073206047958, 'samples': 17864192, 'steps': 34890, 'loss/train': 0.27649974822998047} +03/05/2022 06:28:10 - INFO - codeparrot_training - Step 34891: {'lr': 0.0004415039093562577, 'samples': 17864704, 'steps': 34891, 'loss/train': 1.521222710609436} +03/05/2022 06:28:11 - INFO - codeparrot_training - Skipping example with length 966 (seq_length=1024) +03/05/2022 06:28:15 - INFO - codeparrot_training - Step 34892: {'lr': 0.00044150049802143095, 'samples': 17865216, 'steps': 34892, 'loss/train': 2.058128833770752} +03/05/2022 06:28:18 - INFO - codeparrot_training - Step 34893: {'lr': 0.00044149708660031704, 'samples': 17865728, 'steps': 34893, 'loss/train': 1.9542064666748047} +03/05/2022 06:28:20 - INFO - codeparrot_training - Skipping example with length 968 (seq_length=1024) +03/05/2022 06:28:24 - INFO - codeparrot_training - Step 34894: {'lr': 0.0004414936750929174, 'samples': 17866240, 'steps': 34894, 'loss/train': 2.216167449951172} +03/05/2022 06:28:27 - INFO - codeparrot_training - Step 34895: {'lr': 0.0004414902634992338, 'samples': 17866752, 'steps': 34895, 'loss/train': 1.5830042362213135} +03/05/2022 06:28:28 - INFO - codeparrot_training - Skipping example with length 133 (seq_length=1024) +03/05/2022 06:28:32 - INFO - codeparrot_training - Step 34896: {'lr': 0.0004414868518192675, 'samples': 17867264, 'steps': 34896, 'loss/train': 1.9079699516296387} +03/05/2022 06:28:35 - INFO - codeparrot_training - Step 34897: {'lr': 0.0004414834400530203, 'samples': 17867776, 'steps': 34897, 'loss/train': 1.9057271480560303} +03/05/2022 06:28:36 - INFO - codeparrot_training - Skipping example with length 879 (seq_length=1024) +03/05/2022 06:28:40 - INFO - codeparrot_training - Step 34898: {'lr': 0.00044148002820049354, 'samples': 17868288, 'steps': 34898, 'loss/train': 1.3559982776641846} +03/05/2022 06:28:44 - INFO - codeparrot_training - Step 34899: {'lr': 0.00044147661626168887, 'samples': 17868800, 'steps': 34899, 'loss/train': 1.4642717838287354} +03/05/2022 06:28:44 - INFO - codeparrot_training - Skipping example with length 895 (seq_length=1024) +03/05/2022 06:28:49 - INFO - codeparrot_training - Step 34900: {'lr': 0.0004414732042366078, 'samples': 17869312, 'steps': 34900, 'loss/train': 1.8140931129455566} +03/05/2022 06:28:52 - INFO - codeparrot_training - Step 34901: {'lr': 0.00044146979212525184, 'samples': 17869824, 'steps': 34901, 'loss/train': 1.3249456882476807} +03/05/2022 06:28:53 - INFO - codeparrot_training - Skipping example with length 880 (seq_length=1024) +03/05/2022 06:28:57 - INFO - codeparrot_training - Step 34902: {'lr': 0.0004414663799276225, 'samples': 17870336, 'steps': 34902, 'loss/train': 1.7898298501968384} +03/05/2022 06:29:01 - INFO - codeparrot_training - Step 34903: {'lr': 0.0004414629676437214, 'samples': 17870848, 'steps': 34903, 'loss/train': 1.941007375717163} +03/05/2022 06:29:01 - INFO - codeparrot_training - Skipping example with length 304 (seq_length=1024) +03/05/2022 06:29:06 - INFO - codeparrot_training - Step 34904: {'lr': 0.00044145955527355007, 'samples': 17871360, 'steps': 34904, 'loss/train': 2.0956506729125977} +03/05/2022 06:29:09 - INFO - codeparrot_training - Step 34905: {'lr': 0.00044145614281711, 'samples': 17871872, 'steps': 34905, 'loss/train': 1.3394807577133179} +03/05/2022 06:29:11 - INFO - codeparrot_training - Skipping example with length 972 (seq_length=1024) +03/05/2022 06:29:14 - INFO - codeparrot_training - Step 34906: {'lr': 0.00044145273027440275, 'samples': 17872384, 'steps': 34906, 'loss/train': 1.3507471084594727} +03/05/2022 06:29:17 - INFO - codeparrot_training - Step 34907: {'lr': 0.0004414493176454298, 'samples': 17872896, 'steps': 34907, 'loss/train': 1.6828564405441284} +03/05/2022 06:29:19 - INFO - codeparrot_training - Skipping example with length 39 (seq_length=1024) +03/05/2022 06:29:23 - INFO - codeparrot_training - Step 34908: {'lr': 0.0004414459049301929, 'samples': 17873408, 'steps': 34908, 'loss/train': 1.4212250709533691} +03/05/2022 06:29:26 - INFO - codeparrot_training - Step 34909: {'lr': 0.00044144249212869327, 'samples': 17873920, 'steps': 34909, 'loss/train': 1.5350430011749268} +03/05/2022 06:29:27 - INFO - codeparrot_training - Skipping example with length 998 (seq_length=1024) +03/05/2022 06:29:31 - INFO - codeparrot_training - Step 34910: {'lr': 0.0004414390792409326, 'samples': 17874432, 'steps': 34910, 'loss/train': 1.6525355577468872} +03/05/2022 06:29:34 - INFO - codeparrot_training - Step 34911: {'lr': 0.0004414356662669126, 'samples': 17874944, 'steps': 34911, 'loss/train': 2.043109893798828} +03/05/2022 06:29:36 - INFO - codeparrot_training - Skipping example with length 142 (seq_length=1024) +03/05/2022 06:29:40 - INFO - codeparrot_training - Step 34912: {'lr': 0.0004414322532066345, 'samples': 17875456, 'steps': 34912, 'loss/train': 1.9442780017852783} +03/05/2022 06:29:43 - INFO - codeparrot_training - Step 34913: {'lr': 0.0004414288400601, 'samples': 17875968, 'steps': 34913, 'loss/train': 1.5154223442077637} +03/05/2022 06:29:44 - INFO - codeparrot_training - Skipping example with length 428 (seq_length=1024) +03/05/2022 06:29:48 - INFO - codeparrot_training - Step 34914: {'lr': 0.0004414254268273107, 'samples': 17876480, 'steps': 34914, 'loss/train': 1.9016990661621094} +03/05/2022 06:29:51 - INFO - codeparrot_training - Step 34915: {'lr': 0.0004414220135082679, 'samples': 17876992, 'steps': 34915, 'loss/train': 1.9976986646652222} +03/05/2022 06:29:52 - INFO - codeparrot_training - Skipping example with length 116 (seq_length=1024) +03/05/2022 06:29:56 - INFO - codeparrot_training - Step 34916: {'lr': 0.0004414186001029734, 'samples': 17877504, 'steps': 34916, 'loss/train': 2.005429983139038} +03/05/2022 06:30:00 - INFO - codeparrot_training - Step 34917: {'lr': 0.00044141518661142864, 'samples': 17878016, 'steps': 34917, 'loss/train': 1.9350430965423584} +03/05/2022 06:30:01 - INFO - codeparrot_training - Skipping example with length 135 (seq_length=1024) +03/05/2022 06:30:05 - INFO - codeparrot_training - Step 34918: {'lr': 0.0004414117730336351, 'samples': 17878528, 'steps': 34918, 'loss/train': 2.531646966934204} +03/05/2022 06:30:08 - INFO - codeparrot_training - Step 34919: {'lr': 0.0004414083593695944, 'samples': 17879040, 'steps': 34919, 'loss/train': 1.0820378065109253} +03/05/2022 06:30:09 - INFO - codeparrot_training - Skipping example with length 1019 (seq_length=1024) +03/05/2022 06:30:13 - INFO - codeparrot_training - Step 34920: {'lr': 0.0004414049456193081, 'samples': 17879552, 'steps': 34920, 'loss/train': 2.08001446723938} +03/05/2022 06:30:17 - INFO - codeparrot_training - Step 34921: {'lr': 0.00044140153178277765, 'samples': 17880064, 'steps': 34921, 'loss/train': 1.464718222618103} +03/05/2022 06:30:22 - INFO - codeparrot_training - Step 34922: {'lr': 0.0004413981178600046, 'samples': 17880576, 'steps': 34922, 'loss/train': 1.1355311870574951} +03/05/2022 06:30:25 - INFO - codeparrot_training - Step 34923: {'lr': 0.00044139470385099047, 'samples': 17881088, 'steps': 34923, 'loss/train': 2.5171875953674316} +03/05/2022 06:30:26 - INFO - codeparrot_training - Skipping example with length 453 (seq_length=1024) +03/05/2022 06:30:30 - INFO - codeparrot_training - Step 34924: {'lr': 0.0004413912897557369, 'samples': 17881600, 'steps': 34924, 'loss/train': 1.6745734214782715} +03/05/2022 06:30:34 - INFO - codeparrot_training - Step 34925: {'lr': 0.0004413878755742454, 'samples': 17882112, 'steps': 34925, 'loss/train': 2.324354410171509} +03/05/2022 06:30:34 - INFO - codeparrot_training - Skipping example with length 842 (seq_length=1024) +03/05/2022 06:30:39 - INFO - codeparrot_training - Step 34926: {'lr': 0.00044138446130651736, 'samples': 17882624, 'steps': 34926, 'loss/train': 1.5801204442977905} +03/05/2022 06:30:42 - INFO - codeparrot_training - Step 34927: {'lr': 0.00044138104695255455, 'samples': 17883136, 'steps': 34927, 'loss/train': 0.6715707778930664} +03/05/2022 06:30:43 - INFO - codeparrot_training - Skipping example with length 102 (seq_length=1024) +03/05/2022 06:30:47 - INFO - codeparrot_training - Step 34928: {'lr': 0.00044137763251235837, 'samples': 17883648, 'steps': 34928, 'loss/train': 1.1433969736099243} +03/05/2022 06:30:50 - INFO - codeparrot_training - Step 34929: {'lr': 0.0004413742179859304, 'samples': 17884160, 'steps': 34929, 'loss/train': 1.5350388288497925} +03/05/2022 06:30:51 - INFO - codeparrot_training - Skipping example with length 122 (seq_length=1024) +03/05/2022 06:30:56 - INFO - codeparrot_training - Step 34930: {'lr': 0.00044137080337327205, 'samples': 17884672, 'steps': 34930, 'loss/train': 1.422473669052124} +03/05/2022 06:30:59 - INFO - codeparrot_training - Step 34931: {'lr': 0.000441367388674385, 'samples': 17885184, 'steps': 34931, 'loss/train': 1.985186219215393} +03/05/2022 06:31:00 - INFO - codeparrot_training - Skipping example with length 752 (seq_length=1024) +03/05/2022 06:31:04 - INFO - codeparrot_training - Step 34932: {'lr': 0.00044136397388927083, 'samples': 17885696, 'steps': 34932, 'loss/train': 1.69344961643219} +03/05/2022 06:31:07 - INFO - codeparrot_training - Step 34933: {'lr': 0.000441360559017931, 'samples': 17886208, 'steps': 34933, 'loss/train': 0.6037330031394958} +03/05/2022 06:31:08 - INFO - codeparrot_training - Skipping example with length 771 (seq_length=1024) +03/05/2022 06:31:13 - INFO - codeparrot_training - Step 34934: {'lr': 0.00044135714406036696, 'samples': 17886720, 'steps': 34934, 'loss/train': 1.2142333984375} +03/05/2022 06:31:16 - INFO - codeparrot_training - Step 34935: {'lr': 0.00044135372901658046, 'samples': 17887232, 'steps': 34935, 'loss/train': 2.2215306758880615} +03/05/2022 06:31:17 - INFO - codeparrot_training - Skipping example with length 345 (seq_length=1024) +03/05/2022 06:31:21 - INFO - codeparrot_training - Step 34936: {'lr': 0.0004413503138865729, 'samples': 17887744, 'steps': 34936, 'loss/train': 1.8244150876998901} +03/05/2022 06:31:24 - INFO - codeparrot_training - Step 34937: {'lr': 0.00044134689867034583, 'samples': 17888256, 'steps': 34937, 'loss/train': 1.8244725465774536} +03/05/2022 06:31:25 - INFO - codeparrot_training - Skipping example with length 378 (seq_length=1024) +03/05/2022 06:31:29 - INFO - codeparrot_training - Step 34938: {'lr': 0.00044134348336790074, 'samples': 17888768, 'steps': 34938, 'loss/train': 2.8450660705566406} +03/05/2022 06:31:33 - INFO - codeparrot_training - Step 34939: {'lr': 0.0004413400679792393, 'samples': 17889280, 'steps': 34939, 'loss/train': 1.809972882270813} +03/05/2022 06:31:34 - INFO - codeparrot_training - Skipping example with length 893 (seq_length=1024) +03/05/2022 06:31:38 - INFO - codeparrot_training - Step 34940: {'lr': 0.00044133665250436295, 'samples': 17889792, 'steps': 34940, 'loss/train': 1.190192699432373} +03/05/2022 06:31:41 - INFO - codeparrot_training - Step 34941: {'lr': 0.00044133323694327324, 'samples': 17890304, 'steps': 34941, 'loss/train': 1.6284505128860474} +03/05/2022 06:31:42 - INFO - codeparrot_training - Skipping example with length 424 (seq_length=1024) +03/05/2022 06:31:46 - INFO - codeparrot_training - Step 34942: {'lr': 0.0004413298212959718, 'samples': 17890816, 'steps': 34942, 'loss/train': 2.1109745502471924} +03/05/2022 06:31:49 - INFO - codeparrot_training - Step 34943: {'lr': 0.00044132640556246, 'samples': 17891328, 'steps': 34943, 'loss/train': 2.0893192291259766} +03/05/2022 06:31:50 - INFO - codeparrot_training - Skipping example with length 269 (seq_length=1024) +03/05/2022 06:31:55 - INFO - codeparrot_training - Step 34944: {'lr': 0.00044132298974273955, 'samples': 17891840, 'steps': 34944, 'loss/train': 1.3159205913543701} +03/05/2022 06:31:58 - INFO - codeparrot_training - Step 34945: {'lr': 0.00044131957383681186, 'samples': 17892352, 'steps': 34945, 'loss/train': 1.7453482151031494} +03/05/2022 06:31:59 - INFO - codeparrot_training - Skipping example with length 250 (seq_length=1024) +03/05/2022 06:32:03 - INFO - codeparrot_training - Step 34946: {'lr': 0.0004413161578446785, 'samples': 17892864, 'steps': 34946, 'loss/train': 1.7412831783294678} +03/05/2022 06:32:06 - INFO - codeparrot_training - Step 34947: {'lr': 0.00044131274176634113, 'samples': 17893376, 'steps': 34947, 'loss/train': 2.1667580604553223} +03/05/2022 06:32:07 - INFO - codeparrot_training - Skipping example with length 88 (seq_length=1024) +03/05/2022 06:32:12 - INFO - codeparrot_training - Step 34948: {'lr': 0.00044130932560180114, 'samples': 17893888, 'steps': 34948, 'loss/train': 1.0999799966812134} +03/05/2022 06:32:15 - INFO - codeparrot_training - Step 34949: {'lr': 0.0004413059093510601, 'samples': 17894400, 'steps': 34949, 'loss/train': 6.522251605987549} +03/05/2022 06:32:17 - INFO - codeparrot_training - Skipping example with length 981 (seq_length=1024) +03/05/2022 06:32:20 - INFO - codeparrot_training - Step 34950: {'lr': 0.00044130249301411957, 'samples': 17894912, 'steps': 34950, 'loss/train': 1.9802055358886719} +03/05/2022 06:32:23 - INFO - codeparrot_training - Step 34951: {'lr': 0.0004412990765909811, 'samples': 17895424, 'steps': 34951, 'loss/train': 1.7496472597122192} +03/05/2022 06:32:25 - INFO - codeparrot_training - Skipping example with length 271 (seq_length=1024) +03/05/2022 06:32:29 - INFO - codeparrot_training - Step 34952: {'lr': 0.0004412956600816462, 'samples': 17895936, 'steps': 34952, 'loss/train': 1.7567912340164185} +03/05/2022 06:32:32 - INFO - codeparrot_training - Step 34953: {'lr': 0.00044129224348611644, 'samples': 17896448, 'steps': 34953, 'loss/train': 1.2723947763442993} +03/05/2022 06:32:33 - INFO - codeparrot_training - Skipping example with length 670 (seq_length=1024) +03/05/2022 06:32:37 - INFO - codeparrot_training - Step 34954: {'lr': 0.0004412888268043934, 'samples': 17896960, 'steps': 34954, 'loss/train': 1.2555564641952515} +03/05/2022 06:32:40 - INFO - codeparrot_training - Step 34955: {'lr': 0.0004412854100364785, 'samples': 17897472, 'steps': 34955, 'loss/train': 1.5003790855407715} +03/05/2022 06:32:42 - INFO - codeparrot_training - Skipping example with length 513 (seq_length=1024) +03/05/2022 06:32:45 - INFO - codeparrot_training - Step 34956: {'lr': 0.0004412819931823734, 'samples': 17897984, 'steps': 34956, 'loss/train': 2.3147830963134766} +03/05/2022 06:32:49 - INFO - codeparrot_training - Step 34957: {'lr': 0.0004412785762420795, 'samples': 17898496, 'steps': 34957, 'loss/train': 0.25216546654701233} +03/05/2022 06:32:51 - INFO - codeparrot_training - Skipping example with length 183 (seq_length=1024) +03/05/2022 06:32:54 - INFO - codeparrot_training - Step 34958: {'lr': 0.0004412751592155985, 'samples': 17899008, 'steps': 34958, 'loss/train': 2.6953213214874268} +03/05/2022 06:32:57 - INFO - codeparrot_training - Step 34959: {'lr': 0.00044127174210293186, 'samples': 17899520, 'steps': 34959, 'loss/train': 2.280088424682617} +03/05/2022 06:32:59 - INFO - codeparrot_training - Skipping example with length 421 (seq_length=1024) +03/05/2022 06:33:02 - INFO - codeparrot_training - Step 34960: {'lr': 0.0004412683249040811, 'samples': 17900032, 'steps': 34960, 'loss/train': 2.6089258193969727} +03/05/2022 06:33:06 - INFO - codeparrot_training - Step 34961: {'lr': 0.0004412649076190478, 'samples': 17900544, 'steps': 34961, 'loss/train': 1.863905668258667} +03/05/2022 06:33:08 - INFO - codeparrot_training - Skipping example with length 176 (seq_length=1024) +03/05/2022 06:33:11 - INFO - codeparrot_training - Step 34962: {'lr': 0.00044126149024783346, 'samples': 17901056, 'steps': 34962, 'loss/train': 2.5443789958953857} +03/05/2022 06:33:14 - INFO - codeparrot_training - Step 34963: {'lr': 0.0004412580727904396, 'samples': 17901568, 'steps': 34963, 'loss/train': 1.5223264694213867} +03/05/2022 06:33:17 - INFO - codeparrot_training - Skipping example with length 640 (seq_length=1024) +03/05/2022 06:33:19 - INFO - codeparrot_training - Step 34964: {'lr': 0.0004412546552468679, 'samples': 17902080, 'steps': 34964, 'loss/train': 1.4610614776611328} +03/05/2022 06:33:23 - INFO - codeparrot_training - Step 34965: {'lr': 0.00044125123761711975, 'samples': 17902592, 'steps': 34965, 'loss/train': 1.9106993675231934} +03/05/2022 06:33:25 - INFO - codeparrot_training - Skipping example with length 124 (seq_length=1024) +03/05/2022 06:33:28 - INFO - codeparrot_training - Step 34966: {'lr': 0.00044124781990119677, 'samples': 17903104, 'steps': 34966, 'loss/train': 1.859367847442627} +03/05/2022 06:33:31 - INFO - codeparrot_training - Step 34967: {'lr': 0.0004412444020991004, 'samples': 17903616, 'steps': 34967, 'loss/train': 1.2246556282043457} +03/05/2022 06:33:33 - INFO - codeparrot_training - Skipping example with length 213 (seq_length=1024) +03/05/2022 06:33:36 - INFO - codeparrot_training - Step 34968: {'lr': 0.0004412409842108324, 'samples': 17904128, 'steps': 34968, 'loss/train': 1.358432412147522} +03/05/2022 06:33:40 - INFO - codeparrot_training - Step 34969: {'lr': 0.0004412375662363941, 'samples': 17904640, 'steps': 34969, 'loss/train': 2.53106951713562} +03/05/2022 06:33:42 - INFO - codeparrot_training - Skipping example with length 977 (seq_length=1024) +03/05/2022 06:33:45 - INFO - codeparrot_training - Step 34970: {'lr': 0.00044123414817578705, 'samples': 17905152, 'steps': 34970, 'loss/train': 1.6233115196228027} +03/05/2022 06:33:48 - INFO - codeparrot_training - Step 34971: {'lr': 0.00044123073002901286, 'samples': 17905664, 'steps': 34971, 'loss/train': 1.4780207872390747} +03/05/2022 06:33:50 - INFO - codeparrot_training - Skipping example with length 140 (seq_length=1024) +03/05/2022 06:33:53 - INFO - codeparrot_training - Step 34972: {'lr': 0.0004412273117960731, 'samples': 17906176, 'steps': 34972, 'loss/train': 1.4425920248031616} +03/05/2022 06:33:56 - INFO - codeparrot_training - Step 34973: {'lr': 0.00044122389347696925, 'samples': 17906688, 'steps': 34973, 'loss/train': 1.4676014184951782} +03/05/2022 06:33:59 - INFO - codeparrot_training - Skipping example with length 941 (seq_length=1024) +03/05/2022 06:34:02 - INFO - codeparrot_training - Step 34974: {'lr': 0.0004412204750717028, 'samples': 17907200, 'steps': 34974, 'loss/train': 1.9555248022079468} +03/05/2022 06:34:05 - INFO - codeparrot_training - Step 34975: {'lr': 0.00044121705658027545, 'samples': 17907712, 'steps': 34975, 'loss/train': 1.5807853937149048} +03/05/2022 06:34:07 - INFO - codeparrot_training - Skipping example with length 716 (seq_length=1024) +03/05/2022 06:34:10 - INFO - codeparrot_training - Step 34976: {'lr': 0.00044121363800268853, 'samples': 17908224, 'steps': 34976, 'loss/train': 1.85499107837677} +03/05/2022 06:34:13 - INFO - codeparrot_training - Step 34977: {'lr': 0.0004412102193389438, 'samples': 17908736, 'steps': 34977, 'loss/train': 1.8151769638061523} +03/05/2022 06:34:16 - INFO - codeparrot_training - Skipping example with length 472 (seq_length=1024) +03/05/2022 06:34:18 - INFO - codeparrot_training - Step 34978: {'lr': 0.0004412068005890427, 'samples': 17909248, 'steps': 34978, 'loss/train': 1.7757508754730225} +03/05/2022 06:34:22 - INFO - codeparrot_training - Step 34979: {'lr': 0.0004412033817529867, 'samples': 17909760, 'steps': 34979, 'loss/train': 0.6116886138916016} +03/05/2022 06:34:24 - INFO - codeparrot_training - Skipping example with length 570 (seq_length=1024) +03/05/2022 06:34:27 - INFO - codeparrot_training - Step 34980: {'lr': 0.0004411999628307775, 'samples': 17910272, 'steps': 34980, 'loss/train': 1.2069125175476074} +03/05/2022 06:34:30 - INFO - codeparrot_training - Step 34981: {'lr': 0.0004411965438224164, 'samples': 17910784, 'steps': 34981, 'loss/train': 1.580447793006897} +03/05/2022 06:34:33 - INFO - codeparrot_training - Skipping example with length 533 (seq_length=1024) +03/05/2022 06:34:35 - INFO - codeparrot_training - Step 34982: {'lr': 0.0004411931247279052, 'samples': 17911296, 'steps': 34982, 'loss/train': 0.15457546710968018} +03/05/2022 06:34:38 - INFO - codeparrot_training - Step 34983: {'lr': 0.00044118970554724523, 'samples': 17911808, 'steps': 34983, 'loss/train': 1.6314420700073242} +03/05/2022 06:34:41 - INFO - codeparrot_training - Skipping example with length 930 (seq_length=1024) +03/05/2022 06:34:44 - INFO - codeparrot_training - Step 34984: {'lr': 0.0004411862862804382, 'samples': 17912320, 'steps': 34984, 'loss/train': 0.7085153460502625} +03/05/2022 06:34:47 - INFO - codeparrot_training - Step 34985: {'lr': 0.0004411828669274856, 'samples': 17912832, 'steps': 34985, 'loss/train': 1.6789199113845825} +03/05/2022 06:34:50 - INFO - codeparrot_training - Step 34986: {'lr': 0.0004411794474883889, 'samples': 17913344, 'steps': 34986, 'loss/train': 1.7990858554840088} +03/05/2022 06:34:50 - INFO - codeparrot_training - Skipping example with length 278 (seq_length=1024) +03/05/2022 06:34:56 - INFO - codeparrot_training - Step 34987: {'lr': 0.0004411760279631497, 'samples': 17913856, 'steps': 34987, 'loss/train': 1.3297609090805054} +03/05/2022 06:34:58 - INFO - codeparrot_training - Skipping example with length 161 (seq_length=1024) +03/05/2022 06:35:01 - INFO - codeparrot_training - Step 34988: {'lr': 0.0004411726083517696, 'samples': 17914368, 'steps': 34988, 'loss/train': 1.4986047744750977} +03/05/2022 06:35:04 - INFO - codeparrot_training - Step 34989: {'lr': 0.00044116918865425004, 'samples': 17914880, 'steps': 34989, 'loss/train': 1.6168302297592163} +03/05/2022 06:35:07 - INFO - codeparrot_training - Step 34990: {'lr': 0.00044116576887059255, 'samples': 17915392, 'steps': 34990, 'loss/train': 1.833122968673706} +03/05/2022 06:35:13 - INFO - codeparrot_training - Step 34991: {'lr': 0.0004411623490007988, 'samples': 17915904, 'steps': 34991, 'loss/train': 1.6909750699996948} +03/05/2022 06:35:16 - INFO - codeparrot_training - Step 34992: {'lr': 0.0004411589290448701, 'samples': 17916416, 'steps': 34992, 'loss/train': 2.2682623863220215} +03/05/2022 06:35:16 - INFO - codeparrot_training - Skipping example with length 491 (seq_length=1024) +03/05/2022 06:35:21 - INFO - codeparrot_training - Step 34993: {'lr': 0.0004411555090028082, 'samples': 17916928, 'steps': 34993, 'loss/train': 1.3395839929580688} +03/05/2022 06:35:24 - INFO - codeparrot_training - Step 34994: {'lr': 0.00044115208887461464, 'samples': 17917440, 'steps': 34994, 'loss/train': 1.7266957759857178} +03/05/2022 06:35:25 - INFO - codeparrot_training - Skipping example with length 521 (seq_length=1024) +03/05/2022 06:35:30 - INFO - codeparrot_training - Step 34995: {'lr': 0.00044114866866029086, 'samples': 17917952, 'steps': 34995, 'loss/train': 1.4539505243301392} +03/05/2022 06:35:33 - INFO - codeparrot_training - Step 34996: {'lr': 0.00044114524835983844, 'samples': 17918464, 'steps': 34996, 'loss/train': 1.9073495864868164} +03/05/2022 06:35:34 - INFO - codeparrot_training - Skipping example with length 231 (seq_length=1024) +03/05/2022 06:35:38 - INFO - codeparrot_training - Step 34997: {'lr': 0.00044114182797325884, 'samples': 17918976, 'steps': 34997, 'loss/train': 1.963602900505066} +03/05/2022 06:35:41 - INFO - codeparrot_training - Step 34998: {'lr': 0.0004411384075005538, 'samples': 17919488, 'steps': 34998, 'loss/train': 0.9859839081764221} +03/05/2022 06:35:42 - INFO - codeparrot_training - Skipping example with length 698 (seq_length=1024) +03/05/2022 06:35:47 - INFO - codeparrot_training - Step 34999: {'lr': 0.0004411349869417247, 'samples': 17920000, 'steps': 34999, 'loss/train': 1.3265409469604492} +03/05/2022 06:35:47 - INFO - codeparrot_training - Evaluating and saving model checkpoint