{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.34787448688513184, "eval_steps": 500, "global_step": 15000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 7.727975270479135e-09, "loss": 2.2931, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.545595054095827e-08, "loss": 2.3449, "step": 2 }, { "epoch": 0.0, "learning_rate": 2.3183925811437404e-08, "loss": 3.1199, "step": 3 }, { "epoch": 0.0, "learning_rate": 3.091190108191654e-08, "loss": 2.4593, "step": 4 }, { "epoch": 0.0, "learning_rate": 3.863987635239568e-08, "loss": 2.8635, "step": 5 }, { "epoch": 0.0, "learning_rate": 4.636785162287481e-08, "loss": 2.8181, "step": 6 }, { "epoch": 0.0, "learning_rate": 5.4095826893353944e-08, "loss": 3.0884, "step": 7 }, { "epoch": 0.0, "learning_rate": 6.182380216383308e-08, "loss": 2.8522, "step": 8 }, { "epoch": 0.0, "learning_rate": 6.955177743431221e-08, "loss": 2.4496, "step": 9 }, { "epoch": 0.0, "learning_rate": 7.727975270479135e-08, "loss": 2.6519, "step": 10 }, { "epoch": 0.0, "learning_rate": 8.500772797527048e-08, "loss": 2.4888, "step": 11 }, { "epoch": 0.0, "learning_rate": 9.273570324574961e-08, "loss": 3.1319, "step": 12 }, { "epoch": 0.0, "learning_rate": 1.0046367851622876e-07, "loss": 2.6695, "step": 13 }, { "epoch": 0.0, "learning_rate": 1.0819165378670789e-07, "loss": 2.6447, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.1591962905718703e-07, "loss": 2.3883, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.2364760432766616e-07, "loss": 2.7252, "step": 16 }, { "epoch": 0.0, "learning_rate": 1.313755795981453e-07, "loss": 3.0519, "step": 17 }, { "epoch": 0.0, "learning_rate": 1.3910355486862442e-07, "loss": 2.5641, "step": 18 }, { "epoch": 0.0, "learning_rate": 1.4683153013910355e-07, "loss": 2.7555, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.545595054095827e-07, "loss": 2.6233, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.6228748068006184e-07, "loss": 2.6874, "step": 21 }, { "epoch": 0.0, "learning_rate": 1.7001545595054097e-07, "loss": 2.4484, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.7774343122102013e-07, "loss": 3.3117, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.8547140649149923e-07, "loss": 2.7778, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.9319938176197839e-07, "loss": 2.4847, "step": 25 }, { "epoch": 0.0, "learning_rate": 2.0092735703245752e-07, "loss": 2.6591, "step": 26 }, { "epoch": 0.0, "learning_rate": 2.0865533230293667e-07, "loss": 2.7363, "step": 27 }, { "epoch": 0.0, "learning_rate": 2.1638330757341578e-07, "loss": 2.3763, "step": 28 }, { "epoch": 0.0, "learning_rate": 2.241112828438949e-07, "loss": 2.345, "step": 29 }, { "epoch": 0.0, "learning_rate": 2.3183925811437406e-07, "loss": 3.3071, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.3956723338485317e-07, "loss": 3.558, "step": 31 }, { "epoch": 0.0, "learning_rate": 2.472952086553323e-07, "loss": 2.4276, "step": 32 }, { "epoch": 0.0, "learning_rate": 2.550231839258115e-07, "loss": 2.7492, "step": 33 }, { "epoch": 0.0, "learning_rate": 2.627511591962906e-07, "loss": 2.2478, "step": 34 }, { "epoch": 0.0, "learning_rate": 2.7047913446676974e-07, "loss": 2.6074, "step": 35 }, { "epoch": 0.0, "learning_rate": 2.7820710973724884e-07, "loss": 2.3372, "step": 36 }, { "epoch": 0.0, "learning_rate": 2.85935085007728e-07, "loss": 2.6465, "step": 37 }, { "epoch": 0.0, "learning_rate": 2.936630602782071e-07, "loss": 2.3942, "step": 38 }, { "epoch": 0.0, "learning_rate": 3.0139103554868626e-07, "loss": 2.524, "step": 39 }, { "epoch": 0.0, "learning_rate": 3.091190108191654e-07, "loss": 2.3285, "step": 40 }, { "epoch": 0.0, "learning_rate": 3.168469860896446e-07, "loss": 2.4557, "step": 41 }, { "epoch": 0.0, "learning_rate": 3.245749613601237e-07, "loss": 2.4891, "step": 42 }, { "epoch": 0.0, "learning_rate": 3.3230293663060283e-07, "loss": 2.2078, "step": 43 }, { "epoch": 0.0, "learning_rate": 3.4003091190108194e-07, "loss": 1.9521, "step": 44 }, { "epoch": 0.0, "learning_rate": 3.4775888717156104e-07, "loss": 2.879, "step": 45 }, { "epoch": 0.0, "learning_rate": 3.5548686244204025e-07, "loss": 2.3088, "step": 46 }, { "epoch": 0.0, "learning_rate": 3.6321483771251936e-07, "loss": 2.0741, "step": 47 }, { "epoch": 0.0, "learning_rate": 3.7094281298299846e-07, "loss": 2.4153, "step": 48 }, { "epoch": 0.0, "learning_rate": 3.786707882534776e-07, "loss": 2.3456, "step": 49 }, { "epoch": 0.0, "learning_rate": 3.8639876352395677e-07, "loss": 2.183, "step": 50 }, { "epoch": 0.0, "learning_rate": 3.941267387944359e-07, "loss": 2.2101, "step": 51 }, { "epoch": 0.0, "learning_rate": 4.0185471406491503e-07, "loss": 2.3656, "step": 52 }, { "epoch": 0.0, "learning_rate": 4.0958268933539414e-07, "loss": 2.0658, "step": 53 }, { "epoch": 0.0, "learning_rate": 4.1731066460587335e-07, "loss": 2.0589, "step": 54 }, { "epoch": 0.0, "learning_rate": 4.2503863987635245e-07, "loss": 1.9948, "step": 55 }, { "epoch": 0.0, "learning_rate": 4.3276661514683155e-07, "loss": 2.1037, "step": 56 }, { "epoch": 0.0, "learning_rate": 4.404945904173107e-07, "loss": 1.7966, "step": 57 }, { "epoch": 0.0, "learning_rate": 4.482225656877898e-07, "loss": 1.8509, "step": 58 }, { "epoch": 0.0, "learning_rate": 4.5595054095826897e-07, "loss": 1.9969, "step": 59 }, { "epoch": 0.0, "learning_rate": 4.6367851622874813e-07, "loss": 2.0279, "step": 60 }, { "epoch": 0.0, "learning_rate": 4.7140649149922723e-07, "loss": 1.9795, "step": 61 }, { "epoch": 0.0, "learning_rate": 4.791344667697063e-07, "loss": 1.7996, "step": 62 }, { "epoch": 0.0, "learning_rate": 4.868624420401855e-07, "loss": 1.9823, "step": 63 }, { "epoch": 0.0, "learning_rate": 4.945904173106646e-07, "loss": 1.8125, "step": 64 }, { "epoch": 0.0, "learning_rate": 5.023183925811439e-07, "loss": 1.8728, "step": 65 }, { "epoch": 0.0, "learning_rate": 5.10046367851623e-07, "loss": 1.6876, "step": 66 }, { "epoch": 0.0, "learning_rate": 5.177743431221021e-07, "loss": 1.7476, "step": 67 }, { "epoch": 0.0, "learning_rate": 5.255023183925812e-07, "loss": 1.6162, "step": 68 }, { "epoch": 0.0, "learning_rate": 5.332302936630604e-07, "loss": 1.65, "step": 69 }, { "epoch": 0.0, "learning_rate": 5.409582689335395e-07, "loss": 1.5924, "step": 70 }, { "epoch": 0.0, "learning_rate": 5.486862442040186e-07, "loss": 1.6156, "step": 71 }, { "epoch": 0.0, "learning_rate": 5.564142194744977e-07, "loss": 1.6495, "step": 72 }, { "epoch": 0.0, "learning_rate": 5.641421947449768e-07, "loss": 1.6621, "step": 73 }, { "epoch": 0.0, "learning_rate": 5.71870170015456e-07, "loss": 1.2976, "step": 74 }, { "epoch": 0.0, "learning_rate": 5.795981452859351e-07, "loss": 1.7546, "step": 75 }, { "epoch": 0.0, "learning_rate": 5.873261205564142e-07, "loss": 1.538, "step": 76 }, { "epoch": 0.0, "learning_rate": 5.950540958268934e-07, "loss": 1.5236, "step": 77 }, { "epoch": 0.0, "learning_rate": 6.027820710973725e-07, "loss": 1.27, "step": 78 }, { "epoch": 0.0, "learning_rate": 6.105100463678517e-07, "loss": 1.78, "step": 79 }, { "epoch": 0.0, "learning_rate": 6.182380216383308e-07, "loss": 1.8089, "step": 80 }, { "epoch": 0.0, "learning_rate": 6.259659969088099e-07, "loss": 1.6762, "step": 81 }, { "epoch": 0.0, "learning_rate": 6.336939721792891e-07, "loss": 1.5622, "step": 82 }, { "epoch": 0.0, "learning_rate": 6.414219474497683e-07, "loss": 1.4921, "step": 83 }, { "epoch": 0.0, "learning_rate": 6.491499227202474e-07, "loss": 1.4867, "step": 84 }, { "epoch": 0.0, "learning_rate": 6.568778979907265e-07, "loss": 1.737, "step": 85 }, { "epoch": 0.0, "learning_rate": 6.646058732612057e-07, "loss": 1.3997, "step": 86 }, { "epoch": 0.0, "learning_rate": 6.723338485316848e-07, "loss": 1.5297, "step": 87 }, { "epoch": 0.0, "learning_rate": 6.800618238021639e-07, "loss": 1.3141, "step": 88 }, { "epoch": 0.0, "learning_rate": 6.87789799072643e-07, "loss": 1.7022, "step": 89 }, { "epoch": 0.0, "learning_rate": 6.955177743431221e-07, "loss": 1.3224, "step": 90 }, { "epoch": 0.0, "learning_rate": 7.032457496136012e-07, "loss": 1.2317, "step": 91 }, { "epoch": 0.0, "learning_rate": 7.109737248840805e-07, "loss": 1.5758, "step": 92 }, { "epoch": 0.0, "learning_rate": 7.187017001545596e-07, "loss": 1.3038, "step": 93 }, { "epoch": 0.0, "learning_rate": 7.264296754250387e-07, "loss": 1.5212, "step": 94 }, { "epoch": 0.0, "learning_rate": 7.341576506955178e-07, "loss": 1.2761, "step": 95 }, { "epoch": 0.0, "learning_rate": 7.418856259659969e-07, "loss": 1.4376, "step": 96 }, { "epoch": 0.0, "learning_rate": 7.496136012364761e-07, "loss": 1.54, "step": 97 }, { "epoch": 0.0, "learning_rate": 7.573415765069552e-07, "loss": 1.7241, "step": 98 }, { "epoch": 0.0, "learning_rate": 7.650695517774344e-07, "loss": 1.2662, "step": 99 }, { "epoch": 0.0, "learning_rate": 7.727975270479135e-07, "loss": 1.172, "step": 100 }, { "epoch": 0.0, "learning_rate": 7.805255023183926e-07, "loss": 1.3014, "step": 101 }, { "epoch": 0.0, "learning_rate": 7.882534775888718e-07, "loss": 1.1871, "step": 102 }, { "epoch": 0.0, "learning_rate": 7.95981452859351e-07, "loss": 1.436, "step": 103 }, { "epoch": 0.0, "learning_rate": 8.037094281298301e-07, "loss": 1.6671, "step": 104 }, { "epoch": 0.0, "learning_rate": 8.114374034003092e-07, "loss": 1.4592, "step": 105 }, { "epoch": 0.0, "learning_rate": 8.191653786707883e-07, "loss": 1.3194, "step": 106 }, { "epoch": 0.0, "learning_rate": 8.268933539412674e-07, "loss": 1.3289, "step": 107 }, { "epoch": 0.0, "learning_rate": 8.346213292117467e-07, "loss": 1.241, "step": 108 }, { "epoch": 0.0, "learning_rate": 8.423493044822258e-07, "loss": 1.3951, "step": 109 }, { "epoch": 0.0, "learning_rate": 8.500772797527049e-07, "loss": 1.5699, "step": 110 }, { "epoch": 0.0, "learning_rate": 8.57805255023184e-07, "loss": 1.3149, "step": 111 }, { "epoch": 0.0, "learning_rate": 8.655332302936631e-07, "loss": 1.5291, "step": 112 }, { "epoch": 0.0, "learning_rate": 8.732612055641422e-07, "loss": 1.4352, "step": 113 }, { "epoch": 0.0, "learning_rate": 8.809891808346214e-07, "loss": 1.3655, "step": 114 }, { "epoch": 0.0, "learning_rate": 8.887171561051005e-07, "loss": 1.1939, "step": 115 }, { "epoch": 0.0, "learning_rate": 8.964451313755796e-07, "loss": 1.2788, "step": 116 }, { "epoch": 0.0, "learning_rate": 9.041731066460588e-07, "loss": 1.2352, "step": 117 }, { "epoch": 0.0, "learning_rate": 9.119010819165379e-07, "loss": 1.5089, "step": 118 }, { "epoch": 0.0, "learning_rate": 9.196290571870171e-07, "loss": 1.3979, "step": 119 }, { "epoch": 0.0, "learning_rate": 9.273570324574963e-07, "loss": 1.378, "step": 120 }, { "epoch": 0.0, "learning_rate": 9.350850077279754e-07, "loss": 1.1833, "step": 121 }, { "epoch": 0.0, "learning_rate": 9.428129829984545e-07, "loss": 1.7065, "step": 122 }, { "epoch": 0.0, "learning_rate": 9.505409582689336e-07, "loss": 1.4275, "step": 123 }, { "epoch": 0.0, "learning_rate": 9.582689335394127e-07, "loss": 1.2258, "step": 124 }, { "epoch": 0.0, "learning_rate": 9.65996908809892e-07, "loss": 1.5104, "step": 125 }, { "epoch": 0.0, "learning_rate": 9.73724884080371e-07, "loss": 1.5453, "step": 126 }, { "epoch": 0.0, "learning_rate": 9.814528593508502e-07, "loss": 1.297, "step": 127 }, { "epoch": 0.0, "learning_rate": 9.891808346213293e-07, "loss": 1.1416, "step": 128 }, { "epoch": 0.0, "learning_rate": 9.969088098918084e-07, "loss": 1.4373, "step": 129 }, { "epoch": 0.0, "learning_rate": 1.0046367851622877e-06, "loss": 1.4038, "step": 130 }, { "epoch": 0.0, "learning_rate": 1.0123647604327668e-06, "loss": 1.4834, "step": 131 }, { "epoch": 0.0, "learning_rate": 1.020092735703246e-06, "loss": 1.2655, "step": 132 }, { "epoch": 0.0, "learning_rate": 1.027820710973725e-06, "loss": 1.5367, "step": 133 }, { "epoch": 0.0, "learning_rate": 1.0355486862442041e-06, "loss": 1.6032, "step": 134 }, { "epoch": 0.0, "learning_rate": 1.0432766615146832e-06, "loss": 1.5178, "step": 135 }, { "epoch": 0.0, "learning_rate": 1.0510046367851623e-06, "loss": 1.3513, "step": 136 }, { "epoch": 0.0, "learning_rate": 1.0587326120556414e-06, "loss": 1.4336, "step": 137 }, { "epoch": 0.0, "learning_rate": 1.0664605873261208e-06, "loss": 1.5365, "step": 138 }, { "epoch": 0.0, "learning_rate": 1.0741885625965999e-06, "loss": 1.2688, "step": 139 }, { "epoch": 0.0, "learning_rate": 1.081916537867079e-06, "loss": 1.1308, "step": 140 }, { "epoch": 0.0, "learning_rate": 1.089644513137558e-06, "loss": 1.4585, "step": 141 }, { "epoch": 0.0, "learning_rate": 1.0973724884080372e-06, "loss": 1.3182, "step": 142 }, { "epoch": 0.0, "learning_rate": 1.1051004636785163e-06, "loss": 1.263, "step": 143 }, { "epoch": 0.0, "learning_rate": 1.1128284389489954e-06, "loss": 1.3138, "step": 144 }, { "epoch": 0.0, "learning_rate": 1.1205564142194745e-06, "loss": 1.3829, "step": 145 }, { "epoch": 0.0, "learning_rate": 1.1282843894899536e-06, "loss": 1.2723, "step": 146 }, { "epoch": 0.0, "learning_rate": 1.136012364760433e-06, "loss": 1.0018, "step": 147 }, { "epoch": 0.0, "learning_rate": 1.143740340030912e-06, "loss": 1.2995, "step": 148 }, { "epoch": 0.0, "learning_rate": 1.1514683153013911e-06, "loss": 1.1457, "step": 149 }, { "epoch": 0.0, "learning_rate": 1.1591962905718702e-06, "loss": 1.1206, "step": 150 }, { "epoch": 0.0, "learning_rate": 1.1669242658423493e-06, "loss": 1.4278, "step": 151 }, { "epoch": 0.0, "learning_rate": 1.1746522411128284e-06, "loss": 1.2867, "step": 152 }, { "epoch": 0.0, "learning_rate": 1.1823802163833077e-06, "loss": 1.4715, "step": 153 }, { "epoch": 0.0, "learning_rate": 1.1901081916537868e-06, "loss": 1.7179, "step": 154 }, { "epoch": 0.0, "learning_rate": 1.197836166924266e-06, "loss": 1.5918, "step": 155 }, { "epoch": 0.0, "learning_rate": 1.205564142194745e-06, "loss": 1.1561, "step": 156 }, { "epoch": 0.0, "learning_rate": 1.2132921174652241e-06, "loss": 1.7272, "step": 157 }, { "epoch": 0.0, "learning_rate": 1.2210200927357035e-06, "loss": 1.1849, "step": 158 }, { "epoch": 0.0, "learning_rate": 1.2287480680061826e-06, "loss": 1.152, "step": 159 }, { "epoch": 0.0, "learning_rate": 1.2364760432766617e-06, "loss": 0.8599, "step": 160 }, { "epoch": 0.0, "learning_rate": 1.2442040185471408e-06, "loss": 1.2931, "step": 161 }, { "epoch": 0.0, "learning_rate": 1.2519319938176199e-06, "loss": 1.2395, "step": 162 }, { "epoch": 0.0, "learning_rate": 1.259659969088099e-06, "loss": 1.1549, "step": 163 }, { "epoch": 0.0, "learning_rate": 1.2673879443585783e-06, "loss": 1.2306, "step": 164 }, { "epoch": 0.0, "learning_rate": 1.2751159196290572e-06, "loss": 1.3115, "step": 165 }, { "epoch": 0.0, "learning_rate": 1.2828438948995365e-06, "loss": 1.3662, "step": 166 }, { "epoch": 0.0, "learning_rate": 1.2905718701700156e-06, "loss": 1.1904, "step": 167 }, { "epoch": 0.0, "learning_rate": 1.2982998454404947e-06, "loss": 1.4409, "step": 168 }, { "epoch": 0.0, "learning_rate": 1.3060278207109738e-06, "loss": 1.0001, "step": 169 }, { "epoch": 0.0, "learning_rate": 1.313755795981453e-06, "loss": 1.0936, "step": 170 }, { "epoch": 0.0, "learning_rate": 1.321483771251932e-06, "loss": 1.382, "step": 171 }, { "epoch": 0.0, "learning_rate": 1.3292117465224113e-06, "loss": 1.6164, "step": 172 }, { "epoch": 0.0, "learning_rate": 1.3369397217928902e-06, "loss": 1.1166, "step": 173 }, { "epoch": 0.0, "learning_rate": 1.3446676970633695e-06, "loss": 1.4625, "step": 174 }, { "epoch": 0.0, "learning_rate": 1.3523956723338486e-06, "loss": 1.2964, "step": 175 }, { "epoch": 0.0, "learning_rate": 1.3601236476043278e-06, "loss": 1.3508, "step": 176 }, { "epoch": 0.0, "learning_rate": 1.367851622874807e-06, "loss": 1.345, "step": 177 }, { "epoch": 0.0, "learning_rate": 1.375579598145286e-06, "loss": 1.5836, "step": 178 }, { "epoch": 0.0, "learning_rate": 1.3833075734157653e-06, "loss": 1.3335, "step": 179 }, { "epoch": 0.0, "learning_rate": 1.3910355486862442e-06, "loss": 1.4888, "step": 180 }, { "epoch": 0.0, "learning_rate": 1.3987635239567235e-06, "loss": 1.0348, "step": 181 }, { "epoch": 0.0, "learning_rate": 1.4064914992272024e-06, "loss": 1.1437, "step": 182 }, { "epoch": 0.0, "learning_rate": 1.4142194744976817e-06, "loss": 1.0498, "step": 183 }, { "epoch": 0.0, "learning_rate": 1.421947449768161e-06, "loss": 1.2981, "step": 184 }, { "epoch": 0.0, "learning_rate": 1.42967542503864e-06, "loss": 1.2842, "step": 185 }, { "epoch": 0.0, "learning_rate": 1.4374034003091192e-06, "loss": 1.5818, "step": 186 }, { "epoch": 0.0, "learning_rate": 1.445131375579598e-06, "loss": 1.2794, "step": 187 }, { "epoch": 0.0, "learning_rate": 1.4528593508500774e-06, "loss": 1.185, "step": 188 }, { "epoch": 0.0, "learning_rate": 1.4605873261205567e-06, "loss": 1.3391, "step": 189 }, { "epoch": 0.0, "learning_rate": 1.4683153013910356e-06, "loss": 1.1255, "step": 190 }, { "epoch": 0.0, "learning_rate": 1.476043276661515e-06, "loss": 1.254, "step": 191 }, { "epoch": 0.0, "learning_rate": 1.4837712519319938e-06, "loss": 1.0749, "step": 192 }, { "epoch": 0.0, "learning_rate": 1.4914992272024732e-06, "loss": 1.0715, "step": 193 }, { "epoch": 0.0, "learning_rate": 1.4992272024729523e-06, "loss": 1.0415, "step": 194 }, { "epoch": 0.0, "learning_rate": 1.5069551777434314e-06, "loss": 1.4251, "step": 195 }, { "epoch": 0.0, "learning_rate": 1.5146831530139105e-06, "loss": 1.4161, "step": 196 }, { "epoch": 0.0, "learning_rate": 1.5224111282843896e-06, "loss": 0.9244, "step": 197 }, { "epoch": 0.0, "learning_rate": 1.5301391035548689e-06, "loss": 1.2109, "step": 198 }, { "epoch": 0.0, "learning_rate": 1.5378670788253478e-06, "loss": 1.0854, "step": 199 }, { "epoch": 0.0, "learning_rate": 1.545595054095827e-06, "loss": 1.0815, "step": 200 }, { "epoch": 0.0, "learning_rate": 1.5533230293663062e-06, "loss": 1.5258, "step": 201 }, { "epoch": 0.0, "learning_rate": 1.5610510046367853e-06, "loss": 1.4119, "step": 202 }, { "epoch": 0.0, "learning_rate": 1.5687789799072644e-06, "loss": 1.4017, "step": 203 }, { "epoch": 0.0, "learning_rate": 1.5765069551777435e-06, "loss": 1.4762, "step": 204 }, { "epoch": 0.0, "learning_rate": 1.5842349304482226e-06, "loss": 1.1644, "step": 205 }, { "epoch": 0.0, "learning_rate": 1.591962905718702e-06, "loss": 1.4856, "step": 206 }, { "epoch": 0.0, "learning_rate": 1.5996908809891808e-06, "loss": 1.2342, "step": 207 }, { "epoch": 0.0, "learning_rate": 1.6074188562596601e-06, "loss": 1.3089, "step": 208 }, { "epoch": 0.0, "learning_rate": 1.615146831530139e-06, "loss": 1.5171, "step": 209 }, { "epoch": 0.0, "learning_rate": 1.6228748068006183e-06, "loss": 1.2524, "step": 210 }, { "epoch": 0.0, "learning_rate": 1.6306027820710977e-06, "loss": 1.1537, "step": 211 }, { "epoch": 0.0, "learning_rate": 1.6383307573415765e-06, "loss": 1.1721, "step": 212 }, { "epoch": 0.0, "learning_rate": 1.6460587326120559e-06, "loss": 1.1174, "step": 213 }, { "epoch": 0.0, "learning_rate": 1.6537867078825348e-06, "loss": 1.2553, "step": 214 }, { "epoch": 0.0, "learning_rate": 1.661514683153014e-06, "loss": 1.1377, "step": 215 }, { "epoch": 0.01, "learning_rate": 1.6692426584234934e-06, "loss": 1.3596, "step": 216 }, { "epoch": 0.01, "learning_rate": 1.6769706336939723e-06, "loss": 1.2929, "step": 217 }, { "epoch": 0.01, "learning_rate": 1.6846986089644516e-06, "loss": 1.5419, "step": 218 }, { "epoch": 0.01, "learning_rate": 1.6924265842349305e-06, "loss": 1.193, "step": 219 }, { "epoch": 0.01, "learning_rate": 1.7001545595054098e-06, "loss": 1.096, "step": 220 }, { "epoch": 0.01, "learning_rate": 1.7078825347758887e-06, "loss": 1.2455, "step": 221 }, { "epoch": 0.01, "learning_rate": 1.715610510046368e-06, "loss": 1.3578, "step": 222 }, { "epoch": 0.01, "learning_rate": 1.7233384853168473e-06, "loss": 1.0786, "step": 223 }, { "epoch": 0.01, "learning_rate": 1.7310664605873262e-06, "loss": 1.04, "step": 224 }, { "epoch": 0.01, "learning_rate": 1.7387944358578055e-06, "loss": 1.2586, "step": 225 }, { "epoch": 0.01, "learning_rate": 1.7465224111282844e-06, "loss": 1.3006, "step": 226 }, { "epoch": 0.01, "learning_rate": 1.7542503863987637e-06, "loss": 1.0062, "step": 227 }, { "epoch": 0.01, "learning_rate": 1.7619783616692428e-06, "loss": 1.4124, "step": 228 }, { "epoch": 0.01, "learning_rate": 1.769706336939722e-06, "loss": 1.1559, "step": 229 }, { "epoch": 0.01, "learning_rate": 1.777434312210201e-06, "loss": 1.2943, "step": 230 }, { "epoch": 0.01, "learning_rate": 1.7851622874806801e-06, "loss": 1.2482, "step": 231 }, { "epoch": 0.01, "learning_rate": 1.7928902627511593e-06, "loss": 0.9883, "step": 232 }, { "epoch": 0.01, "learning_rate": 1.8006182380216386e-06, "loss": 1.1575, "step": 233 }, { "epoch": 0.01, "learning_rate": 1.8083462132921177e-06, "loss": 1.5491, "step": 234 }, { "epoch": 0.01, "learning_rate": 1.8160741885625968e-06, "loss": 1.3182, "step": 235 }, { "epoch": 0.01, "learning_rate": 1.8238021638330759e-06, "loss": 1.1481, "step": 236 }, { "epoch": 0.01, "learning_rate": 1.831530139103555e-06, "loss": 0.921, "step": 237 }, { "epoch": 0.01, "learning_rate": 1.8392581143740343e-06, "loss": 1.2817, "step": 238 }, { "epoch": 0.01, "learning_rate": 1.8469860896445132e-06, "loss": 1.3573, "step": 239 }, { "epoch": 0.01, "learning_rate": 1.8547140649149925e-06, "loss": 1.1618, "step": 240 }, { "epoch": 0.01, "learning_rate": 1.8624420401854714e-06, "loss": 1.5487, "step": 241 }, { "epoch": 0.01, "learning_rate": 1.8701700154559507e-06, "loss": 0.9629, "step": 242 }, { "epoch": 0.01, "learning_rate": 1.8778979907264296e-06, "loss": 1.4002, "step": 243 }, { "epoch": 0.01, "learning_rate": 1.885625965996909e-06, "loss": 1.2174, "step": 244 }, { "epoch": 0.01, "learning_rate": 1.8933539412673882e-06, "loss": 1.4701, "step": 245 }, { "epoch": 0.01, "learning_rate": 1.9010819165378671e-06, "loss": 1.205, "step": 246 }, { "epoch": 0.01, "learning_rate": 1.9088098918083462e-06, "loss": 1.3006, "step": 247 }, { "epoch": 0.01, "learning_rate": 1.9165378670788253e-06, "loss": 1.4203, "step": 248 }, { "epoch": 0.01, "learning_rate": 1.9242658423493044e-06, "loss": 1.4927, "step": 249 }, { "epoch": 0.01, "learning_rate": 1.931993817619784e-06, "loss": 1.3514, "step": 250 }, { "epoch": 0.01, "learning_rate": 1.9397217928902626e-06, "loss": 1.3234, "step": 251 }, { "epoch": 0.01, "learning_rate": 1.947449768160742e-06, "loss": 1.5456, "step": 252 }, { "epoch": 0.01, "learning_rate": 1.9551777434312213e-06, "loss": 1.5114, "step": 253 }, { "epoch": 0.01, "learning_rate": 1.9629057187017004e-06, "loss": 1.3371, "step": 254 }, { "epoch": 0.01, "learning_rate": 1.9706336939721795e-06, "loss": 1.59, "step": 255 }, { "epoch": 0.01, "learning_rate": 1.9783616692426586e-06, "loss": 1.1611, "step": 256 }, { "epoch": 0.01, "learning_rate": 1.9860896445131377e-06, "loss": 1.5932, "step": 257 }, { "epoch": 0.01, "learning_rate": 1.993817619783617e-06, "loss": 1.2864, "step": 258 }, { "epoch": 0.01, "learning_rate": 2.001545595054096e-06, "loss": 1.3168, "step": 259 }, { "epoch": 0.01, "learning_rate": 2.0092735703245754e-06, "loss": 1.2432, "step": 260 }, { "epoch": 0.01, "learning_rate": 2.017001545595054e-06, "loss": 1.388, "step": 261 }, { "epoch": 0.01, "learning_rate": 2.0247295208655336e-06, "loss": 1.4357, "step": 262 }, { "epoch": 0.01, "learning_rate": 2.0324574961360123e-06, "loss": 1.5013, "step": 263 }, { "epoch": 0.01, "learning_rate": 2.040185471406492e-06, "loss": 1.2545, "step": 264 }, { "epoch": 0.01, "learning_rate": 2.0479134466769705e-06, "loss": 1.2871, "step": 265 }, { "epoch": 0.01, "learning_rate": 2.05564142194745e-06, "loss": 1.1835, "step": 266 }, { "epoch": 0.01, "learning_rate": 2.063369397217929e-06, "loss": 1.1417, "step": 267 }, { "epoch": 0.01, "learning_rate": 2.0710973724884083e-06, "loss": 1.1718, "step": 268 }, { "epoch": 0.01, "learning_rate": 2.0788253477588874e-06, "loss": 1.2569, "step": 269 }, { "epoch": 0.01, "learning_rate": 2.0865533230293665e-06, "loss": 0.8723, "step": 270 }, { "epoch": 0.01, "learning_rate": 2.0942812982998456e-06, "loss": 1.2188, "step": 271 }, { "epoch": 0.01, "learning_rate": 2.1020092735703247e-06, "loss": 1.0924, "step": 272 }, { "epoch": 0.01, "learning_rate": 2.1097372488408038e-06, "loss": 1.2829, "step": 273 }, { "epoch": 0.01, "learning_rate": 2.117465224111283e-06, "loss": 1.2606, "step": 274 }, { "epoch": 0.01, "learning_rate": 2.125193199381762e-06, "loss": 1.2475, "step": 275 }, { "epoch": 0.01, "learning_rate": 2.1329211746522415e-06, "loss": 1.3414, "step": 276 }, { "epoch": 0.01, "learning_rate": 2.1406491499227206e-06, "loss": 1.4344, "step": 277 }, { "epoch": 0.01, "learning_rate": 2.1483771251931997e-06, "loss": 1.0516, "step": 278 }, { "epoch": 0.01, "learning_rate": 2.156105100463679e-06, "loss": 1.1721, "step": 279 }, { "epoch": 0.01, "learning_rate": 2.163833075734158e-06, "loss": 1.0635, "step": 280 }, { "epoch": 0.01, "learning_rate": 2.171561051004637e-06, "loss": 1.5116, "step": 281 }, { "epoch": 0.01, "learning_rate": 2.179289026275116e-06, "loss": 1.4212, "step": 282 }, { "epoch": 0.01, "learning_rate": 2.1870170015455952e-06, "loss": 1.2306, "step": 283 }, { "epoch": 0.01, "learning_rate": 2.1947449768160743e-06, "loss": 1.2153, "step": 284 }, { "epoch": 0.01, "learning_rate": 2.2024729520865534e-06, "loss": 1.1762, "step": 285 }, { "epoch": 0.01, "learning_rate": 2.2102009273570325e-06, "loss": 1.2163, "step": 286 }, { "epoch": 0.01, "learning_rate": 2.2179289026275116e-06, "loss": 1.1805, "step": 287 }, { "epoch": 0.01, "learning_rate": 2.2256568778979908e-06, "loss": 1.4171, "step": 288 }, { "epoch": 0.01, "learning_rate": 2.2333848531684703e-06, "loss": 1.4836, "step": 289 }, { "epoch": 0.01, "learning_rate": 2.241112828438949e-06, "loss": 1.0107, "step": 290 }, { "epoch": 0.01, "learning_rate": 2.2488408037094285e-06, "loss": 1.2116, "step": 291 }, { "epoch": 0.01, "learning_rate": 2.256568778979907e-06, "loss": 1.3679, "step": 292 }, { "epoch": 0.01, "learning_rate": 2.2642967542503867e-06, "loss": 1.0301, "step": 293 }, { "epoch": 0.01, "learning_rate": 2.272024729520866e-06, "loss": 1.313, "step": 294 }, { "epoch": 0.01, "learning_rate": 2.279752704791345e-06, "loss": 0.9755, "step": 295 }, { "epoch": 0.01, "learning_rate": 2.287480680061824e-06, "loss": 1.4204, "step": 296 }, { "epoch": 0.01, "learning_rate": 2.295208655332303e-06, "loss": 1.1289, "step": 297 }, { "epoch": 0.01, "learning_rate": 2.3029366306027822e-06, "loss": 1.2812, "step": 298 }, { "epoch": 0.01, "learning_rate": 2.3106646058732613e-06, "loss": 1.0564, "step": 299 }, { "epoch": 0.01, "learning_rate": 2.3183925811437404e-06, "loss": 1.2387, "step": 300 }, { "epoch": 0.01, "learning_rate": 2.32612055641422e-06, "loss": 0.9543, "step": 301 }, { "epoch": 0.01, "learning_rate": 2.3338485316846986e-06, "loss": 1.1935, "step": 302 }, { "epoch": 0.01, "learning_rate": 2.341576506955178e-06, "loss": 1.3333, "step": 303 }, { "epoch": 0.01, "learning_rate": 2.349304482225657e-06, "loss": 1.3996, "step": 304 }, { "epoch": 0.01, "learning_rate": 2.3570324574961364e-06, "loss": 1.2323, "step": 305 }, { "epoch": 0.01, "learning_rate": 2.3647604327666155e-06, "loss": 1.0988, "step": 306 }, { "epoch": 0.01, "learning_rate": 2.3724884080370946e-06, "loss": 1.3991, "step": 307 }, { "epoch": 0.01, "learning_rate": 2.3802163833075737e-06, "loss": 1.2453, "step": 308 }, { "epoch": 0.01, "learning_rate": 2.3879443585780528e-06, "loss": 1.1582, "step": 309 }, { "epoch": 0.01, "learning_rate": 2.395672333848532e-06, "loss": 1.0753, "step": 310 }, { "epoch": 0.01, "learning_rate": 2.403400309119011e-06, "loss": 1.1751, "step": 311 }, { "epoch": 0.01, "learning_rate": 2.41112828438949e-06, "loss": 1.1911, "step": 312 }, { "epoch": 0.01, "learning_rate": 2.418856259659969e-06, "loss": 1.2496, "step": 313 }, { "epoch": 0.01, "learning_rate": 2.4265842349304483e-06, "loss": 1.2231, "step": 314 }, { "epoch": 0.01, "learning_rate": 2.4343122102009274e-06, "loss": 1.0726, "step": 315 }, { "epoch": 0.01, "learning_rate": 2.442040185471407e-06, "loss": 1.2714, "step": 316 }, { "epoch": 0.01, "learning_rate": 2.4497681607418856e-06, "loss": 1.4325, "step": 317 }, { "epoch": 0.01, "learning_rate": 2.457496136012365e-06, "loss": 1.0503, "step": 318 }, { "epoch": 0.01, "learning_rate": 2.465224111282844e-06, "loss": 1.0211, "step": 319 }, { "epoch": 0.01, "learning_rate": 2.4729520865533233e-06, "loss": 1.4132, "step": 320 }, { "epoch": 0.01, "learning_rate": 2.4806800618238024e-06, "loss": 1.215, "step": 321 }, { "epoch": 0.01, "learning_rate": 2.4884080370942815e-06, "loss": 1.0295, "step": 322 }, { "epoch": 0.01, "learning_rate": 2.4961360123647607e-06, "loss": 1.2604, "step": 323 }, { "epoch": 0.01, "learning_rate": 2.5038639876352398e-06, "loss": 1.1653, "step": 324 }, { "epoch": 0.01, "learning_rate": 2.511591962905719e-06, "loss": 1.1451, "step": 325 }, { "epoch": 0.01, "learning_rate": 2.519319938176198e-06, "loss": 1.1996, "step": 326 }, { "epoch": 0.01, "learning_rate": 2.5270479134466775e-06, "loss": 1.4474, "step": 327 }, { "epoch": 0.01, "learning_rate": 2.5347758887171566e-06, "loss": 1.1767, "step": 328 }, { "epoch": 0.01, "learning_rate": 2.5425038639876353e-06, "loss": 1.1176, "step": 329 }, { "epoch": 0.01, "learning_rate": 2.5502318392581144e-06, "loss": 1.1659, "step": 330 }, { "epoch": 0.01, "learning_rate": 2.557959814528594e-06, "loss": 1.2333, "step": 331 }, { "epoch": 0.01, "learning_rate": 2.565687789799073e-06, "loss": 0.8517, "step": 332 }, { "epoch": 0.01, "learning_rate": 2.5734157650695517e-06, "loss": 1.146, "step": 333 }, { "epoch": 0.01, "learning_rate": 2.5811437403400312e-06, "loss": 1.4031, "step": 334 }, { "epoch": 0.01, "learning_rate": 2.5888717156105103e-06, "loss": 1.3495, "step": 335 }, { "epoch": 0.01, "learning_rate": 2.5965996908809894e-06, "loss": 1.2534, "step": 336 }, { "epoch": 0.01, "learning_rate": 2.604327666151468e-06, "loss": 1.5338, "step": 337 }, { "epoch": 0.01, "learning_rate": 2.6120556414219476e-06, "loss": 0.8921, "step": 338 }, { "epoch": 0.01, "learning_rate": 2.6197836166924267e-06, "loss": 1.1412, "step": 339 }, { "epoch": 0.01, "learning_rate": 2.627511591962906e-06, "loss": 1.138, "step": 340 }, { "epoch": 0.01, "learning_rate": 2.6352395672333854e-06, "loss": 1.0738, "step": 341 }, { "epoch": 0.01, "learning_rate": 2.642967542503864e-06, "loss": 1.3338, "step": 342 }, { "epoch": 0.01, "learning_rate": 2.650695517774343e-06, "loss": 1.0484, "step": 343 }, { "epoch": 0.01, "learning_rate": 2.6584234930448227e-06, "loss": 1.2806, "step": 344 }, { "epoch": 0.01, "learning_rate": 2.6661514683153018e-06, "loss": 1.2843, "step": 345 }, { "epoch": 0.01, "learning_rate": 2.6738794435857805e-06, "loss": 1.0751, "step": 346 }, { "epoch": 0.01, "learning_rate": 2.6816074188562596e-06, "loss": 1.3177, "step": 347 }, { "epoch": 0.01, "learning_rate": 2.689335394126739e-06, "loss": 1.3157, "step": 348 }, { "epoch": 0.01, "learning_rate": 2.697063369397218e-06, "loss": 1.2467, "step": 349 }, { "epoch": 0.01, "learning_rate": 2.7047913446676973e-06, "loss": 1.2476, "step": 350 }, { "epoch": 0.01, "learning_rate": 2.712519319938177e-06, "loss": 1.0204, "step": 351 }, { "epoch": 0.01, "learning_rate": 2.7202472952086555e-06, "loss": 1.2446, "step": 352 }, { "epoch": 0.01, "learning_rate": 2.7279752704791346e-06, "loss": 1.202, "step": 353 }, { "epoch": 0.01, "learning_rate": 2.735703245749614e-06, "loss": 1.0302, "step": 354 }, { "epoch": 0.01, "learning_rate": 2.7434312210200932e-06, "loss": 1.3204, "step": 355 }, { "epoch": 0.01, "learning_rate": 2.751159196290572e-06, "loss": 1.1462, "step": 356 }, { "epoch": 0.01, "learning_rate": 2.758887171561051e-06, "loss": 1.2289, "step": 357 }, { "epoch": 0.01, "learning_rate": 2.7666151468315306e-06, "loss": 0.9908, "step": 358 }, { "epoch": 0.01, "learning_rate": 2.7743431221020097e-06, "loss": 1.0835, "step": 359 }, { "epoch": 0.01, "learning_rate": 2.7820710973724883e-06, "loss": 1.2771, "step": 360 }, { "epoch": 0.01, "learning_rate": 2.789799072642968e-06, "loss": 1.1362, "step": 361 }, { "epoch": 0.01, "learning_rate": 2.797527047913447e-06, "loss": 1.2491, "step": 362 }, { "epoch": 0.01, "learning_rate": 2.805255023183926e-06, "loss": 1.3369, "step": 363 }, { "epoch": 0.01, "learning_rate": 2.8129829984544048e-06, "loss": 0.831, "step": 364 }, { "epoch": 0.01, "learning_rate": 2.8207109737248843e-06, "loss": 1.2707, "step": 365 }, { "epoch": 0.01, "learning_rate": 2.8284389489953634e-06, "loss": 1.4716, "step": 366 }, { "epoch": 0.01, "learning_rate": 2.8361669242658425e-06, "loss": 1.0358, "step": 367 }, { "epoch": 0.01, "learning_rate": 2.843894899536322e-06, "loss": 1.178, "step": 368 }, { "epoch": 0.01, "learning_rate": 2.8516228748068007e-06, "loss": 1.2869, "step": 369 }, { "epoch": 0.01, "learning_rate": 2.85935085007728e-06, "loss": 1.1426, "step": 370 }, { "epoch": 0.01, "learning_rate": 2.8670788253477593e-06, "loss": 1.3326, "step": 371 }, { "epoch": 0.01, "learning_rate": 2.8748068006182384e-06, "loss": 1.1517, "step": 372 }, { "epoch": 0.01, "learning_rate": 2.8825347758887175e-06, "loss": 1.214, "step": 373 }, { "epoch": 0.01, "learning_rate": 2.890262751159196e-06, "loss": 1.3438, "step": 374 }, { "epoch": 0.01, "learning_rate": 2.8979907264296757e-06, "loss": 1.2978, "step": 375 }, { "epoch": 0.01, "learning_rate": 2.905718701700155e-06, "loss": 1.2967, "step": 376 }, { "epoch": 0.01, "learning_rate": 2.913446676970634e-06, "loss": 1.2931, "step": 377 }, { "epoch": 0.01, "learning_rate": 2.9211746522411135e-06, "loss": 1.2915, "step": 378 }, { "epoch": 0.01, "learning_rate": 2.928902627511592e-06, "loss": 1.1122, "step": 379 }, { "epoch": 0.01, "learning_rate": 2.9366306027820713e-06, "loss": 1.1211, "step": 380 }, { "epoch": 0.01, "learning_rate": 2.9443585780525504e-06, "loss": 1.2955, "step": 381 }, { "epoch": 0.01, "learning_rate": 2.95208655332303e-06, "loss": 1.2128, "step": 382 }, { "epoch": 0.01, "learning_rate": 2.9598145285935086e-06, "loss": 1.0886, "step": 383 }, { "epoch": 0.01, "learning_rate": 2.9675425038639877e-06, "loss": 1.1348, "step": 384 }, { "epoch": 0.01, "learning_rate": 2.975270479134467e-06, "loss": 1.2923, "step": 385 }, { "epoch": 0.01, "learning_rate": 2.9829984544049463e-06, "loss": 1.1668, "step": 386 }, { "epoch": 0.01, "learning_rate": 2.990726429675425e-06, "loss": 1.0422, "step": 387 }, { "epoch": 0.01, "learning_rate": 2.9984544049459045e-06, "loss": 0.9646, "step": 388 }, { "epoch": 0.01, "learning_rate": 3.0061823802163836e-06, "loss": 1.181, "step": 389 }, { "epoch": 0.01, "learning_rate": 3.0139103554868627e-06, "loss": 1.0642, "step": 390 }, { "epoch": 0.01, "learning_rate": 3.0216383307573414e-06, "loss": 1.0061, "step": 391 }, { "epoch": 0.01, "learning_rate": 3.029366306027821e-06, "loss": 1.1424, "step": 392 }, { "epoch": 0.01, "learning_rate": 3.0370942812983e-06, "loss": 1.2735, "step": 393 }, { "epoch": 0.01, "learning_rate": 3.044822256568779e-06, "loss": 1.267, "step": 394 }, { "epoch": 0.01, "learning_rate": 3.0525502318392587e-06, "loss": 1.2057, "step": 395 }, { "epoch": 0.01, "learning_rate": 3.0602782071097378e-06, "loss": 1.2965, "step": 396 }, { "epoch": 0.01, "learning_rate": 3.0680061823802164e-06, "loss": 1.4145, "step": 397 }, { "epoch": 0.01, "learning_rate": 3.0757341576506955e-06, "loss": 1.1218, "step": 398 }, { "epoch": 0.01, "learning_rate": 3.083462132921175e-06, "loss": 0.9857, "step": 399 }, { "epoch": 0.01, "learning_rate": 3.091190108191654e-06, "loss": 1.03, "step": 400 }, { "epoch": 0.01, "learning_rate": 3.098918083462133e-06, "loss": 0.9238, "step": 401 }, { "epoch": 0.01, "learning_rate": 3.1066460587326124e-06, "loss": 1.1575, "step": 402 }, { "epoch": 0.01, "learning_rate": 3.1143740340030915e-06, "loss": 1.1131, "step": 403 }, { "epoch": 0.01, "learning_rate": 3.1221020092735706e-06, "loss": 1.2554, "step": 404 }, { "epoch": 0.01, "learning_rate": 3.12982998454405e-06, "loss": 1.0403, "step": 405 }, { "epoch": 0.01, "learning_rate": 3.137557959814529e-06, "loss": 1.161, "step": 406 }, { "epoch": 0.01, "learning_rate": 3.145285935085008e-06, "loss": 1.1336, "step": 407 }, { "epoch": 0.01, "learning_rate": 3.153013910355487e-06, "loss": 1.1143, "step": 408 }, { "epoch": 0.01, "learning_rate": 3.1607418856259665e-06, "loss": 1.1681, "step": 409 }, { "epoch": 0.01, "learning_rate": 3.1684698608964452e-06, "loss": 1.3419, "step": 410 }, { "epoch": 0.01, "learning_rate": 3.1761978361669243e-06, "loss": 1.0868, "step": 411 }, { "epoch": 0.01, "learning_rate": 3.183925811437404e-06, "loss": 1.2586, "step": 412 }, { "epoch": 0.01, "learning_rate": 3.191653786707883e-06, "loss": 1.2593, "step": 413 }, { "epoch": 0.01, "learning_rate": 3.1993817619783616e-06, "loss": 1.3095, "step": 414 }, { "epoch": 0.01, "learning_rate": 3.207109737248841e-06, "loss": 0.9798, "step": 415 }, { "epoch": 0.01, "learning_rate": 3.2148377125193203e-06, "loss": 1.2238, "step": 416 }, { "epoch": 0.01, "learning_rate": 3.2225656877897994e-06, "loss": 1.0106, "step": 417 }, { "epoch": 0.01, "learning_rate": 3.230293663060278e-06, "loss": 0.8064, "step": 418 }, { "epoch": 0.01, "learning_rate": 3.2380216383307576e-06, "loss": 1.1823, "step": 419 }, { "epoch": 0.01, "learning_rate": 3.2457496136012367e-06, "loss": 1.1955, "step": 420 }, { "epoch": 0.01, "learning_rate": 3.2534775888717158e-06, "loss": 1.0973, "step": 421 }, { "epoch": 0.01, "learning_rate": 3.2612055641421953e-06, "loss": 1.2272, "step": 422 }, { "epoch": 0.01, "learning_rate": 3.2689335394126744e-06, "loss": 1.1356, "step": 423 }, { "epoch": 0.01, "learning_rate": 3.276661514683153e-06, "loss": 1.3237, "step": 424 }, { "epoch": 0.01, "learning_rate": 3.284389489953632e-06, "loss": 1.1273, "step": 425 }, { "epoch": 0.01, "learning_rate": 3.2921174652241117e-06, "loss": 1.348, "step": 426 }, { "epoch": 0.01, "learning_rate": 3.299845440494591e-06, "loss": 1.1015, "step": 427 }, { "epoch": 0.01, "learning_rate": 3.3075734157650695e-06, "loss": 1.187, "step": 428 }, { "epoch": 0.01, "learning_rate": 3.315301391035549e-06, "loss": 1.2813, "step": 429 }, { "epoch": 0.01, "learning_rate": 3.323029366306028e-06, "loss": 1.2767, "step": 430 }, { "epoch": 0.01, "learning_rate": 3.3307573415765072e-06, "loss": 0.9732, "step": 431 }, { "epoch": 0.01, "learning_rate": 3.3384853168469868e-06, "loss": 1.0786, "step": 432 }, { "epoch": 0.01, "learning_rate": 3.3462132921174654e-06, "loss": 0.9004, "step": 433 }, { "epoch": 0.01, "learning_rate": 3.3539412673879445e-06, "loss": 1.2309, "step": 434 }, { "epoch": 0.01, "learning_rate": 3.3616692426584237e-06, "loss": 1.3644, "step": 435 }, { "epoch": 0.01, "learning_rate": 3.369397217928903e-06, "loss": 1.2982, "step": 436 }, { "epoch": 0.01, "learning_rate": 3.377125193199382e-06, "loss": 1.2028, "step": 437 }, { "epoch": 0.01, "learning_rate": 3.384853168469861e-06, "loss": 1.3364, "step": 438 }, { "epoch": 0.01, "learning_rate": 3.3925811437403405e-06, "loss": 1.2516, "step": 439 }, { "epoch": 0.01, "learning_rate": 3.4003091190108196e-06, "loss": 1.2797, "step": 440 }, { "epoch": 0.01, "learning_rate": 3.4080370942812983e-06, "loss": 1.0406, "step": 441 }, { "epoch": 0.01, "learning_rate": 3.4157650695517774e-06, "loss": 1.1972, "step": 442 }, { "epoch": 0.01, "learning_rate": 3.423493044822257e-06, "loss": 1.0979, "step": 443 }, { "epoch": 0.01, "learning_rate": 3.431221020092736e-06, "loss": 1.1361, "step": 444 }, { "epoch": 0.01, "learning_rate": 3.438948995363215e-06, "loss": 1.4631, "step": 445 }, { "epoch": 0.01, "learning_rate": 3.4466769706336946e-06, "loss": 0.9911, "step": 446 }, { "epoch": 0.01, "learning_rate": 3.4544049459041733e-06, "loss": 1.4177, "step": 447 }, { "epoch": 0.01, "learning_rate": 3.4621329211746524e-06, "loss": 0.9367, "step": 448 }, { "epoch": 0.01, "learning_rate": 3.469860896445132e-06, "loss": 1.16, "step": 449 }, { "epoch": 0.01, "learning_rate": 3.477588871715611e-06, "loss": 1.1971, "step": 450 }, { "epoch": 0.01, "learning_rate": 3.4853168469860897e-06, "loss": 1.1651, "step": 451 }, { "epoch": 0.01, "learning_rate": 3.493044822256569e-06, "loss": 1.034, "step": 452 }, { "epoch": 0.01, "learning_rate": 3.5007727975270484e-06, "loss": 1.2375, "step": 453 }, { "epoch": 0.01, "learning_rate": 3.5085007727975275e-06, "loss": 1.1981, "step": 454 }, { "epoch": 0.01, "learning_rate": 3.516228748068006e-06, "loss": 1.4013, "step": 455 }, { "epoch": 0.01, "learning_rate": 3.5239567233384857e-06, "loss": 1.2395, "step": 456 }, { "epoch": 0.01, "learning_rate": 3.5316846986089648e-06, "loss": 1.2208, "step": 457 }, { "epoch": 0.01, "learning_rate": 3.539412673879444e-06, "loss": 1.0931, "step": 458 }, { "epoch": 0.01, "learning_rate": 3.5471406491499234e-06, "loss": 1.1724, "step": 459 }, { "epoch": 0.01, "learning_rate": 3.554868624420402e-06, "loss": 0.9962, "step": 460 }, { "epoch": 0.01, "learning_rate": 3.562596599690881e-06, "loss": 1.1785, "step": 461 }, { "epoch": 0.01, "learning_rate": 3.5703245749613603e-06, "loss": 1.2976, "step": 462 }, { "epoch": 0.01, "learning_rate": 3.57805255023184e-06, "loss": 1.173, "step": 463 }, { "epoch": 0.01, "learning_rate": 3.5857805255023185e-06, "loss": 0.9907, "step": 464 }, { "epoch": 0.01, "learning_rate": 3.5935085007727976e-06, "loss": 1.2784, "step": 465 }, { "epoch": 0.01, "learning_rate": 3.601236476043277e-06, "loss": 1.0666, "step": 466 }, { "epoch": 0.01, "learning_rate": 3.6089644513137562e-06, "loss": 1.0321, "step": 467 }, { "epoch": 0.01, "learning_rate": 3.6166924265842353e-06, "loss": 1.2828, "step": 468 }, { "epoch": 0.01, "learning_rate": 3.624420401854714e-06, "loss": 1.1559, "step": 469 }, { "epoch": 0.01, "learning_rate": 3.6321483771251936e-06, "loss": 0.9794, "step": 470 }, { "epoch": 0.01, "learning_rate": 3.6398763523956727e-06, "loss": 1.2627, "step": 471 }, { "epoch": 0.01, "learning_rate": 3.6476043276661518e-06, "loss": 1.1954, "step": 472 }, { "epoch": 0.01, "learning_rate": 3.6553323029366313e-06, "loss": 0.9862, "step": 473 }, { "epoch": 0.01, "learning_rate": 3.66306027820711e-06, "loss": 1.2741, "step": 474 }, { "epoch": 0.01, "learning_rate": 3.670788253477589e-06, "loss": 1.0803, "step": 475 }, { "epoch": 0.01, "learning_rate": 3.6785162287480686e-06, "loss": 1.1513, "step": 476 }, { "epoch": 0.01, "learning_rate": 3.6862442040185477e-06, "loss": 1.2626, "step": 477 }, { "epoch": 0.01, "learning_rate": 3.6939721792890264e-06, "loss": 1.1324, "step": 478 }, { "epoch": 0.01, "learning_rate": 3.7017001545595055e-06, "loss": 1.269, "step": 479 }, { "epoch": 0.01, "learning_rate": 3.709428129829985e-06, "loss": 1.4412, "step": 480 }, { "epoch": 0.01, "learning_rate": 3.717156105100464e-06, "loss": 1.0391, "step": 481 }, { "epoch": 0.01, "learning_rate": 3.724884080370943e-06, "loss": 1.2362, "step": 482 }, { "epoch": 0.01, "learning_rate": 3.7326120556414223e-06, "loss": 1.3555, "step": 483 }, { "epoch": 0.01, "learning_rate": 3.7403400309119014e-06, "loss": 1.1124, "step": 484 }, { "epoch": 0.01, "learning_rate": 3.7480680061823805e-06, "loss": 1.1243, "step": 485 }, { "epoch": 0.01, "learning_rate": 3.755795981452859e-06, "loss": 1.2084, "step": 486 }, { "epoch": 0.01, "learning_rate": 3.7635239567233387e-06, "loss": 1.1857, "step": 487 }, { "epoch": 0.01, "learning_rate": 3.771251931993818e-06, "loss": 1.3521, "step": 488 }, { "epoch": 0.01, "learning_rate": 3.778979907264297e-06, "loss": 1.201, "step": 489 }, { "epoch": 0.01, "learning_rate": 3.7867078825347765e-06, "loss": 1.003, "step": 490 }, { "epoch": 0.01, "learning_rate": 3.794435857805255e-06, "loss": 1.0912, "step": 491 }, { "epoch": 0.01, "learning_rate": 3.8021638330757343e-06, "loss": 1.3112, "step": 492 }, { "epoch": 0.01, "learning_rate": 3.8098918083462138e-06, "loss": 1.1133, "step": 493 }, { "epoch": 0.01, "learning_rate": 3.8176197836166925e-06, "loss": 1.2222, "step": 494 }, { "epoch": 0.01, "learning_rate": 3.8253477588871716e-06, "loss": 1.0627, "step": 495 }, { "epoch": 0.01, "learning_rate": 3.833075734157651e-06, "loss": 1.1687, "step": 496 }, { "epoch": 0.01, "learning_rate": 3.840803709428131e-06, "loss": 1.3112, "step": 497 }, { "epoch": 0.01, "learning_rate": 3.848531684698609e-06, "loss": 1.165, "step": 498 }, { "epoch": 0.01, "learning_rate": 3.856259659969088e-06, "loss": 1.2613, "step": 499 }, { "epoch": 0.01, "learning_rate": 3.863987635239568e-06, "loss": 1.3281, "step": 500 }, { "epoch": 0.01, "learning_rate": 3.871715610510047e-06, "loss": 0.9355, "step": 501 }, { "epoch": 0.01, "learning_rate": 3.879443585780525e-06, "loss": 1.288, "step": 502 }, { "epoch": 0.01, "learning_rate": 3.887171561051004e-06, "loss": 1.1583, "step": 503 }, { "epoch": 0.01, "learning_rate": 3.894899536321484e-06, "loss": 1.4387, "step": 504 }, { "epoch": 0.01, "learning_rate": 3.9026275115919635e-06, "loss": 1.1613, "step": 505 }, { "epoch": 0.01, "learning_rate": 3.9103554868624426e-06, "loss": 1.2217, "step": 506 }, { "epoch": 0.01, "learning_rate": 3.918083462132922e-06, "loss": 0.9521, "step": 507 }, { "epoch": 0.01, "learning_rate": 3.925811437403401e-06, "loss": 1.1849, "step": 508 }, { "epoch": 0.01, "learning_rate": 3.93353941267388e-06, "loss": 0.9544, "step": 509 }, { "epoch": 0.01, "learning_rate": 3.941267387944359e-06, "loss": 1.0377, "step": 510 }, { "epoch": 0.01, "learning_rate": 3.948995363214838e-06, "loss": 1.2011, "step": 511 }, { "epoch": 0.01, "learning_rate": 3.956723338485317e-06, "loss": 0.7807, "step": 512 }, { "epoch": 0.01, "learning_rate": 3.964451313755796e-06, "loss": 1.3283, "step": 513 }, { "epoch": 0.01, "learning_rate": 3.972179289026275e-06, "loss": 1.2755, "step": 514 }, { "epoch": 0.01, "learning_rate": 3.9799072642967545e-06, "loss": 1.3062, "step": 515 }, { "epoch": 0.01, "learning_rate": 3.987635239567234e-06, "loss": 1.0843, "step": 516 }, { "epoch": 0.01, "learning_rate": 3.995363214837713e-06, "loss": 1.1723, "step": 517 }, { "epoch": 0.01, "learning_rate": 4.003091190108192e-06, "loss": 1.2218, "step": 518 }, { "epoch": 0.01, "learning_rate": 4.010819165378671e-06, "loss": 1.1524, "step": 519 }, { "epoch": 0.01, "learning_rate": 4.018547140649151e-06, "loss": 1.0157, "step": 520 }, { "epoch": 0.01, "learning_rate": 4.026275115919629e-06, "loss": 1.2449, "step": 521 }, { "epoch": 0.01, "learning_rate": 4.034003091190108e-06, "loss": 1.2647, "step": 522 }, { "epoch": 0.01, "learning_rate": 4.041731066460587e-06, "loss": 1.1297, "step": 523 }, { "epoch": 0.01, "learning_rate": 4.049459041731067e-06, "loss": 1.0968, "step": 524 }, { "epoch": 0.01, "learning_rate": 4.0571870170015455e-06, "loss": 0.9418, "step": 525 }, { "epoch": 0.01, "learning_rate": 4.064914992272025e-06, "loss": 1.0747, "step": 526 }, { "epoch": 0.01, "learning_rate": 4.072642967542505e-06, "loss": 1.015, "step": 527 }, { "epoch": 0.01, "learning_rate": 4.080370942812984e-06, "loss": 1.1308, "step": 528 }, { "epoch": 0.01, "learning_rate": 4.088098918083463e-06, "loss": 0.9755, "step": 529 }, { "epoch": 0.01, "learning_rate": 4.095826893353941e-06, "loss": 1.3236, "step": 530 }, { "epoch": 0.01, "learning_rate": 4.103554868624421e-06, "loss": 1.2814, "step": 531 }, { "epoch": 0.01, "learning_rate": 4.1112828438949e-06, "loss": 1.2181, "step": 532 }, { "epoch": 0.01, "learning_rate": 4.119010819165379e-06, "loss": 0.9872, "step": 533 }, { "epoch": 0.01, "learning_rate": 4.126738794435858e-06, "loss": 1.0472, "step": 534 }, { "epoch": 0.01, "learning_rate": 4.134466769706337e-06, "loss": 1.259, "step": 535 }, { "epoch": 0.01, "learning_rate": 4.1421947449768165e-06, "loss": 0.9202, "step": 536 }, { "epoch": 0.01, "learning_rate": 4.149922720247296e-06, "loss": 1.2436, "step": 537 }, { "epoch": 0.01, "learning_rate": 4.157650695517775e-06, "loss": 1.2164, "step": 538 }, { "epoch": 0.01, "learning_rate": 4.165378670788254e-06, "loss": 1.2529, "step": 539 }, { "epoch": 0.01, "learning_rate": 4.173106646058733e-06, "loss": 1.2817, "step": 540 }, { "epoch": 0.01, "learning_rate": 4.180834621329212e-06, "loss": 1.005, "step": 541 }, { "epoch": 0.01, "learning_rate": 4.188562596599691e-06, "loss": 0.9786, "step": 542 }, { "epoch": 0.01, "learning_rate": 4.19629057187017e-06, "loss": 1.5753, "step": 543 }, { "epoch": 0.01, "learning_rate": 4.204018547140649e-06, "loss": 1.0355, "step": 544 }, { "epoch": 0.01, "learning_rate": 4.2117465224111284e-06, "loss": 1.0384, "step": 545 }, { "epoch": 0.01, "learning_rate": 4.2194744976816075e-06, "loss": 1.2239, "step": 546 }, { "epoch": 0.01, "learning_rate": 4.227202472952087e-06, "loss": 1.2164, "step": 547 }, { "epoch": 0.01, "learning_rate": 4.234930448222566e-06, "loss": 1.1333, "step": 548 }, { "epoch": 0.01, "learning_rate": 4.242658423493045e-06, "loss": 1.3142, "step": 549 }, { "epoch": 0.01, "learning_rate": 4.250386398763524e-06, "loss": 1.0895, "step": 550 }, { "epoch": 0.01, "learning_rate": 4.258114374034004e-06, "loss": 1.0458, "step": 551 }, { "epoch": 0.01, "learning_rate": 4.265842349304483e-06, "loss": 1.235, "step": 552 }, { "epoch": 0.01, "learning_rate": 4.273570324574961e-06, "loss": 1.0799, "step": 553 }, { "epoch": 0.01, "learning_rate": 4.281298299845441e-06, "loss": 1.1324, "step": 554 }, { "epoch": 0.01, "learning_rate": 4.28902627511592e-06, "loss": 1.3718, "step": 555 }, { "epoch": 0.01, "learning_rate": 4.2967542503863994e-06, "loss": 1.0402, "step": 556 }, { "epoch": 0.01, "learning_rate": 4.304482225656878e-06, "loss": 1.2337, "step": 557 }, { "epoch": 0.01, "learning_rate": 4.312210200927358e-06, "loss": 1.2208, "step": 558 }, { "epoch": 0.01, "learning_rate": 4.319938176197837e-06, "loss": 1.2777, "step": 559 }, { "epoch": 0.01, "learning_rate": 4.327666151468316e-06, "loss": 0.917, "step": 560 }, { "epoch": 0.01, "learning_rate": 4.335394126738795e-06, "loss": 1.1228, "step": 561 }, { "epoch": 0.01, "learning_rate": 4.343122102009274e-06, "loss": 1.1711, "step": 562 }, { "epoch": 0.01, "learning_rate": 4.350850077279753e-06, "loss": 1.2368, "step": 563 }, { "epoch": 0.01, "learning_rate": 4.358578052550232e-06, "loss": 1.0033, "step": 564 }, { "epoch": 0.01, "learning_rate": 4.366306027820711e-06, "loss": 1.1545, "step": 565 }, { "epoch": 0.01, "learning_rate": 4.3740340030911905e-06, "loss": 1.0187, "step": 566 }, { "epoch": 0.01, "learning_rate": 4.3817619783616696e-06, "loss": 1.1098, "step": 567 }, { "epoch": 0.01, "learning_rate": 4.389489953632149e-06, "loss": 1.4235, "step": 568 }, { "epoch": 0.01, "learning_rate": 4.397217928902628e-06, "loss": 1.0846, "step": 569 }, { "epoch": 0.01, "learning_rate": 4.404945904173107e-06, "loss": 1.1894, "step": 570 }, { "epoch": 0.01, "learning_rate": 4.412673879443586e-06, "loss": 0.9525, "step": 571 }, { "epoch": 0.01, "learning_rate": 4.420401854714065e-06, "loss": 1.365, "step": 572 }, { "epoch": 0.01, "learning_rate": 4.428129829984544e-06, "loss": 1.2002, "step": 573 }, { "epoch": 0.01, "learning_rate": 4.435857805255023e-06, "loss": 1.3736, "step": 574 }, { "epoch": 0.01, "learning_rate": 4.443585780525502e-06, "loss": 1.1231, "step": 575 }, { "epoch": 0.01, "learning_rate": 4.4513137557959815e-06, "loss": 1.3374, "step": 576 }, { "epoch": 0.01, "learning_rate": 4.459041731066461e-06, "loss": 1.2426, "step": 577 }, { "epoch": 0.01, "learning_rate": 4.4667697063369406e-06, "loss": 0.9628, "step": 578 }, { "epoch": 0.01, "learning_rate": 4.47449768160742e-06, "loss": 1.0648, "step": 579 }, { "epoch": 0.01, "learning_rate": 4.482225656877898e-06, "loss": 1.0518, "step": 580 }, { "epoch": 0.01, "learning_rate": 4.489953632148378e-06, "loss": 1.0902, "step": 581 }, { "epoch": 0.01, "learning_rate": 4.497681607418857e-06, "loss": 1.4489, "step": 582 }, { "epoch": 0.01, "learning_rate": 4.505409582689336e-06, "loss": 1.1616, "step": 583 }, { "epoch": 0.01, "learning_rate": 4.513137557959814e-06, "loss": 1.0204, "step": 584 }, { "epoch": 0.01, "learning_rate": 4.520865533230294e-06, "loss": 1.1349, "step": 585 }, { "epoch": 0.01, "learning_rate": 4.528593508500773e-06, "loss": 1.0685, "step": 586 }, { "epoch": 0.01, "learning_rate": 4.5363214837712525e-06, "loss": 1.0321, "step": 587 }, { "epoch": 0.01, "learning_rate": 4.544049459041732e-06, "loss": 1.1874, "step": 588 }, { "epoch": 0.01, "learning_rate": 4.551777434312211e-06, "loss": 1.1442, "step": 589 }, { "epoch": 0.01, "learning_rate": 4.55950540958269e-06, "loss": 1.032, "step": 590 }, { "epoch": 0.01, "learning_rate": 4.567233384853169e-06, "loss": 1.0491, "step": 591 }, { "epoch": 0.01, "learning_rate": 4.574961360123648e-06, "loss": 1.1763, "step": 592 }, { "epoch": 0.01, "learning_rate": 4.582689335394127e-06, "loss": 1.111, "step": 593 }, { "epoch": 0.01, "learning_rate": 4.590417310664606e-06, "loss": 1.1227, "step": 594 }, { "epoch": 0.01, "learning_rate": 4.598145285935085e-06, "loss": 1.2225, "step": 595 }, { "epoch": 0.01, "learning_rate": 4.6058732612055644e-06, "loss": 1.2842, "step": 596 }, { "epoch": 0.01, "learning_rate": 4.6136012364760435e-06, "loss": 1.083, "step": 597 }, { "epoch": 0.01, "learning_rate": 4.621329211746523e-06, "loss": 1.2028, "step": 598 }, { "epoch": 0.01, "learning_rate": 4.629057187017002e-06, "loss": 1.3131, "step": 599 }, { "epoch": 0.01, "learning_rate": 4.636785162287481e-06, "loss": 1.0428, "step": 600 }, { "epoch": 0.01, "learning_rate": 4.64451313755796e-06, "loss": 1.0905, "step": 601 }, { "epoch": 0.01, "learning_rate": 4.65224111282844e-06, "loss": 1.3066, "step": 602 }, { "epoch": 0.01, "learning_rate": 4.659969088098918e-06, "loss": 1.1218, "step": 603 }, { "epoch": 0.01, "learning_rate": 4.667697063369397e-06, "loss": 1.0534, "step": 604 }, { "epoch": 0.01, "learning_rate": 4.675425038639877e-06, "loss": 1.3491, "step": 605 }, { "epoch": 0.01, "learning_rate": 4.683153013910356e-06, "loss": 0.9694, "step": 606 }, { "epoch": 0.01, "learning_rate": 4.6908809891808346e-06, "loss": 1.2585, "step": 607 }, { "epoch": 0.01, "learning_rate": 4.698608964451314e-06, "loss": 1.0402, "step": 608 }, { "epoch": 0.01, "learning_rate": 4.706336939721794e-06, "loss": 1.1586, "step": 609 }, { "epoch": 0.01, "learning_rate": 4.714064914992273e-06, "loss": 1.0391, "step": 610 }, { "epoch": 0.01, "learning_rate": 4.721792890262751e-06, "loss": 1.2653, "step": 611 }, { "epoch": 0.01, "learning_rate": 4.729520865533231e-06, "loss": 1.3555, "step": 612 }, { "epoch": 0.01, "learning_rate": 4.73724884080371e-06, "loss": 0.9979, "step": 613 }, { "epoch": 0.01, "learning_rate": 4.744976816074189e-06, "loss": 1.3617, "step": 614 }, { "epoch": 0.01, "learning_rate": 4.752704791344668e-06, "loss": 1.1649, "step": 615 }, { "epoch": 0.01, "learning_rate": 4.760432766615147e-06, "loss": 0.9393, "step": 616 }, { "epoch": 0.01, "learning_rate": 4.7681607418856265e-06, "loss": 1.1197, "step": 617 }, { "epoch": 0.01, "learning_rate": 4.7758887171561056e-06, "loss": 1.232, "step": 618 }, { "epoch": 0.01, "learning_rate": 4.783616692426585e-06, "loss": 1.2103, "step": 619 }, { "epoch": 0.01, "learning_rate": 4.791344667697064e-06, "loss": 0.938, "step": 620 }, { "epoch": 0.01, "learning_rate": 4.799072642967543e-06, "loss": 0.8926, "step": 621 }, { "epoch": 0.01, "learning_rate": 4.806800618238022e-06, "loss": 1.07, "step": 622 }, { "epoch": 0.01, "learning_rate": 4.814528593508501e-06, "loss": 1.2392, "step": 623 }, { "epoch": 0.01, "learning_rate": 4.82225656877898e-06, "loss": 1.2958, "step": 624 }, { "epoch": 0.01, "learning_rate": 4.82998454404946e-06, "loss": 0.8828, "step": 625 }, { "epoch": 0.01, "learning_rate": 4.837712519319938e-06, "loss": 1.2453, "step": 626 }, { "epoch": 0.01, "learning_rate": 4.8454404945904175e-06, "loss": 0.9983, "step": 627 }, { "epoch": 0.01, "learning_rate": 4.853168469860897e-06, "loss": 1.1146, "step": 628 }, { "epoch": 0.01, "learning_rate": 4.8608964451313765e-06, "loss": 1.3291, "step": 629 }, { "epoch": 0.01, "learning_rate": 4.868624420401855e-06, "loss": 1.1606, "step": 630 }, { "epoch": 0.01, "learning_rate": 4.876352395672334e-06, "loss": 1.3064, "step": 631 }, { "epoch": 0.01, "learning_rate": 4.884080370942814e-06, "loss": 1.0064, "step": 632 }, { "epoch": 0.01, "learning_rate": 4.891808346213293e-06, "loss": 1.2504, "step": 633 }, { "epoch": 0.01, "learning_rate": 4.899536321483771e-06, "loss": 1.21, "step": 634 }, { "epoch": 0.01, "learning_rate": 4.90726429675425e-06, "loss": 1.1414, "step": 635 }, { "epoch": 0.01, "learning_rate": 4.91499227202473e-06, "loss": 1.141, "step": 636 }, { "epoch": 0.01, "learning_rate": 4.922720247295209e-06, "loss": 1.2382, "step": 637 }, { "epoch": 0.01, "learning_rate": 4.930448222565688e-06, "loss": 1.1605, "step": 638 }, { "epoch": 0.01, "learning_rate": 4.938176197836168e-06, "loss": 1.2249, "step": 639 }, { "epoch": 0.01, "learning_rate": 4.945904173106647e-06, "loss": 1.0314, "step": 640 }, { "epoch": 0.01, "learning_rate": 4.953632148377126e-06, "loss": 1.1543, "step": 641 }, { "epoch": 0.01, "learning_rate": 4.961360123647605e-06, "loss": 1.2661, "step": 642 }, { "epoch": 0.01, "learning_rate": 4.969088098918084e-06, "loss": 0.8644, "step": 643 }, { "epoch": 0.01, "learning_rate": 4.976816074188563e-06, "loss": 1.2664, "step": 644 }, { "epoch": 0.01, "learning_rate": 4.984544049459042e-06, "loss": 1.0741, "step": 645 }, { "epoch": 0.01, "learning_rate": 4.992272024729521e-06, "loss": 1.2099, "step": 646 }, { "epoch": 0.02, "learning_rate": 5e-06, "loss": 1.1871, "step": 647 }, { "epoch": 0.02, "learning_rate": 5.0077279752704795e-06, "loss": 1.4221, "step": 648 }, { "epoch": 0.02, "learning_rate": 5.015455950540959e-06, "loss": 1.2522, "step": 649 }, { "epoch": 0.02, "learning_rate": 5.023183925811438e-06, "loss": 1.3309, "step": 650 }, { "epoch": 0.02, "learning_rate": 5.030911901081918e-06, "loss": 1.3977, "step": 651 }, { "epoch": 0.02, "learning_rate": 5.038639876352396e-06, "loss": 1.3258, "step": 652 }, { "epoch": 0.02, "learning_rate": 5.046367851622875e-06, "loss": 1.1793, "step": 653 }, { "epoch": 0.02, "learning_rate": 5.054095826893355e-06, "loss": 1.1084, "step": 654 }, { "epoch": 0.02, "learning_rate": 5.061823802163833e-06, "loss": 1.0061, "step": 655 }, { "epoch": 0.02, "learning_rate": 5.069551777434313e-06, "loss": 1.0781, "step": 656 }, { "epoch": 0.02, "learning_rate": 5.0772797527047914e-06, "loss": 1.1394, "step": 657 }, { "epoch": 0.02, "learning_rate": 5.0850077279752705e-06, "loss": 1.19, "step": 658 }, { "epoch": 0.02, "learning_rate": 5.0927357032457505e-06, "loss": 1.1168, "step": 659 }, { "epoch": 0.02, "learning_rate": 5.100463678516229e-06, "loss": 0.9153, "step": 660 }, { "epoch": 0.02, "learning_rate": 5.108191653786708e-06, "loss": 1.2749, "step": 661 }, { "epoch": 0.02, "learning_rate": 5.115919629057188e-06, "loss": 1.0398, "step": 662 }, { "epoch": 0.02, "learning_rate": 5.123647604327666e-06, "loss": 1.1782, "step": 663 }, { "epoch": 0.02, "learning_rate": 5.131375579598146e-06, "loss": 1.2248, "step": 664 }, { "epoch": 0.02, "learning_rate": 5.139103554868625e-06, "loss": 1.0177, "step": 665 }, { "epoch": 0.02, "learning_rate": 5.146831530139103e-06, "loss": 1.1872, "step": 666 }, { "epoch": 0.02, "learning_rate": 5.154559505409583e-06, "loss": 1.0639, "step": 667 }, { "epoch": 0.02, "learning_rate": 5.1622874806800624e-06, "loss": 1.205, "step": 668 }, { "epoch": 0.02, "learning_rate": 5.170015455950541e-06, "loss": 1.2139, "step": 669 }, { "epoch": 0.02, "learning_rate": 5.177743431221021e-06, "loss": 1.1227, "step": 670 }, { "epoch": 0.02, "learning_rate": 5.1854714064915e-06, "loss": 1.0538, "step": 671 }, { "epoch": 0.02, "learning_rate": 5.193199381761979e-06, "loss": 1.1649, "step": 672 }, { "epoch": 0.02, "learning_rate": 5.200927357032458e-06, "loss": 0.998, "step": 673 }, { "epoch": 0.02, "learning_rate": 5.208655332302936e-06, "loss": 0.9708, "step": 674 }, { "epoch": 0.02, "learning_rate": 5.216383307573416e-06, "loss": 1.0017, "step": 675 }, { "epoch": 0.02, "learning_rate": 5.224111282843895e-06, "loss": 0.9842, "step": 676 }, { "epoch": 0.02, "learning_rate": 5.231839258114374e-06, "loss": 1.1367, "step": 677 }, { "epoch": 0.02, "learning_rate": 5.2395672333848535e-06, "loss": 1.2371, "step": 678 }, { "epoch": 0.02, "learning_rate": 5.247295208655333e-06, "loss": 1.2402, "step": 679 }, { "epoch": 0.02, "learning_rate": 5.255023183925812e-06, "loss": 0.9942, "step": 680 }, { "epoch": 0.02, "learning_rate": 5.262751159196291e-06, "loss": 1.1088, "step": 681 }, { "epoch": 0.02, "learning_rate": 5.270479134466771e-06, "loss": 1.041, "step": 682 }, { "epoch": 0.02, "learning_rate": 5.278207109737249e-06, "loss": 1.1365, "step": 683 }, { "epoch": 0.02, "learning_rate": 5.285935085007728e-06, "loss": 1.2864, "step": 684 }, { "epoch": 0.02, "learning_rate": 5.293663060278208e-06, "loss": 1.2023, "step": 685 }, { "epoch": 0.02, "learning_rate": 5.301391035548686e-06, "loss": 1.3415, "step": 686 }, { "epoch": 0.02, "learning_rate": 5.309119010819166e-06, "loss": 0.8853, "step": 687 }, { "epoch": 0.02, "learning_rate": 5.316846986089645e-06, "loss": 1.8153, "step": 688 }, { "epoch": 0.02, "learning_rate": 5.324574961360124e-06, "loss": 0.9826, "step": 689 }, { "epoch": 0.02, "learning_rate": 5.3323029366306036e-06, "loss": 1.1378, "step": 690 }, { "epoch": 0.02, "learning_rate": 5.340030911901082e-06, "loss": 1.0378, "step": 691 }, { "epoch": 0.02, "learning_rate": 5.347758887171561e-06, "loss": 1.0699, "step": 692 }, { "epoch": 0.02, "learning_rate": 5.355486862442041e-06, "loss": 1.3665, "step": 693 }, { "epoch": 0.02, "learning_rate": 5.363214837712519e-06, "loss": 1.1092, "step": 694 }, { "epoch": 0.02, "learning_rate": 5.370942812982999e-06, "loss": 1.155, "step": 695 }, { "epoch": 0.02, "learning_rate": 5.378670788253478e-06, "loss": 0.9979, "step": 696 }, { "epoch": 0.02, "learning_rate": 5.3863987635239564e-06, "loss": 1.2828, "step": 697 }, { "epoch": 0.02, "learning_rate": 5.394126738794436e-06, "loss": 1.0717, "step": 698 }, { "epoch": 0.02, "learning_rate": 5.4018547140649155e-06, "loss": 1.1905, "step": 699 }, { "epoch": 0.02, "learning_rate": 5.409582689335395e-06, "loss": 1.3261, "step": 700 }, { "epoch": 0.02, "learning_rate": 5.417310664605874e-06, "loss": 1.1499, "step": 701 }, { "epoch": 0.02, "learning_rate": 5.425038639876354e-06, "loss": 1.274, "step": 702 }, { "epoch": 0.02, "learning_rate": 5.432766615146832e-06, "loss": 1.4245, "step": 703 }, { "epoch": 0.02, "learning_rate": 5.440494590417311e-06, "loss": 1.0003, "step": 704 }, { "epoch": 0.02, "learning_rate": 5.448222565687791e-06, "loss": 1.2356, "step": 705 }, { "epoch": 0.02, "learning_rate": 5.455950540958269e-06, "loss": 1.1903, "step": 706 }, { "epoch": 0.02, "learning_rate": 5.463678516228748e-06, "loss": 1.2715, "step": 707 }, { "epoch": 0.02, "learning_rate": 5.471406491499228e-06, "loss": 1.1163, "step": 708 }, { "epoch": 0.02, "learning_rate": 5.4791344667697065e-06, "loss": 1.2207, "step": 709 }, { "epoch": 0.02, "learning_rate": 5.4868624420401865e-06, "loss": 1.2961, "step": 710 }, { "epoch": 0.02, "learning_rate": 5.494590417310665e-06, "loss": 0.9202, "step": 711 }, { "epoch": 0.02, "learning_rate": 5.502318392581144e-06, "loss": 1.4097, "step": 712 }, { "epoch": 0.02, "learning_rate": 5.510046367851624e-06, "loss": 1.1324, "step": 713 }, { "epoch": 0.02, "learning_rate": 5.517774343122102e-06, "loss": 1.2417, "step": 714 }, { "epoch": 0.02, "learning_rate": 5.525502318392581e-06, "loss": 1.0759, "step": 715 }, { "epoch": 0.02, "learning_rate": 5.533230293663061e-06, "loss": 1.1602, "step": 716 }, { "epoch": 0.02, "learning_rate": 5.540958268933539e-06, "loss": 1.1312, "step": 717 }, { "epoch": 0.02, "learning_rate": 5.548686244204019e-06, "loss": 1.1927, "step": 718 }, { "epoch": 0.02, "learning_rate": 5.556414219474498e-06, "loss": 1.0959, "step": 719 }, { "epoch": 0.02, "learning_rate": 5.564142194744977e-06, "loss": 1.0006, "step": 720 }, { "epoch": 0.02, "learning_rate": 5.571870170015457e-06, "loss": 1.1552, "step": 721 }, { "epoch": 0.02, "learning_rate": 5.579598145285936e-06, "loss": 0.9206, "step": 722 }, { "epoch": 0.02, "learning_rate": 5.587326120556415e-06, "loss": 1.2022, "step": 723 }, { "epoch": 0.02, "learning_rate": 5.595054095826894e-06, "loss": 0.925, "step": 724 }, { "epoch": 0.02, "learning_rate": 5.602782071097374e-06, "loss": 0.95, "step": 725 }, { "epoch": 0.02, "learning_rate": 5.610510046367852e-06, "loss": 1.1383, "step": 726 }, { "epoch": 0.02, "learning_rate": 5.618238021638331e-06, "loss": 1.1511, "step": 727 }, { "epoch": 0.02, "learning_rate": 5.6259659969088095e-06, "loss": 0.9755, "step": 728 }, { "epoch": 0.02, "learning_rate": 5.6336939721792895e-06, "loss": 1.2559, "step": 729 }, { "epoch": 0.02, "learning_rate": 5.6414219474497686e-06, "loss": 1.2027, "step": 730 }, { "epoch": 0.02, "learning_rate": 5.649149922720248e-06, "loss": 1.1157, "step": 731 }, { "epoch": 0.02, "learning_rate": 5.656877897990727e-06, "loss": 1.3806, "step": 732 }, { "epoch": 0.02, "learning_rate": 5.664605873261207e-06, "loss": 1.0786, "step": 733 }, { "epoch": 0.02, "learning_rate": 5.672333848531685e-06, "loss": 1.1089, "step": 734 }, { "epoch": 0.02, "learning_rate": 5.680061823802164e-06, "loss": 1.009, "step": 735 }, { "epoch": 0.02, "learning_rate": 5.687789799072644e-06, "loss": 1.1608, "step": 736 }, { "epoch": 0.02, "learning_rate": 5.695517774343122e-06, "loss": 0.8519, "step": 737 }, { "epoch": 0.02, "learning_rate": 5.703245749613601e-06, "loss": 1.0237, "step": 738 }, { "epoch": 0.02, "learning_rate": 5.710973724884081e-06, "loss": 1.2175, "step": 739 }, { "epoch": 0.02, "learning_rate": 5.71870170015456e-06, "loss": 1.2962, "step": 740 }, { "epoch": 0.02, "learning_rate": 5.7264296754250395e-06, "loss": 0.9431, "step": 741 }, { "epoch": 0.02, "learning_rate": 5.734157650695519e-06, "loss": 1.5369, "step": 742 }, { "epoch": 0.02, "learning_rate": 5.741885625965997e-06, "loss": 1.1497, "step": 743 }, { "epoch": 0.02, "learning_rate": 5.749613601236477e-06, "loss": 0.9925, "step": 744 }, { "epoch": 0.02, "learning_rate": 5.757341576506955e-06, "loss": 1.1918, "step": 745 }, { "epoch": 0.02, "learning_rate": 5.765069551777435e-06, "loss": 1.0919, "step": 746 }, { "epoch": 0.02, "learning_rate": 5.772797527047914e-06, "loss": 1.3039, "step": 747 }, { "epoch": 0.02, "learning_rate": 5.780525502318392e-06, "loss": 1.1674, "step": 748 }, { "epoch": 0.02, "learning_rate": 5.788253477588872e-06, "loss": 1.1326, "step": 749 }, { "epoch": 0.02, "learning_rate": 5.7959814528593515e-06, "loss": 1.0138, "step": 750 }, { "epoch": 0.02, "learning_rate": 5.80370942812983e-06, "loss": 1.1973, "step": 751 }, { "epoch": 0.02, "learning_rate": 5.81143740340031e-06, "loss": 1.3026, "step": 752 }, { "epoch": 0.02, "learning_rate": 5.819165378670789e-06, "loss": 1.1618, "step": 753 }, { "epoch": 0.02, "learning_rate": 5.826893353941268e-06, "loss": 1.3148, "step": 754 }, { "epoch": 0.02, "learning_rate": 5.834621329211747e-06, "loss": 1.0925, "step": 755 }, { "epoch": 0.02, "learning_rate": 5.842349304482227e-06, "loss": 1.3101, "step": 756 }, { "epoch": 0.02, "learning_rate": 5.850077279752705e-06, "loss": 1.1173, "step": 757 }, { "epoch": 0.02, "learning_rate": 5.857805255023184e-06, "loss": 1.0077, "step": 758 }, { "epoch": 0.02, "learning_rate": 5.865533230293664e-06, "loss": 0.8705, "step": 759 }, { "epoch": 0.02, "learning_rate": 5.8732612055641425e-06, "loss": 0.8558, "step": 760 }, { "epoch": 0.02, "learning_rate": 5.880989180834622e-06, "loss": 0.9429, "step": 761 }, { "epoch": 0.02, "learning_rate": 5.888717156105101e-06, "loss": 1.0088, "step": 762 }, { "epoch": 0.02, "learning_rate": 5.89644513137558e-06, "loss": 1.3699, "step": 763 }, { "epoch": 0.02, "learning_rate": 5.90417310664606e-06, "loss": 1.3767, "step": 764 }, { "epoch": 0.02, "learning_rate": 5.911901081916538e-06, "loss": 0.9807, "step": 765 }, { "epoch": 0.02, "learning_rate": 5.919629057187017e-06, "loss": 1.1426, "step": 766 }, { "epoch": 0.02, "learning_rate": 5.927357032457497e-06, "loss": 1.0091, "step": 767 }, { "epoch": 0.02, "learning_rate": 5.935085007727975e-06, "loss": 1.1805, "step": 768 }, { "epoch": 0.02, "learning_rate": 5.942812982998455e-06, "loss": 1.214, "step": 769 }, { "epoch": 0.02, "learning_rate": 5.950540958268934e-06, "loss": 1.1283, "step": 770 }, { "epoch": 0.02, "learning_rate": 5.958268933539413e-06, "loss": 1.123, "step": 771 }, { "epoch": 0.02, "learning_rate": 5.965996908809893e-06, "loss": 1.1144, "step": 772 }, { "epoch": 0.02, "learning_rate": 5.973724884080372e-06, "loss": 1.1767, "step": 773 }, { "epoch": 0.02, "learning_rate": 5.98145285935085e-06, "loss": 1.3216, "step": 774 }, { "epoch": 0.02, "learning_rate": 5.98918083462133e-06, "loss": 1.3461, "step": 775 }, { "epoch": 0.02, "learning_rate": 5.996908809891809e-06, "loss": 1.1773, "step": 776 }, { "epoch": 0.02, "learning_rate": 6.004636785162288e-06, "loss": 1.2211, "step": 777 }, { "epoch": 0.02, "learning_rate": 6.012364760432767e-06, "loss": 1.1419, "step": 778 }, { "epoch": 0.02, "learning_rate": 6.0200927357032455e-06, "loss": 1.1338, "step": 779 }, { "epoch": 0.02, "learning_rate": 6.0278207109737254e-06, "loss": 1.2208, "step": 780 }, { "epoch": 0.02, "learning_rate": 6.0355486862442045e-06, "loss": 0.9854, "step": 781 }, { "epoch": 0.02, "learning_rate": 6.043276661514683e-06, "loss": 1.1029, "step": 782 }, { "epoch": 0.02, "learning_rate": 6.051004636785163e-06, "loss": 1.1511, "step": 783 }, { "epoch": 0.02, "learning_rate": 6.058732612055642e-06, "loss": 1.3313, "step": 784 }, { "epoch": 0.02, "learning_rate": 6.066460587326121e-06, "loss": 1.2616, "step": 785 }, { "epoch": 0.02, "learning_rate": 6.0741885625966e-06, "loss": 1.0601, "step": 786 }, { "epoch": 0.02, "learning_rate": 6.08191653786708e-06, "loss": 1.2552, "step": 787 }, { "epoch": 0.02, "learning_rate": 6.089644513137558e-06, "loss": 0.9217, "step": 788 }, { "epoch": 0.02, "learning_rate": 6.097372488408037e-06, "loss": 1.2576, "step": 789 }, { "epoch": 0.02, "learning_rate": 6.105100463678517e-06, "loss": 1.1031, "step": 790 }, { "epoch": 0.02, "learning_rate": 6.1128284389489956e-06, "loss": 0.9952, "step": 791 }, { "epoch": 0.02, "learning_rate": 6.1205564142194755e-06, "loss": 1.2166, "step": 792 }, { "epoch": 0.02, "learning_rate": 6.128284389489955e-06, "loss": 1.2142, "step": 793 }, { "epoch": 0.02, "learning_rate": 6.136012364760433e-06, "loss": 1.0768, "step": 794 }, { "epoch": 0.02, "learning_rate": 6.143740340030913e-06, "loss": 1.2747, "step": 795 }, { "epoch": 0.02, "learning_rate": 6.151468315301391e-06, "loss": 1.0338, "step": 796 }, { "epoch": 0.02, "learning_rate": 6.15919629057187e-06, "loss": 1.2376, "step": 797 }, { "epoch": 0.02, "learning_rate": 6.16692426584235e-06, "loss": 1.2247, "step": 798 }, { "epoch": 0.02, "learning_rate": 6.174652241112828e-06, "loss": 1.0606, "step": 799 }, { "epoch": 0.02, "learning_rate": 6.182380216383308e-06, "loss": 1.287, "step": 800 }, { "epoch": 0.02, "learning_rate": 6.1901081916537875e-06, "loss": 1.0173, "step": 801 }, { "epoch": 0.02, "learning_rate": 6.197836166924266e-06, "loss": 0.9228, "step": 802 }, { "epoch": 0.02, "learning_rate": 6.205564142194746e-06, "loss": 1.1079, "step": 803 }, { "epoch": 0.02, "learning_rate": 6.213292117465225e-06, "loss": 1.0007, "step": 804 }, { "epoch": 0.02, "learning_rate": 6.221020092735703e-06, "loss": 1.4111, "step": 805 }, { "epoch": 0.02, "learning_rate": 6.228748068006183e-06, "loss": 0.7658, "step": 806 }, { "epoch": 0.02, "learning_rate": 6.236476043276662e-06, "loss": 0.9952, "step": 807 }, { "epoch": 0.02, "learning_rate": 6.244204018547141e-06, "loss": 1.2259, "step": 808 }, { "epoch": 0.02, "learning_rate": 6.25193199381762e-06, "loss": 1.232, "step": 809 }, { "epoch": 0.02, "learning_rate": 6.2596599690881e-06, "loss": 1.1711, "step": 810 }, { "epoch": 0.02, "learning_rate": 6.2673879443585785e-06, "loss": 1.0974, "step": 811 }, { "epoch": 0.02, "learning_rate": 6.275115919629058e-06, "loss": 1.1619, "step": 812 }, { "epoch": 0.02, "learning_rate": 6.2828438948995375e-06, "loss": 1.0999, "step": 813 }, { "epoch": 0.02, "learning_rate": 6.290571870170016e-06, "loss": 1.0482, "step": 814 }, { "epoch": 0.02, "learning_rate": 6.298299845440495e-06, "loss": 1.1381, "step": 815 }, { "epoch": 0.02, "learning_rate": 6.306027820710974e-06, "loss": 0.9564, "step": 816 }, { "epoch": 0.02, "learning_rate": 6.313755795981453e-06, "loss": 0.9743, "step": 817 }, { "epoch": 0.02, "learning_rate": 6.321483771251933e-06, "loss": 1.124, "step": 818 }, { "epoch": 0.02, "learning_rate": 6.329211746522411e-06, "loss": 1.136, "step": 819 }, { "epoch": 0.02, "learning_rate": 6.3369397217928904e-06, "loss": 1.1954, "step": 820 }, { "epoch": 0.02, "learning_rate": 6.34466769706337e-06, "loss": 0.9512, "step": 821 }, { "epoch": 0.02, "learning_rate": 6.352395672333849e-06, "loss": 0.9855, "step": 822 }, { "epoch": 0.02, "learning_rate": 6.360123647604329e-06, "loss": 1.1584, "step": 823 }, { "epoch": 0.02, "learning_rate": 6.367851622874808e-06, "loss": 1.0068, "step": 824 }, { "epoch": 0.02, "learning_rate": 6.375579598145286e-06, "loss": 0.9829, "step": 825 }, { "epoch": 0.02, "learning_rate": 6.383307573415766e-06, "loss": 1.0822, "step": 826 }, { "epoch": 0.02, "learning_rate": 6.391035548686245e-06, "loss": 1.1328, "step": 827 }, { "epoch": 0.02, "learning_rate": 6.398763523956723e-06, "loss": 1.2716, "step": 828 }, { "epoch": 0.02, "learning_rate": 6.406491499227203e-06, "loss": 1.1243, "step": 829 }, { "epoch": 0.02, "learning_rate": 6.414219474497682e-06, "loss": 0.9721, "step": 830 }, { "epoch": 0.02, "learning_rate": 6.421947449768161e-06, "loss": 0.8508, "step": 831 }, { "epoch": 0.02, "learning_rate": 6.4296754250386405e-06, "loss": 1.2676, "step": 832 }, { "epoch": 0.02, "learning_rate": 6.437403400309119e-06, "loss": 1.1887, "step": 833 }, { "epoch": 0.02, "learning_rate": 6.445131375579599e-06, "loss": 1.0417, "step": 834 }, { "epoch": 0.02, "learning_rate": 6.452859350850078e-06, "loss": 1.121, "step": 835 }, { "epoch": 0.02, "learning_rate": 6.460587326120556e-06, "loss": 1.2673, "step": 836 }, { "epoch": 0.02, "learning_rate": 6.468315301391036e-06, "loss": 1.1835, "step": 837 }, { "epoch": 0.02, "learning_rate": 6.476043276661515e-06, "loss": 1.067, "step": 838 }, { "epoch": 0.02, "learning_rate": 6.483771251931994e-06, "loss": 1.1629, "step": 839 }, { "epoch": 0.02, "learning_rate": 6.491499227202473e-06, "loss": 1.1859, "step": 840 }, { "epoch": 0.02, "learning_rate": 6.499227202472953e-06, "loss": 1.1658, "step": 841 }, { "epoch": 0.02, "learning_rate": 6.5069551777434316e-06, "loss": 1.3013, "step": 842 }, { "epoch": 0.02, "learning_rate": 6.514683153013911e-06, "loss": 0.8524, "step": 843 }, { "epoch": 0.02, "learning_rate": 6.522411128284391e-06, "loss": 1.2654, "step": 844 }, { "epoch": 0.02, "learning_rate": 6.530139103554869e-06, "loss": 1.0333, "step": 845 }, { "epoch": 0.02, "learning_rate": 6.537867078825349e-06, "loss": 1.2584, "step": 846 }, { "epoch": 0.02, "learning_rate": 6.545595054095828e-06, "loss": 1.1146, "step": 847 }, { "epoch": 0.02, "learning_rate": 6.553323029366306e-06, "loss": 1.1369, "step": 848 }, { "epoch": 0.02, "learning_rate": 6.561051004636786e-06, "loss": 0.9704, "step": 849 }, { "epoch": 0.02, "learning_rate": 6.568778979907264e-06, "loss": 1.1749, "step": 850 }, { "epoch": 0.02, "learning_rate": 6.5765069551777435e-06, "loss": 1.1932, "step": 851 }, { "epoch": 0.02, "learning_rate": 6.5842349304482234e-06, "loss": 1.055, "step": 852 }, { "epoch": 0.02, "learning_rate": 6.591962905718702e-06, "loss": 1.1029, "step": 853 }, { "epoch": 0.02, "learning_rate": 6.599690880989182e-06, "loss": 1.218, "step": 854 }, { "epoch": 0.02, "learning_rate": 6.607418856259661e-06, "loss": 1.293, "step": 855 }, { "epoch": 0.02, "learning_rate": 6.615146831530139e-06, "loss": 0.9961, "step": 856 }, { "epoch": 0.02, "learning_rate": 6.622874806800619e-06, "loss": 1.2219, "step": 857 }, { "epoch": 0.02, "learning_rate": 6.630602782071098e-06, "loss": 1.5227, "step": 858 }, { "epoch": 0.02, "learning_rate": 6.638330757341576e-06, "loss": 1.0762, "step": 859 }, { "epoch": 0.02, "learning_rate": 6.646058732612056e-06, "loss": 1.0189, "step": 860 }, { "epoch": 0.02, "learning_rate": 6.653786707882535e-06, "loss": 0.9048, "step": 861 }, { "epoch": 0.02, "learning_rate": 6.6615146831530145e-06, "loss": 1.0988, "step": 862 }, { "epoch": 0.02, "learning_rate": 6.669242658423494e-06, "loss": 0.9126, "step": 863 }, { "epoch": 0.02, "learning_rate": 6.6769706336939735e-06, "loss": 1.2749, "step": 864 }, { "epoch": 0.02, "learning_rate": 6.684698608964452e-06, "loss": 1.2258, "step": 865 }, { "epoch": 0.02, "learning_rate": 6.692426584234931e-06, "loss": 1.0604, "step": 866 }, { "epoch": 0.02, "learning_rate": 6.70015455950541e-06, "loss": 1.1047, "step": 867 }, { "epoch": 0.02, "learning_rate": 6.707882534775889e-06, "loss": 1.0101, "step": 868 }, { "epoch": 0.02, "learning_rate": 6.715610510046369e-06, "loss": 1.1556, "step": 869 }, { "epoch": 0.02, "learning_rate": 6.723338485316847e-06, "loss": 1.3196, "step": 870 }, { "epoch": 0.02, "learning_rate": 6.731066460587326e-06, "loss": 1.1394, "step": 871 }, { "epoch": 0.02, "learning_rate": 6.738794435857806e-06, "loss": 0.9759, "step": 872 }, { "epoch": 0.02, "learning_rate": 6.746522411128285e-06, "loss": 0.8942, "step": 873 }, { "epoch": 0.02, "learning_rate": 6.754250386398764e-06, "loss": 1.306, "step": 874 }, { "epoch": 0.02, "learning_rate": 6.761978361669244e-06, "loss": 0.9357, "step": 875 }, { "epoch": 0.02, "learning_rate": 6.769706336939722e-06, "loss": 1.4899, "step": 876 }, { "epoch": 0.02, "learning_rate": 6.777434312210202e-06, "loss": 1.059, "step": 877 }, { "epoch": 0.02, "learning_rate": 6.785162287480681e-06, "loss": 1.4659, "step": 878 }, { "epoch": 0.02, "learning_rate": 6.792890262751159e-06, "loss": 1.461, "step": 879 }, { "epoch": 0.02, "learning_rate": 6.800618238021639e-06, "loss": 1.0882, "step": 880 }, { "epoch": 0.02, "learning_rate": 6.808346213292118e-06, "loss": 1.1598, "step": 881 }, { "epoch": 0.02, "learning_rate": 6.8160741885625965e-06, "loss": 1.4043, "step": 882 }, { "epoch": 0.02, "learning_rate": 6.8238021638330765e-06, "loss": 1.1661, "step": 883 }, { "epoch": 0.02, "learning_rate": 6.831530139103555e-06, "loss": 1.1141, "step": 884 }, { "epoch": 0.02, "learning_rate": 6.839258114374035e-06, "loss": 1.2302, "step": 885 }, { "epoch": 0.02, "learning_rate": 6.846986089644514e-06, "loss": 0.8824, "step": 886 }, { "epoch": 0.02, "learning_rate": 6.854714064914992e-06, "loss": 1.0002, "step": 887 }, { "epoch": 0.02, "learning_rate": 6.862442040185472e-06, "loss": 1.3123, "step": 888 }, { "epoch": 0.02, "learning_rate": 6.870170015455951e-06, "loss": 1.2184, "step": 889 }, { "epoch": 0.02, "learning_rate": 6.87789799072643e-06, "loss": 1.1237, "step": 890 }, { "epoch": 0.02, "learning_rate": 6.885625965996909e-06, "loss": 1.2855, "step": 891 }, { "epoch": 0.02, "learning_rate": 6.893353941267389e-06, "loss": 1.2834, "step": 892 }, { "epoch": 0.02, "learning_rate": 6.9010819165378675e-06, "loss": 0.9692, "step": 893 }, { "epoch": 0.02, "learning_rate": 6.908809891808347e-06, "loss": 1.3507, "step": 894 }, { "epoch": 0.02, "learning_rate": 6.916537867078827e-06, "loss": 1.1002, "step": 895 }, { "epoch": 0.02, "learning_rate": 6.924265842349305e-06, "loss": 1.4163, "step": 896 }, { "epoch": 0.02, "learning_rate": 6.931993817619784e-06, "loss": 1.1617, "step": 897 }, { "epoch": 0.02, "learning_rate": 6.939721792890264e-06, "loss": 1.2598, "step": 898 }, { "epoch": 0.02, "learning_rate": 6.947449768160742e-06, "loss": 1.07, "step": 899 }, { "epoch": 0.02, "learning_rate": 6.955177743431222e-06, "loss": 1.2333, "step": 900 }, { "epoch": 0.02, "learning_rate": 6.9629057187017e-06, "loss": 1.0764, "step": 901 }, { "epoch": 0.02, "learning_rate": 6.9706336939721795e-06, "loss": 1.2463, "step": 902 }, { "epoch": 0.02, "learning_rate": 6.978361669242659e-06, "loss": 1.2011, "step": 903 }, { "epoch": 0.02, "learning_rate": 6.986089644513138e-06, "loss": 1.0994, "step": 904 }, { "epoch": 0.02, "learning_rate": 6.993817619783617e-06, "loss": 0.9344, "step": 905 }, { "epoch": 0.02, "learning_rate": 7.001545595054097e-06, "loss": 1.2878, "step": 906 }, { "epoch": 0.02, "learning_rate": 7.009273570324575e-06, "loss": 1.4148, "step": 907 }, { "epoch": 0.02, "learning_rate": 7.017001545595055e-06, "loss": 1.1303, "step": 908 }, { "epoch": 0.02, "learning_rate": 7.024729520865534e-06, "loss": 1.1416, "step": 909 }, { "epoch": 0.02, "learning_rate": 7.032457496136012e-06, "loss": 0.8939, "step": 910 }, { "epoch": 0.02, "learning_rate": 7.040185471406492e-06, "loss": 1.0848, "step": 911 }, { "epoch": 0.02, "learning_rate": 7.047913446676971e-06, "loss": 0.986, "step": 912 }, { "epoch": 0.02, "learning_rate": 7.0556414219474505e-06, "loss": 1.0411, "step": 913 }, { "epoch": 0.02, "learning_rate": 7.0633693972179296e-06, "loss": 1.2312, "step": 914 }, { "epoch": 0.02, "learning_rate": 7.0710973724884095e-06, "loss": 1.1683, "step": 915 }, { "epoch": 0.02, "learning_rate": 7.078825347758888e-06, "loss": 1.0667, "step": 916 }, { "epoch": 0.02, "learning_rate": 7.086553323029367e-06, "loss": 1.3077, "step": 917 }, { "epoch": 0.02, "learning_rate": 7.094281298299847e-06, "loss": 0.9563, "step": 918 }, { "epoch": 0.02, "learning_rate": 7.102009273570325e-06, "loss": 0.8949, "step": 919 }, { "epoch": 0.02, "learning_rate": 7.109737248840804e-06, "loss": 1.3417, "step": 920 }, { "epoch": 0.02, "learning_rate": 7.117465224111283e-06, "loss": 1.5465, "step": 921 }, { "epoch": 0.02, "learning_rate": 7.125193199381762e-06, "loss": 0.9578, "step": 922 }, { "epoch": 0.02, "learning_rate": 7.132921174652242e-06, "loss": 1.0026, "step": 923 }, { "epoch": 0.02, "learning_rate": 7.140649149922721e-06, "loss": 1.2569, "step": 924 }, { "epoch": 0.02, "learning_rate": 7.1483771251932e-06, "loss": 1.0687, "step": 925 }, { "epoch": 0.02, "learning_rate": 7.15610510046368e-06, "loss": 0.9136, "step": 926 }, { "epoch": 0.02, "learning_rate": 7.163833075734158e-06, "loss": 1.1103, "step": 927 }, { "epoch": 0.02, "learning_rate": 7.171561051004637e-06, "loss": 1.2503, "step": 928 }, { "epoch": 0.02, "learning_rate": 7.179289026275117e-06, "loss": 1.0466, "step": 929 }, { "epoch": 0.02, "learning_rate": 7.187017001545595e-06, "loss": 1.1682, "step": 930 }, { "epoch": 0.02, "learning_rate": 7.194744976816075e-06, "loss": 1.3326, "step": 931 }, { "epoch": 0.02, "learning_rate": 7.202472952086554e-06, "loss": 1.2453, "step": 932 }, { "epoch": 0.02, "learning_rate": 7.2102009273570325e-06, "loss": 1.1808, "step": 933 }, { "epoch": 0.02, "learning_rate": 7.2179289026275125e-06, "loss": 1.3718, "step": 934 }, { "epoch": 0.02, "learning_rate": 7.225656877897992e-06, "loss": 0.8417, "step": 935 }, { "epoch": 0.02, "learning_rate": 7.233384853168471e-06, "loss": 1.3958, "step": 936 }, { "epoch": 0.02, "learning_rate": 7.24111282843895e-06, "loss": 1.1281, "step": 937 }, { "epoch": 0.02, "learning_rate": 7.248840803709428e-06, "loss": 1.3153, "step": 938 }, { "epoch": 0.02, "learning_rate": 7.256568778979908e-06, "loss": 1.0495, "step": 939 }, { "epoch": 0.02, "learning_rate": 7.264296754250387e-06, "loss": 1.0492, "step": 940 }, { "epoch": 0.02, "learning_rate": 7.272024729520865e-06, "loss": 1.1456, "step": 941 }, { "epoch": 0.02, "learning_rate": 7.279752704791345e-06, "loss": 1.1346, "step": 942 }, { "epoch": 0.02, "learning_rate": 7.287480680061824e-06, "loss": 1.0166, "step": 943 }, { "epoch": 0.02, "learning_rate": 7.2952086553323035e-06, "loss": 1.3642, "step": 944 }, { "epoch": 0.02, "learning_rate": 7.302936630602783e-06, "loss": 1.1136, "step": 945 }, { "epoch": 0.02, "learning_rate": 7.3106646058732626e-06, "loss": 1.3273, "step": 946 }, { "epoch": 0.02, "learning_rate": 7.318392581143741e-06, "loss": 1.2572, "step": 947 }, { "epoch": 0.02, "learning_rate": 7.32612055641422e-06, "loss": 1.1498, "step": 948 }, { "epoch": 0.02, "learning_rate": 7.3338485316847e-06, "loss": 1.2166, "step": 949 }, { "epoch": 0.02, "learning_rate": 7.341576506955178e-06, "loss": 1.1491, "step": 950 }, { "epoch": 0.02, "learning_rate": 7.349304482225657e-06, "loss": 1.209, "step": 951 }, { "epoch": 0.02, "learning_rate": 7.357032457496137e-06, "loss": 1.2842, "step": 952 }, { "epoch": 0.02, "learning_rate": 7.3647604327666155e-06, "loss": 1.2642, "step": 953 }, { "epoch": 0.02, "learning_rate": 7.372488408037095e-06, "loss": 1.0394, "step": 954 }, { "epoch": 0.02, "learning_rate": 7.380216383307574e-06, "loss": 1.168, "step": 955 }, { "epoch": 0.02, "learning_rate": 7.387944358578053e-06, "loss": 1.2363, "step": 956 }, { "epoch": 0.02, "learning_rate": 7.395672333848533e-06, "loss": 1.1516, "step": 957 }, { "epoch": 0.02, "learning_rate": 7.403400309119011e-06, "loss": 1.2069, "step": 958 }, { "epoch": 0.02, "learning_rate": 7.411128284389491e-06, "loss": 1.0339, "step": 959 }, { "epoch": 0.02, "learning_rate": 7.41885625965997e-06, "loss": 1.0375, "step": 960 }, { "epoch": 0.02, "learning_rate": 7.426584234930448e-06, "loss": 1.3527, "step": 961 }, { "epoch": 0.02, "learning_rate": 7.434312210200928e-06, "loss": 1.0197, "step": 962 }, { "epoch": 0.02, "learning_rate": 7.442040185471407e-06, "loss": 1.1899, "step": 963 }, { "epoch": 0.02, "learning_rate": 7.449768160741886e-06, "loss": 1.2364, "step": 964 }, { "epoch": 0.02, "learning_rate": 7.4574961360123655e-06, "loss": 1.0224, "step": 965 }, { "epoch": 0.02, "learning_rate": 7.465224111282845e-06, "loss": 0.8946, "step": 966 }, { "epoch": 0.02, "learning_rate": 7.472952086553324e-06, "loss": 1.257, "step": 967 }, { "epoch": 0.02, "learning_rate": 7.480680061823803e-06, "loss": 0.895, "step": 968 }, { "epoch": 0.02, "learning_rate": 7.488408037094283e-06, "loss": 0.9652, "step": 969 }, { "epoch": 0.02, "learning_rate": 7.496136012364761e-06, "loss": 1.3173, "step": 970 }, { "epoch": 0.02, "learning_rate": 7.50386398763524e-06, "loss": 0.8658, "step": 971 }, { "epoch": 0.02, "learning_rate": 7.511591962905718e-06, "loss": 1.1345, "step": 972 }, { "epoch": 0.02, "learning_rate": 7.519319938176198e-06, "loss": 1.3126, "step": 973 }, { "epoch": 0.02, "learning_rate": 7.5270479134466775e-06, "loss": 1.2117, "step": 974 }, { "epoch": 0.02, "learning_rate": 7.534775888717157e-06, "loss": 0.9829, "step": 975 }, { "epoch": 0.02, "learning_rate": 7.542503863987636e-06, "loss": 0.997, "step": 976 }, { "epoch": 0.02, "learning_rate": 7.550231839258116e-06, "loss": 1.112, "step": 977 }, { "epoch": 0.02, "learning_rate": 7.557959814528594e-06, "loss": 1.3173, "step": 978 }, { "epoch": 0.02, "learning_rate": 7.565687789799073e-06, "loss": 1.3632, "step": 979 }, { "epoch": 0.02, "learning_rate": 7.573415765069553e-06, "loss": 1.253, "step": 980 }, { "epoch": 0.02, "learning_rate": 7.581143740340031e-06, "loss": 1.0269, "step": 981 }, { "epoch": 0.02, "learning_rate": 7.58887171561051e-06, "loss": 1.0617, "step": 982 }, { "epoch": 0.02, "learning_rate": 7.59659969088099e-06, "loss": 0.9845, "step": 983 }, { "epoch": 0.02, "learning_rate": 7.6043276661514685e-06, "loss": 1.3333, "step": 984 }, { "epoch": 0.02, "learning_rate": 7.6120556414219485e-06, "loss": 1.0305, "step": 985 }, { "epoch": 0.02, "learning_rate": 7.6197836166924276e-06, "loss": 1.3094, "step": 986 }, { "epoch": 0.02, "learning_rate": 7.627511591962906e-06, "loss": 0.8436, "step": 987 }, { "epoch": 0.02, "learning_rate": 7.635239567233385e-06, "loss": 1.1735, "step": 988 }, { "epoch": 0.02, "learning_rate": 7.642967542503865e-06, "loss": 1.1471, "step": 989 }, { "epoch": 0.02, "learning_rate": 7.650695517774343e-06, "loss": 1.1378, "step": 990 }, { "epoch": 0.02, "learning_rate": 7.658423493044823e-06, "loss": 1.2581, "step": 991 }, { "epoch": 0.02, "learning_rate": 7.666151468315301e-06, "loss": 1.1895, "step": 992 }, { "epoch": 0.02, "learning_rate": 7.673879443585781e-06, "loss": 1.1322, "step": 993 }, { "epoch": 0.02, "learning_rate": 7.681607418856261e-06, "loss": 1.3157, "step": 994 }, { "epoch": 0.02, "learning_rate": 7.68933539412674e-06, "loss": 0.8466, "step": 995 }, { "epoch": 0.02, "learning_rate": 7.697063369397218e-06, "loss": 0.9927, "step": 996 }, { "epoch": 0.02, "learning_rate": 7.704791344667698e-06, "loss": 1.1604, "step": 997 }, { "epoch": 0.02, "learning_rate": 7.712519319938176e-06, "loss": 1.331, "step": 998 }, { "epoch": 0.02, "learning_rate": 7.720247295208656e-06, "loss": 0.9814, "step": 999 }, { "epoch": 0.02, "learning_rate": 7.727975270479136e-06, "loss": 0.9839, "step": 1000 }, { "epoch": 0.02, "learning_rate": 7.735703245749614e-06, "loss": 1.1022, "step": 1001 }, { "epoch": 0.02, "learning_rate": 7.743431221020094e-06, "loss": 1.0828, "step": 1002 }, { "epoch": 0.02, "learning_rate": 7.751159196290572e-06, "loss": 1.0863, "step": 1003 }, { "epoch": 0.02, "learning_rate": 7.75888717156105e-06, "loss": 0.9041, "step": 1004 }, { "epoch": 0.02, "learning_rate": 7.76661514683153e-06, "loss": 1.3117, "step": 1005 }, { "epoch": 0.02, "learning_rate": 7.774343122102009e-06, "loss": 1.1248, "step": 1006 }, { "epoch": 0.02, "learning_rate": 7.782071097372489e-06, "loss": 0.9446, "step": 1007 }, { "epoch": 0.02, "learning_rate": 7.789799072642969e-06, "loss": 1.1631, "step": 1008 }, { "epoch": 0.02, "learning_rate": 7.797527047913447e-06, "loss": 1.2258, "step": 1009 }, { "epoch": 0.02, "learning_rate": 7.805255023183927e-06, "loss": 1.084, "step": 1010 }, { "epoch": 0.02, "learning_rate": 7.812982998454405e-06, "loss": 1.3143, "step": 1011 }, { "epoch": 0.02, "learning_rate": 7.820710973724885e-06, "loss": 0.8999, "step": 1012 }, { "epoch": 0.02, "learning_rate": 7.828438948995363e-06, "loss": 1.0039, "step": 1013 }, { "epoch": 0.02, "learning_rate": 7.836166924265843e-06, "loss": 1.1825, "step": 1014 }, { "epoch": 0.02, "learning_rate": 7.843894899536322e-06, "loss": 1.0915, "step": 1015 }, { "epoch": 0.02, "learning_rate": 7.851622874806802e-06, "loss": 1.1006, "step": 1016 }, { "epoch": 0.02, "learning_rate": 7.859350850077281e-06, "loss": 1.1945, "step": 1017 }, { "epoch": 0.02, "learning_rate": 7.86707882534776e-06, "loss": 1.2009, "step": 1018 }, { "epoch": 0.02, "learning_rate": 7.874806800618238e-06, "loss": 1.2984, "step": 1019 }, { "epoch": 0.02, "learning_rate": 7.882534775888718e-06, "loss": 1.1222, "step": 1020 }, { "epoch": 0.02, "learning_rate": 7.890262751159196e-06, "loss": 1.0052, "step": 1021 }, { "epoch": 0.02, "learning_rate": 7.897990726429676e-06, "loss": 1.3726, "step": 1022 }, { "epoch": 0.02, "learning_rate": 7.905718701700154e-06, "loss": 1.2399, "step": 1023 }, { "epoch": 0.02, "learning_rate": 7.913446676970634e-06, "loss": 0.9956, "step": 1024 }, { "epoch": 0.02, "learning_rate": 7.921174652241114e-06, "loss": 1.2231, "step": 1025 }, { "epoch": 0.02, "learning_rate": 7.928902627511593e-06, "loss": 1.4499, "step": 1026 }, { "epoch": 0.02, "learning_rate": 7.93663060278207e-06, "loss": 1.0061, "step": 1027 }, { "epoch": 0.02, "learning_rate": 7.94435857805255e-06, "loss": 1.0103, "step": 1028 }, { "epoch": 0.02, "learning_rate": 7.952086553323029e-06, "loss": 1.058, "step": 1029 }, { "epoch": 0.02, "learning_rate": 7.959814528593509e-06, "loss": 1.3292, "step": 1030 }, { "epoch": 0.02, "learning_rate": 7.967542503863989e-06, "loss": 1.282, "step": 1031 }, { "epoch": 0.02, "learning_rate": 7.975270479134467e-06, "loss": 1.2651, "step": 1032 }, { "epoch": 0.02, "learning_rate": 7.982998454404947e-06, "loss": 1.1779, "step": 1033 }, { "epoch": 0.02, "learning_rate": 7.990726429675425e-06, "loss": 1.054, "step": 1034 }, { "epoch": 0.02, "learning_rate": 7.998454404945905e-06, "loss": 1.4005, "step": 1035 }, { "epoch": 0.02, "learning_rate": 8.006182380216384e-06, "loss": 1.2898, "step": 1036 }, { "epoch": 0.02, "learning_rate": 8.013910355486864e-06, "loss": 1.2089, "step": 1037 }, { "epoch": 0.02, "learning_rate": 8.021638330757342e-06, "loss": 1.1573, "step": 1038 }, { "epoch": 0.02, "learning_rate": 8.029366306027822e-06, "loss": 1.4102, "step": 1039 }, { "epoch": 0.02, "learning_rate": 8.037094281298302e-06, "loss": 1.307, "step": 1040 }, { "epoch": 0.02, "learning_rate": 8.04482225656878e-06, "loss": 1.3003, "step": 1041 }, { "epoch": 0.02, "learning_rate": 8.052550231839258e-06, "loss": 1.13, "step": 1042 }, { "epoch": 0.02, "learning_rate": 8.060278207109738e-06, "loss": 1.3561, "step": 1043 }, { "epoch": 0.02, "learning_rate": 8.068006182380216e-06, "loss": 1.2739, "step": 1044 }, { "epoch": 0.02, "learning_rate": 8.075734157650696e-06, "loss": 1.1484, "step": 1045 }, { "epoch": 0.02, "learning_rate": 8.083462132921175e-06, "loss": 1.1848, "step": 1046 }, { "epoch": 0.02, "learning_rate": 8.091190108191655e-06, "loss": 1.1933, "step": 1047 }, { "epoch": 0.02, "learning_rate": 8.098918083462135e-06, "loss": 1.2266, "step": 1048 }, { "epoch": 0.02, "learning_rate": 8.106646058732613e-06, "loss": 1.2933, "step": 1049 }, { "epoch": 0.02, "learning_rate": 8.114374034003091e-06, "loss": 1.1083, "step": 1050 }, { "epoch": 0.02, "learning_rate": 8.122102009273571e-06, "loss": 1.0911, "step": 1051 }, { "epoch": 0.02, "learning_rate": 8.12982998454405e-06, "loss": 1.2906, "step": 1052 }, { "epoch": 0.02, "learning_rate": 8.13755795981453e-06, "loss": 0.9633, "step": 1053 }, { "epoch": 0.02, "learning_rate": 8.14528593508501e-06, "loss": 1.2617, "step": 1054 }, { "epoch": 0.02, "learning_rate": 8.153013910355487e-06, "loss": 1.014, "step": 1055 }, { "epoch": 0.02, "learning_rate": 8.160741885625967e-06, "loss": 1.0224, "step": 1056 }, { "epoch": 0.02, "learning_rate": 8.168469860896446e-06, "loss": 1.056, "step": 1057 }, { "epoch": 0.02, "learning_rate": 8.176197836166926e-06, "loss": 1.0978, "step": 1058 }, { "epoch": 0.02, "learning_rate": 8.183925811437404e-06, "loss": 1.1689, "step": 1059 }, { "epoch": 0.02, "learning_rate": 8.191653786707882e-06, "loss": 1.0927, "step": 1060 }, { "epoch": 0.02, "learning_rate": 8.199381761978362e-06, "loss": 1.1853, "step": 1061 }, { "epoch": 0.02, "learning_rate": 8.207109737248842e-06, "loss": 1.4396, "step": 1062 }, { "epoch": 0.02, "learning_rate": 8.21483771251932e-06, "loss": 1.0887, "step": 1063 }, { "epoch": 0.02, "learning_rate": 8.2225656877898e-06, "loss": 1.1303, "step": 1064 }, { "epoch": 0.02, "learning_rate": 8.230293663060278e-06, "loss": 1.1609, "step": 1065 }, { "epoch": 0.02, "learning_rate": 8.238021638330758e-06, "loss": 1.1039, "step": 1066 }, { "epoch": 0.02, "learning_rate": 8.245749613601237e-06, "loss": 1.0608, "step": 1067 }, { "epoch": 0.02, "learning_rate": 8.253477588871717e-06, "loss": 1.2398, "step": 1068 }, { "epoch": 0.02, "learning_rate": 8.261205564142195e-06, "loss": 1.3451, "step": 1069 }, { "epoch": 0.02, "learning_rate": 8.268933539412675e-06, "loss": 1.259, "step": 1070 }, { "epoch": 0.02, "learning_rate": 8.276661514683155e-06, "loss": 1.2839, "step": 1071 }, { "epoch": 0.02, "learning_rate": 8.284389489953633e-06, "loss": 1.1741, "step": 1072 }, { "epoch": 0.02, "learning_rate": 8.292117465224111e-06, "loss": 1.2571, "step": 1073 }, { "epoch": 0.02, "learning_rate": 8.299845440494591e-06, "loss": 1.293, "step": 1074 }, { "epoch": 0.02, "learning_rate": 8.30757341576507e-06, "loss": 0.9594, "step": 1075 }, { "epoch": 0.02, "learning_rate": 8.31530139103555e-06, "loss": 1.1868, "step": 1076 }, { "epoch": 0.02, "learning_rate": 8.323029366306028e-06, "loss": 1.2346, "step": 1077 }, { "epoch": 0.03, "learning_rate": 8.330757341576508e-06, "loss": 1.2177, "step": 1078 }, { "epoch": 0.03, "learning_rate": 8.338485316846988e-06, "loss": 1.0769, "step": 1079 }, { "epoch": 0.03, "learning_rate": 8.346213292117466e-06, "loss": 1.0848, "step": 1080 }, { "epoch": 0.03, "learning_rate": 8.353941267387946e-06, "loss": 1.0905, "step": 1081 }, { "epoch": 0.03, "learning_rate": 8.361669242658424e-06, "loss": 0.8525, "step": 1082 }, { "epoch": 0.03, "learning_rate": 8.369397217928902e-06, "loss": 1.1611, "step": 1083 }, { "epoch": 0.03, "learning_rate": 8.377125193199382e-06, "loss": 1.2146, "step": 1084 }, { "epoch": 0.03, "learning_rate": 8.384853168469862e-06, "loss": 1.029, "step": 1085 }, { "epoch": 0.03, "learning_rate": 8.39258114374034e-06, "loss": 1.2631, "step": 1086 }, { "epoch": 0.03, "learning_rate": 8.40030911901082e-06, "loss": 1.354, "step": 1087 }, { "epoch": 0.03, "learning_rate": 8.408037094281299e-06, "loss": 1.0036, "step": 1088 }, { "epoch": 0.03, "learning_rate": 8.415765069551779e-06, "loss": 1.1195, "step": 1089 }, { "epoch": 0.03, "learning_rate": 8.423493044822257e-06, "loss": 1.1021, "step": 1090 }, { "epoch": 0.03, "learning_rate": 8.431221020092737e-06, "loss": 1.0324, "step": 1091 }, { "epoch": 0.03, "learning_rate": 8.438948995363215e-06, "loss": 1.2383, "step": 1092 }, { "epoch": 0.03, "learning_rate": 8.446676970633695e-06, "loss": 1.0486, "step": 1093 }, { "epoch": 0.03, "learning_rate": 8.454404945904173e-06, "loss": 1.0238, "step": 1094 }, { "epoch": 0.03, "learning_rate": 8.462132921174653e-06, "loss": 1.0347, "step": 1095 }, { "epoch": 0.03, "learning_rate": 8.469860896445132e-06, "loss": 1.0331, "step": 1096 }, { "epoch": 0.03, "learning_rate": 8.477588871715611e-06, "loss": 1.1364, "step": 1097 }, { "epoch": 0.03, "learning_rate": 8.48531684698609e-06, "loss": 1.1818, "step": 1098 }, { "epoch": 0.03, "learning_rate": 8.49304482225657e-06, "loss": 0.9931, "step": 1099 }, { "epoch": 0.03, "learning_rate": 8.500772797527048e-06, "loss": 0.9524, "step": 1100 }, { "epoch": 0.03, "learning_rate": 8.508500772797528e-06, "loss": 0.9918, "step": 1101 }, { "epoch": 0.03, "learning_rate": 8.516228748068008e-06, "loss": 1.2946, "step": 1102 }, { "epoch": 0.03, "learning_rate": 8.523956723338486e-06, "loss": 1.0061, "step": 1103 }, { "epoch": 0.03, "learning_rate": 8.531684698608966e-06, "loss": 1.1566, "step": 1104 }, { "epoch": 0.03, "learning_rate": 8.539412673879444e-06, "loss": 1.0939, "step": 1105 }, { "epoch": 0.03, "learning_rate": 8.547140649149923e-06, "loss": 1.3909, "step": 1106 }, { "epoch": 0.03, "learning_rate": 8.554868624420403e-06, "loss": 0.9455, "step": 1107 }, { "epoch": 0.03, "learning_rate": 8.562596599690882e-06, "loss": 1.2982, "step": 1108 }, { "epoch": 0.03, "learning_rate": 8.57032457496136e-06, "loss": 1.4786, "step": 1109 }, { "epoch": 0.03, "learning_rate": 8.57805255023184e-06, "loss": 1.0222, "step": 1110 }, { "epoch": 0.03, "learning_rate": 8.585780525502319e-06, "loss": 1.4041, "step": 1111 }, { "epoch": 0.03, "learning_rate": 8.593508500772799e-06, "loss": 1.0573, "step": 1112 }, { "epoch": 0.03, "learning_rate": 8.601236476043277e-06, "loss": 1.0268, "step": 1113 }, { "epoch": 0.03, "learning_rate": 8.608964451313755e-06, "loss": 0.9781, "step": 1114 }, { "epoch": 0.03, "learning_rate": 8.616692426584235e-06, "loss": 1.03, "step": 1115 }, { "epoch": 0.03, "learning_rate": 8.624420401854715e-06, "loss": 1.0076, "step": 1116 }, { "epoch": 0.03, "learning_rate": 8.632148377125194e-06, "loss": 1.0558, "step": 1117 }, { "epoch": 0.03, "learning_rate": 8.639876352395673e-06, "loss": 1.0944, "step": 1118 }, { "epoch": 0.03, "learning_rate": 8.647604327666152e-06, "loss": 1.0792, "step": 1119 }, { "epoch": 0.03, "learning_rate": 8.655332302936632e-06, "loss": 1.2158, "step": 1120 }, { "epoch": 0.03, "learning_rate": 8.66306027820711e-06, "loss": 0.949, "step": 1121 }, { "epoch": 0.03, "learning_rate": 8.67078825347759e-06, "loss": 0.7596, "step": 1122 }, { "epoch": 0.03, "learning_rate": 8.678516228748068e-06, "loss": 1.2953, "step": 1123 }, { "epoch": 0.03, "learning_rate": 8.686244204018548e-06, "loss": 1.1104, "step": 1124 }, { "epoch": 0.03, "learning_rate": 8.693972179289028e-06, "loss": 0.9958, "step": 1125 }, { "epoch": 0.03, "learning_rate": 8.701700154559506e-06, "loss": 1.0414, "step": 1126 }, { "epoch": 0.03, "learning_rate": 8.709428129829986e-06, "loss": 0.8804, "step": 1127 }, { "epoch": 0.03, "learning_rate": 8.717156105100465e-06, "loss": 1.1219, "step": 1128 }, { "epoch": 0.03, "learning_rate": 8.724884080370943e-06, "loss": 1.1508, "step": 1129 }, { "epoch": 0.03, "learning_rate": 8.732612055641423e-06, "loss": 1.2654, "step": 1130 }, { "epoch": 0.03, "learning_rate": 8.740340030911901e-06, "loss": 1.0041, "step": 1131 }, { "epoch": 0.03, "learning_rate": 8.748068006182381e-06, "loss": 1.2563, "step": 1132 }, { "epoch": 0.03, "learning_rate": 8.755795981452861e-06, "loss": 1.2246, "step": 1133 }, { "epoch": 0.03, "learning_rate": 8.763523956723339e-06, "loss": 1.2602, "step": 1134 }, { "epoch": 0.03, "learning_rate": 8.771251931993819e-06, "loss": 1.3393, "step": 1135 }, { "epoch": 0.03, "learning_rate": 8.778979907264297e-06, "loss": 1.1584, "step": 1136 }, { "epoch": 0.03, "learning_rate": 8.786707882534776e-06, "loss": 1.4226, "step": 1137 }, { "epoch": 0.03, "learning_rate": 8.794435857805256e-06, "loss": 1.2256, "step": 1138 }, { "epoch": 0.03, "learning_rate": 8.802163833075736e-06, "loss": 1.3067, "step": 1139 }, { "epoch": 0.03, "learning_rate": 8.809891808346214e-06, "loss": 1.0477, "step": 1140 }, { "epoch": 0.03, "learning_rate": 8.817619783616694e-06, "loss": 1.061, "step": 1141 }, { "epoch": 0.03, "learning_rate": 8.825347758887172e-06, "loss": 1.159, "step": 1142 }, { "epoch": 0.03, "learning_rate": 8.833075734157652e-06, "loss": 1.2684, "step": 1143 }, { "epoch": 0.03, "learning_rate": 8.84080370942813e-06, "loss": 1.0198, "step": 1144 }, { "epoch": 0.03, "learning_rate": 8.84853168469861e-06, "loss": 1.2654, "step": 1145 }, { "epoch": 0.03, "learning_rate": 8.856259659969088e-06, "loss": 1.0586, "step": 1146 }, { "epoch": 0.03, "learning_rate": 8.863987635239568e-06, "loss": 0.9971, "step": 1147 }, { "epoch": 0.03, "learning_rate": 8.871715610510047e-06, "loss": 1.0816, "step": 1148 }, { "epoch": 0.03, "learning_rate": 8.879443585780527e-06, "loss": 1.2587, "step": 1149 }, { "epoch": 0.03, "learning_rate": 8.887171561051005e-06, "loss": 1.2041, "step": 1150 }, { "epoch": 0.03, "learning_rate": 8.894899536321485e-06, "loss": 1.0223, "step": 1151 }, { "epoch": 0.03, "learning_rate": 8.902627511591963e-06, "loss": 1.3152, "step": 1152 }, { "epoch": 0.03, "learning_rate": 8.910355486862443e-06, "loss": 0.9704, "step": 1153 }, { "epoch": 0.03, "learning_rate": 8.918083462132921e-06, "loss": 1.2736, "step": 1154 }, { "epoch": 0.03, "learning_rate": 8.925811437403401e-06, "loss": 1.0597, "step": 1155 }, { "epoch": 0.03, "learning_rate": 8.933539412673881e-06, "loss": 1.3982, "step": 1156 }, { "epoch": 0.03, "learning_rate": 8.94126738794436e-06, "loss": 1.1889, "step": 1157 }, { "epoch": 0.03, "learning_rate": 8.94899536321484e-06, "loss": 1.0898, "step": 1158 }, { "epoch": 0.03, "learning_rate": 8.956723338485318e-06, "loss": 1.1882, "step": 1159 }, { "epoch": 0.03, "learning_rate": 8.964451313755796e-06, "loss": 0.995, "step": 1160 }, { "epoch": 0.03, "learning_rate": 8.972179289026276e-06, "loss": 1.0228, "step": 1161 }, { "epoch": 0.03, "learning_rate": 8.979907264296756e-06, "loss": 1.2639, "step": 1162 }, { "epoch": 0.03, "learning_rate": 8.987635239567234e-06, "loss": 1.2225, "step": 1163 }, { "epoch": 0.03, "learning_rate": 8.995363214837714e-06, "loss": 1.1884, "step": 1164 }, { "epoch": 0.03, "learning_rate": 9.003091190108192e-06, "loss": 1.3759, "step": 1165 }, { "epoch": 0.03, "learning_rate": 9.010819165378672e-06, "loss": 1.0947, "step": 1166 }, { "epoch": 0.03, "learning_rate": 9.01854714064915e-06, "loss": 1.2494, "step": 1167 }, { "epoch": 0.03, "learning_rate": 9.026275115919629e-06, "loss": 1.2636, "step": 1168 }, { "epoch": 0.03, "learning_rate": 9.034003091190109e-06, "loss": 1.1304, "step": 1169 }, { "epoch": 0.03, "learning_rate": 9.041731066460589e-06, "loss": 1.0363, "step": 1170 }, { "epoch": 0.03, "learning_rate": 9.049459041731067e-06, "loss": 1.2116, "step": 1171 }, { "epoch": 0.03, "learning_rate": 9.057187017001547e-06, "loss": 1.2419, "step": 1172 }, { "epoch": 0.03, "learning_rate": 9.064914992272025e-06, "loss": 1.0545, "step": 1173 }, { "epoch": 0.03, "learning_rate": 9.072642967542505e-06, "loss": 1.139, "step": 1174 }, { "epoch": 0.03, "learning_rate": 9.080370942812983e-06, "loss": 1.2149, "step": 1175 }, { "epoch": 0.03, "learning_rate": 9.088098918083463e-06, "loss": 1.2842, "step": 1176 }, { "epoch": 0.03, "learning_rate": 9.095826893353941e-06, "loss": 1.1651, "step": 1177 }, { "epoch": 0.03, "learning_rate": 9.103554868624421e-06, "loss": 1.0238, "step": 1178 }, { "epoch": 0.03, "learning_rate": 9.111282843894901e-06, "loss": 1.2224, "step": 1179 }, { "epoch": 0.03, "learning_rate": 9.11901081916538e-06, "loss": 0.96, "step": 1180 }, { "epoch": 0.03, "learning_rate": 9.12673879443586e-06, "loss": 1.1486, "step": 1181 }, { "epoch": 0.03, "learning_rate": 9.134466769706338e-06, "loss": 1.3025, "step": 1182 }, { "epoch": 0.03, "learning_rate": 9.142194744976816e-06, "loss": 1.0598, "step": 1183 }, { "epoch": 0.03, "learning_rate": 9.149922720247296e-06, "loss": 1.3456, "step": 1184 }, { "epoch": 0.03, "learning_rate": 9.157650695517774e-06, "loss": 1.0218, "step": 1185 }, { "epoch": 0.03, "learning_rate": 9.165378670788254e-06, "loss": 1.1684, "step": 1186 }, { "epoch": 0.03, "learning_rate": 9.173106646058734e-06, "loss": 1.047, "step": 1187 }, { "epoch": 0.03, "learning_rate": 9.180834621329212e-06, "loss": 1.1349, "step": 1188 }, { "epoch": 0.03, "learning_rate": 9.188562596599692e-06, "loss": 1.1506, "step": 1189 }, { "epoch": 0.03, "learning_rate": 9.19629057187017e-06, "loss": 1.2678, "step": 1190 }, { "epoch": 0.03, "learning_rate": 9.204018547140649e-06, "loss": 1.4688, "step": 1191 }, { "epoch": 0.03, "learning_rate": 9.211746522411129e-06, "loss": 1.2847, "step": 1192 }, { "epoch": 0.03, "learning_rate": 9.219474497681609e-06, "loss": 1.0991, "step": 1193 }, { "epoch": 0.03, "learning_rate": 9.227202472952087e-06, "loss": 1.0346, "step": 1194 }, { "epoch": 0.03, "learning_rate": 9.234930448222567e-06, "loss": 1.098, "step": 1195 }, { "epoch": 0.03, "learning_rate": 9.242658423493045e-06, "loss": 0.9695, "step": 1196 }, { "epoch": 0.03, "learning_rate": 9.250386398763525e-06, "loss": 0.9265, "step": 1197 }, { "epoch": 0.03, "learning_rate": 9.258114374034003e-06, "loss": 1.2637, "step": 1198 }, { "epoch": 0.03, "learning_rate": 9.265842349304482e-06, "loss": 1.3521, "step": 1199 }, { "epoch": 0.03, "learning_rate": 9.273570324574962e-06, "loss": 1.0967, "step": 1200 }, { "epoch": 0.03, "learning_rate": 9.281298299845442e-06, "loss": 1.0272, "step": 1201 }, { "epoch": 0.03, "learning_rate": 9.28902627511592e-06, "loss": 1.1767, "step": 1202 }, { "epoch": 0.03, "learning_rate": 9.2967542503864e-06, "loss": 0.9403, "step": 1203 }, { "epoch": 0.03, "learning_rate": 9.30448222565688e-06, "loss": 1.2738, "step": 1204 }, { "epoch": 0.03, "learning_rate": 9.312210200927358e-06, "loss": 1.173, "step": 1205 }, { "epoch": 0.03, "learning_rate": 9.319938176197836e-06, "loss": 0.9912, "step": 1206 }, { "epoch": 0.03, "learning_rate": 9.327666151468316e-06, "loss": 1.2429, "step": 1207 }, { "epoch": 0.03, "learning_rate": 9.335394126738795e-06, "loss": 1.0968, "step": 1208 }, { "epoch": 0.03, "learning_rate": 9.343122102009274e-06, "loss": 1.4569, "step": 1209 }, { "epoch": 0.03, "learning_rate": 9.350850077279754e-06, "loss": 1.1124, "step": 1210 }, { "epoch": 0.03, "learning_rate": 9.358578052550233e-06, "loss": 1.2372, "step": 1211 }, { "epoch": 0.03, "learning_rate": 9.366306027820713e-06, "loss": 0.9276, "step": 1212 }, { "epoch": 0.03, "learning_rate": 9.374034003091191e-06, "loss": 1.1271, "step": 1213 }, { "epoch": 0.03, "learning_rate": 9.381761978361669e-06, "loss": 1.0334, "step": 1214 }, { "epoch": 0.03, "learning_rate": 9.389489953632149e-06, "loss": 1.3807, "step": 1215 }, { "epoch": 0.03, "learning_rate": 9.397217928902627e-06, "loss": 0.8487, "step": 1216 }, { "epoch": 0.03, "learning_rate": 9.404945904173107e-06, "loss": 1.1077, "step": 1217 }, { "epoch": 0.03, "learning_rate": 9.412673879443587e-06, "loss": 1.2172, "step": 1218 }, { "epoch": 0.03, "learning_rate": 9.420401854714066e-06, "loss": 1.5287, "step": 1219 }, { "epoch": 0.03, "learning_rate": 9.428129829984545e-06, "loss": 0.9519, "step": 1220 }, { "epoch": 0.03, "learning_rate": 9.435857805255024e-06, "loss": 1.2607, "step": 1221 }, { "epoch": 0.03, "learning_rate": 9.443585780525502e-06, "loss": 1.1796, "step": 1222 }, { "epoch": 0.03, "learning_rate": 9.451313755795982e-06, "loss": 1.1404, "step": 1223 }, { "epoch": 0.03, "learning_rate": 9.459041731066462e-06, "loss": 1.0707, "step": 1224 }, { "epoch": 0.03, "learning_rate": 9.46676970633694e-06, "loss": 1.1819, "step": 1225 }, { "epoch": 0.03, "learning_rate": 9.47449768160742e-06, "loss": 1.1035, "step": 1226 }, { "epoch": 0.03, "learning_rate": 9.4822256568779e-06, "loss": 1.1005, "step": 1227 }, { "epoch": 0.03, "learning_rate": 9.489953632148378e-06, "loss": 1.1064, "step": 1228 }, { "epoch": 0.03, "learning_rate": 9.497681607418857e-06, "loss": 1.1062, "step": 1229 }, { "epoch": 0.03, "learning_rate": 9.505409582689336e-06, "loss": 1.234, "step": 1230 }, { "epoch": 0.03, "learning_rate": 9.513137557959815e-06, "loss": 0.8213, "step": 1231 }, { "epoch": 0.03, "learning_rate": 9.520865533230295e-06, "loss": 1.0342, "step": 1232 }, { "epoch": 0.03, "learning_rate": 9.528593508500773e-06, "loss": 0.9599, "step": 1233 }, { "epoch": 0.03, "learning_rate": 9.536321483771253e-06, "loss": 0.9544, "step": 1234 }, { "epoch": 0.03, "learning_rate": 9.544049459041733e-06, "loss": 1.1169, "step": 1235 }, { "epoch": 0.03, "learning_rate": 9.551777434312211e-06, "loss": 1.3751, "step": 1236 }, { "epoch": 0.03, "learning_rate": 9.55950540958269e-06, "loss": 1.0293, "step": 1237 }, { "epoch": 0.03, "learning_rate": 9.56723338485317e-06, "loss": 1.2899, "step": 1238 }, { "epoch": 0.03, "learning_rate": 9.574961360123648e-06, "loss": 1.2947, "step": 1239 }, { "epoch": 0.03, "learning_rate": 9.582689335394128e-06, "loss": 1.206, "step": 1240 }, { "epoch": 0.03, "learning_rate": 9.590417310664607e-06, "loss": 0.9916, "step": 1241 }, { "epoch": 0.03, "learning_rate": 9.598145285935086e-06, "loss": 1.0595, "step": 1242 }, { "epoch": 0.03, "learning_rate": 9.605873261205566e-06, "loss": 1.2469, "step": 1243 }, { "epoch": 0.03, "learning_rate": 9.613601236476044e-06, "loss": 1.2762, "step": 1244 }, { "epoch": 0.03, "learning_rate": 9.621329211746522e-06, "loss": 1.3298, "step": 1245 }, { "epoch": 0.03, "learning_rate": 9.629057187017002e-06, "loss": 1.061, "step": 1246 }, { "epoch": 0.03, "learning_rate": 9.636785162287482e-06, "loss": 1.0558, "step": 1247 }, { "epoch": 0.03, "learning_rate": 9.64451313755796e-06, "loss": 1.1297, "step": 1248 }, { "epoch": 0.03, "learning_rate": 9.65224111282844e-06, "loss": 1.1197, "step": 1249 }, { "epoch": 0.03, "learning_rate": 9.65996908809892e-06, "loss": 1.1228, "step": 1250 }, { "epoch": 0.03, "learning_rate": 9.667697063369399e-06, "loss": 1.4191, "step": 1251 }, { "epoch": 0.03, "learning_rate": 9.675425038639877e-06, "loss": 1.01, "step": 1252 }, { "epoch": 0.03, "learning_rate": 9.683153013910355e-06, "loss": 1.0337, "step": 1253 }, { "epoch": 0.03, "learning_rate": 9.690880989180835e-06, "loss": 1.2477, "step": 1254 }, { "epoch": 0.03, "learning_rate": 9.698608964451315e-06, "loss": 1.3472, "step": 1255 }, { "epoch": 0.03, "learning_rate": 9.706336939721793e-06, "loss": 1.268, "step": 1256 }, { "epoch": 0.03, "learning_rate": 9.714064914992273e-06, "loss": 1.4364, "step": 1257 }, { "epoch": 0.03, "learning_rate": 9.721792890262753e-06, "loss": 1.3683, "step": 1258 }, { "epoch": 0.03, "learning_rate": 9.729520865533231e-06, "loss": 1.1099, "step": 1259 }, { "epoch": 0.03, "learning_rate": 9.73724884080371e-06, "loss": 1.2939, "step": 1260 }, { "epoch": 0.03, "learning_rate": 9.74497681607419e-06, "loss": 0.9426, "step": 1261 }, { "epoch": 0.03, "learning_rate": 9.752704791344668e-06, "loss": 1.4043, "step": 1262 }, { "epoch": 0.03, "learning_rate": 9.760432766615148e-06, "loss": 0.913, "step": 1263 }, { "epoch": 0.03, "learning_rate": 9.768160741885628e-06, "loss": 1.1007, "step": 1264 }, { "epoch": 0.03, "learning_rate": 9.775888717156106e-06, "loss": 0.9572, "step": 1265 }, { "epoch": 0.03, "learning_rate": 9.783616692426586e-06, "loss": 1.0717, "step": 1266 }, { "epoch": 0.03, "learning_rate": 9.791344667697064e-06, "loss": 1.2549, "step": 1267 }, { "epoch": 0.03, "learning_rate": 9.799072642967542e-06, "loss": 1.1922, "step": 1268 }, { "epoch": 0.03, "learning_rate": 9.806800618238022e-06, "loss": 1.3972, "step": 1269 }, { "epoch": 0.03, "learning_rate": 9.8145285935085e-06, "loss": 1.0323, "step": 1270 }, { "epoch": 0.03, "learning_rate": 9.82225656877898e-06, "loss": 1.1117, "step": 1271 }, { "epoch": 0.03, "learning_rate": 9.82998454404946e-06, "loss": 0.9673, "step": 1272 }, { "epoch": 0.03, "learning_rate": 9.837712519319939e-06, "loss": 1.1542, "step": 1273 }, { "epoch": 0.03, "learning_rate": 9.845440494590419e-06, "loss": 1.3125, "step": 1274 }, { "epoch": 0.03, "learning_rate": 9.853168469860897e-06, "loss": 1.4988, "step": 1275 }, { "epoch": 0.03, "learning_rate": 9.860896445131375e-06, "loss": 1.1455, "step": 1276 }, { "epoch": 0.03, "learning_rate": 9.868624420401855e-06, "loss": 1.1631, "step": 1277 }, { "epoch": 0.03, "learning_rate": 9.876352395672335e-06, "loss": 1.0012, "step": 1278 }, { "epoch": 0.03, "learning_rate": 9.884080370942813e-06, "loss": 1.1228, "step": 1279 }, { "epoch": 0.03, "learning_rate": 9.891808346213293e-06, "loss": 1.3955, "step": 1280 }, { "epoch": 0.03, "learning_rate": 9.899536321483773e-06, "loss": 1.3387, "step": 1281 }, { "epoch": 0.03, "learning_rate": 9.907264296754252e-06, "loss": 0.9471, "step": 1282 }, { "epoch": 0.03, "learning_rate": 9.91499227202473e-06, "loss": 1.3221, "step": 1283 }, { "epoch": 0.03, "learning_rate": 9.92272024729521e-06, "loss": 1.0049, "step": 1284 }, { "epoch": 0.03, "learning_rate": 9.930448222565688e-06, "loss": 1.2398, "step": 1285 }, { "epoch": 0.03, "learning_rate": 9.938176197836168e-06, "loss": 1.0836, "step": 1286 }, { "epoch": 0.03, "learning_rate": 9.945904173106646e-06, "loss": 1.2323, "step": 1287 }, { "epoch": 0.03, "learning_rate": 9.953632148377126e-06, "loss": 1.4117, "step": 1288 }, { "epoch": 0.03, "learning_rate": 9.961360123647606e-06, "loss": 0.9614, "step": 1289 }, { "epoch": 0.03, "learning_rate": 9.969088098918084e-06, "loss": 1.0249, "step": 1290 }, { "epoch": 0.03, "learning_rate": 9.976816074188563e-06, "loss": 0.9377, "step": 1291 }, { "epoch": 0.03, "learning_rate": 9.984544049459043e-06, "loss": 0.9368, "step": 1292 }, { "epoch": 0.03, "learning_rate": 9.992272024729521e-06, "loss": 1.1494, "step": 1293 }, { "epoch": 0.03, "learning_rate": 1e-05, "loss": 1.4144, "step": 1294 }, { "epoch": 0.03, "learning_rate": 9.999999985895171e-06, "loss": 1.1914, "step": 1295 }, { "epoch": 0.03, "learning_rate": 9.999999943580681e-06, "loss": 1.0858, "step": 1296 }, { "epoch": 0.03, "learning_rate": 9.999999873056532e-06, "loss": 1.2532, "step": 1297 }, { "epoch": 0.03, "learning_rate": 9.999999774322724e-06, "loss": 1.3722, "step": 1298 }, { "epoch": 0.03, "learning_rate": 9.999999647379257e-06, "loss": 1.15, "step": 1299 }, { "epoch": 0.03, "learning_rate": 9.999999492226131e-06, "loss": 1.1696, "step": 1300 }, { "epoch": 0.03, "learning_rate": 9.999999308863349e-06, "loss": 1.0633, "step": 1301 }, { "epoch": 0.03, "learning_rate": 9.99999909729091e-06, "loss": 1.1225, "step": 1302 }, { "epoch": 0.03, "learning_rate": 9.999998857508817e-06, "loss": 1.1462, "step": 1303 }, { "epoch": 0.03, "learning_rate": 9.999998589517071e-06, "loss": 0.9768, "step": 1304 }, { "epoch": 0.03, "learning_rate": 9.999998293315674e-06, "loss": 1.0471, "step": 1305 }, { "epoch": 0.03, "learning_rate": 9.999997968904625e-06, "loss": 1.1243, "step": 1306 }, { "epoch": 0.03, "learning_rate": 9.999997616283928e-06, "loss": 0.9283, "step": 1307 }, { "epoch": 0.03, "learning_rate": 9.999997235453585e-06, "loss": 1.0262, "step": 1308 }, { "epoch": 0.03, "learning_rate": 9.999996826413595e-06, "loss": 1.0404, "step": 1309 }, { "epoch": 0.03, "learning_rate": 9.999996389163966e-06, "loss": 1.2666, "step": 1310 }, { "epoch": 0.03, "learning_rate": 9.999995923704698e-06, "loss": 1.1752, "step": 1311 }, { "epoch": 0.03, "learning_rate": 9.999995430035792e-06, "loss": 1.1584, "step": 1312 }, { "epoch": 0.03, "learning_rate": 9.999994908157251e-06, "loss": 1.1858, "step": 1313 }, { "epoch": 0.03, "learning_rate": 9.99999435806908e-06, "loss": 1.1061, "step": 1314 }, { "epoch": 0.03, "learning_rate": 9.99999377977128e-06, "loss": 1.1566, "step": 1315 }, { "epoch": 0.03, "learning_rate": 9.999993173263856e-06, "loss": 1.3269, "step": 1316 }, { "epoch": 0.03, "learning_rate": 9.99999253854681e-06, "loss": 1.2844, "step": 1317 }, { "epoch": 0.03, "learning_rate": 9.999991875620146e-06, "loss": 1.2919, "step": 1318 }, { "epoch": 0.03, "learning_rate": 9.999991184483869e-06, "loss": 1.2522, "step": 1319 }, { "epoch": 0.03, "learning_rate": 9.99999046513798e-06, "loss": 1.1725, "step": 1320 }, { "epoch": 0.03, "learning_rate": 9.999989717582488e-06, "loss": 1.1586, "step": 1321 }, { "epoch": 0.03, "learning_rate": 9.99998894181739e-06, "loss": 1.0865, "step": 1322 }, { "epoch": 0.03, "learning_rate": 9.999988137842697e-06, "loss": 1.2913, "step": 1323 }, { "epoch": 0.03, "learning_rate": 9.999987305658412e-06, "loss": 1.0801, "step": 1324 }, { "epoch": 0.03, "learning_rate": 9.999986445264538e-06, "loss": 0.9936, "step": 1325 }, { "epoch": 0.03, "learning_rate": 9.99998555666108e-06, "loss": 0.992, "step": 1326 }, { "epoch": 0.03, "learning_rate": 9.999984639848043e-06, "loss": 0.9253, "step": 1327 }, { "epoch": 0.03, "learning_rate": 9.999983694825434e-06, "loss": 1.1841, "step": 1328 }, { "epoch": 0.03, "learning_rate": 9.999982721593256e-06, "loss": 1.0886, "step": 1329 }, { "epoch": 0.03, "learning_rate": 9.999981720151515e-06, "loss": 1.118, "step": 1330 }, { "epoch": 0.03, "learning_rate": 9.99998069050022e-06, "loss": 1.4223, "step": 1331 }, { "epoch": 0.03, "learning_rate": 9.999979632639372e-06, "loss": 1.0114, "step": 1332 }, { "epoch": 0.03, "learning_rate": 9.999978546568979e-06, "loss": 1.1565, "step": 1333 }, { "epoch": 0.03, "learning_rate": 9.999977432289048e-06, "loss": 1.3309, "step": 1334 }, { "epoch": 0.03, "learning_rate": 9.999976289799584e-06, "loss": 0.9064, "step": 1335 }, { "epoch": 0.03, "learning_rate": 9.999975119100594e-06, "loss": 1.0229, "step": 1336 }, { "epoch": 0.03, "learning_rate": 9.999973920192083e-06, "loss": 0.9279, "step": 1337 }, { "epoch": 0.03, "learning_rate": 9.999972693074061e-06, "loss": 0.9024, "step": 1338 }, { "epoch": 0.03, "learning_rate": 9.999971437746532e-06, "loss": 1.0331, "step": 1339 }, { "epoch": 0.03, "learning_rate": 9.999970154209506e-06, "loss": 1.4301, "step": 1340 }, { "epoch": 0.03, "learning_rate": 9.999968842462988e-06, "loss": 1.3346, "step": 1341 }, { "epoch": 0.03, "learning_rate": 9.999967502506984e-06, "loss": 1.1548, "step": 1342 }, { "epoch": 0.03, "learning_rate": 9.999966134341505e-06, "loss": 1.1553, "step": 1343 }, { "epoch": 0.03, "learning_rate": 9.999964737966558e-06, "loss": 0.9917, "step": 1344 }, { "epoch": 0.03, "learning_rate": 9.999963313382148e-06, "loss": 1.18, "step": 1345 }, { "epoch": 0.03, "learning_rate": 9.999961860588286e-06, "loss": 1.1786, "step": 1346 }, { "epoch": 0.03, "learning_rate": 9.999960379584979e-06, "loss": 1.2624, "step": 1347 }, { "epoch": 0.03, "learning_rate": 9.999958870372238e-06, "loss": 0.8394, "step": 1348 }, { "epoch": 0.03, "learning_rate": 9.999957332950066e-06, "loss": 1.0674, "step": 1349 }, { "epoch": 0.03, "learning_rate": 9.999955767318476e-06, "loss": 1.1159, "step": 1350 }, { "epoch": 0.03, "learning_rate": 9.999954173477476e-06, "loss": 1.2492, "step": 1351 }, { "epoch": 0.03, "learning_rate": 9.999952551427074e-06, "loss": 1.0678, "step": 1352 }, { "epoch": 0.03, "learning_rate": 9.999950901167281e-06, "loss": 1.3343, "step": 1353 }, { "epoch": 0.03, "learning_rate": 9.999949222698104e-06, "loss": 1.2218, "step": 1354 }, { "epoch": 0.03, "learning_rate": 9.999947516019552e-06, "loss": 1.2262, "step": 1355 }, { "epoch": 0.03, "learning_rate": 9.99994578113164e-06, "loss": 1.0377, "step": 1356 }, { "epoch": 0.03, "learning_rate": 9.999944018034371e-06, "loss": 1.3355, "step": 1357 }, { "epoch": 0.03, "learning_rate": 9.999942226727759e-06, "loss": 1.4045, "step": 1358 }, { "epoch": 0.03, "learning_rate": 9.999940407211813e-06, "loss": 1.1976, "step": 1359 }, { "epoch": 0.03, "learning_rate": 9.999938559486544e-06, "loss": 1.0258, "step": 1360 }, { "epoch": 0.03, "learning_rate": 9.99993668355196e-06, "loss": 1.2351, "step": 1361 }, { "epoch": 0.03, "learning_rate": 9.999934779408075e-06, "loss": 1.5254, "step": 1362 }, { "epoch": 0.03, "learning_rate": 9.999932847054897e-06, "loss": 1.0048, "step": 1363 }, { "epoch": 0.03, "learning_rate": 9.999930886492439e-06, "loss": 1.0374, "step": 1364 }, { "epoch": 0.03, "learning_rate": 9.99992889772071e-06, "loss": 0.9786, "step": 1365 }, { "epoch": 0.03, "learning_rate": 9.999926880739724e-06, "loss": 1.0951, "step": 1366 }, { "epoch": 0.03, "learning_rate": 9.999924835549489e-06, "loss": 1.113, "step": 1367 }, { "epoch": 0.03, "learning_rate": 9.999922762150018e-06, "loss": 1.3402, "step": 1368 }, { "epoch": 0.03, "learning_rate": 9.999920660541324e-06, "loss": 1.3314, "step": 1369 }, { "epoch": 0.03, "learning_rate": 9.999918530723416e-06, "loss": 1.3397, "step": 1370 }, { "epoch": 0.03, "learning_rate": 9.99991637269631e-06, "loss": 1.3396, "step": 1371 }, { "epoch": 0.03, "learning_rate": 9.999914186460013e-06, "loss": 1.0321, "step": 1372 }, { "epoch": 0.03, "learning_rate": 9.999911972014543e-06, "loss": 1.0748, "step": 1373 }, { "epoch": 0.03, "learning_rate": 9.999909729359908e-06, "loss": 1.0301, "step": 1374 }, { "epoch": 0.03, "learning_rate": 9.999907458496124e-06, "loss": 1.3439, "step": 1375 }, { "epoch": 0.03, "learning_rate": 9.999905159423203e-06, "loss": 1.0902, "step": 1376 }, { "epoch": 0.03, "learning_rate": 9.999902832141154e-06, "loss": 1.3583, "step": 1377 }, { "epoch": 0.03, "learning_rate": 9.999900476649996e-06, "loss": 0.8011, "step": 1378 }, { "epoch": 0.03, "learning_rate": 9.999898092949738e-06, "loss": 1.0307, "step": 1379 }, { "epoch": 0.03, "learning_rate": 9.999895681040395e-06, "loss": 1.0601, "step": 1380 }, { "epoch": 0.03, "learning_rate": 9.999893240921982e-06, "loss": 0.9575, "step": 1381 }, { "epoch": 0.03, "learning_rate": 9.999890772594511e-06, "loss": 1.1914, "step": 1382 }, { "epoch": 0.03, "learning_rate": 9.999888276057995e-06, "loss": 1.15, "step": 1383 }, { "epoch": 0.03, "learning_rate": 9.99988575131245e-06, "loss": 1.5214, "step": 1384 }, { "epoch": 0.03, "learning_rate": 9.999883198357892e-06, "loss": 1.133, "step": 1385 }, { "epoch": 0.03, "learning_rate": 9.99988061719433e-06, "loss": 1.1107, "step": 1386 }, { "epoch": 0.03, "learning_rate": 9.999878007821782e-06, "loss": 0.9918, "step": 1387 }, { "epoch": 0.03, "learning_rate": 9.999875370240263e-06, "loss": 1.1828, "step": 1388 }, { "epoch": 0.03, "learning_rate": 9.99987270444979e-06, "loss": 1.1842, "step": 1389 }, { "epoch": 0.03, "learning_rate": 9.999870010450373e-06, "loss": 1.2369, "step": 1390 }, { "epoch": 0.03, "learning_rate": 9.999867288242027e-06, "loss": 1.2759, "step": 1391 }, { "epoch": 0.03, "learning_rate": 9.999864537824773e-06, "loss": 1.3564, "step": 1392 }, { "epoch": 0.03, "learning_rate": 9.999861759198623e-06, "loss": 1.1303, "step": 1393 }, { "epoch": 0.03, "learning_rate": 9.999858952363592e-06, "loss": 0.9311, "step": 1394 }, { "epoch": 0.03, "learning_rate": 9.999856117319698e-06, "loss": 1.1289, "step": 1395 }, { "epoch": 0.03, "learning_rate": 9.999853254066955e-06, "loss": 1.18, "step": 1396 }, { "epoch": 0.03, "learning_rate": 9.99985036260538e-06, "loss": 1.077, "step": 1397 }, { "epoch": 0.03, "learning_rate": 9.999847442934991e-06, "loss": 1.168, "step": 1398 }, { "epoch": 0.03, "learning_rate": 9.9998444950558e-06, "loss": 1.1449, "step": 1399 }, { "epoch": 0.03, "learning_rate": 9.999841518967828e-06, "loss": 1.1809, "step": 1400 }, { "epoch": 0.03, "learning_rate": 9.99983851467109e-06, "loss": 0.9491, "step": 1401 }, { "epoch": 0.03, "learning_rate": 9.999835482165604e-06, "loss": 0.9606, "step": 1402 }, { "epoch": 0.03, "learning_rate": 9.999832421451385e-06, "loss": 1.2055, "step": 1403 }, { "epoch": 0.03, "learning_rate": 9.999829332528452e-06, "loss": 1.0745, "step": 1404 }, { "epoch": 0.03, "learning_rate": 9.999826215396824e-06, "loss": 1.2004, "step": 1405 }, { "epoch": 0.03, "learning_rate": 9.999823070056513e-06, "loss": 1.3773, "step": 1406 }, { "epoch": 0.03, "learning_rate": 9.999819896507543e-06, "loss": 1.2404, "step": 1407 }, { "epoch": 0.03, "learning_rate": 9.99981669474993e-06, "loss": 1.001, "step": 1408 }, { "epoch": 0.03, "learning_rate": 9.99981346478369e-06, "loss": 1.0718, "step": 1409 }, { "epoch": 0.03, "learning_rate": 9.99981020660884e-06, "loss": 1.2564, "step": 1410 }, { "epoch": 0.03, "learning_rate": 9.999806920225403e-06, "loss": 1.134, "step": 1411 }, { "epoch": 0.03, "learning_rate": 9.999803605633396e-06, "loss": 1.4868, "step": 1412 }, { "epoch": 0.03, "learning_rate": 9.999800262832837e-06, "loss": 1.1787, "step": 1413 }, { "epoch": 0.03, "learning_rate": 9.999796891823746e-06, "loss": 1.0405, "step": 1414 }, { "epoch": 0.03, "learning_rate": 9.999793492606139e-06, "loss": 1.21, "step": 1415 }, { "epoch": 0.03, "learning_rate": 9.999790065180037e-06, "loss": 1.0975, "step": 1416 }, { "epoch": 0.03, "learning_rate": 9.999786609545462e-06, "loss": 1.1233, "step": 1417 }, { "epoch": 0.03, "learning_rate": 9.99978312570243e-06, "loss": 1.2505, "step": 1418 }, { "epoch": 0.03, "learning_rate": 9.99977961365096e-06, "loss": 0.9906, "step": 1419 }, { "epoch": 0.03, "learning_rate": 9.999776073391075e-06, "loss": 1.0024, "step": 1420 }, { "epoch": 0.03, "learning_rate": 9.999772504922793e-06, "loss": 1.3488, "step": 1421 }, { "epoch": 0.03, "learning_rate": 9.999768908246134e-06, "loss": 1.3895, "step": 1422 }, { "epoch": 0.03, "learning_rate": 9.99976528336112e-06, "loss": 1.1852, "step": 1423 }, { "epoch": 0.03, "learning_rate": 9.99976163026777e-06, "loss": 1.0534, "step": 1424 }, { "epoch": 0.03, "learning_rate": 9.999757948966104e-06, "loss": 1.2672, "step": 1425 }, { "epoch": 0.03, "learning_rate": 9.999754239456146e-06, "loss": 1.2113, "step": 1426 }, { "epoch": 0.03, "learning_rate": 9.999750501737913e-06, "loss": 0.8137, "step": 1427 }, { "epoch": 0.03, "learning_rate": 9.999746735811429e-06, "loss": 1.3615, "step": 1428 }, { "epoch": 0.03, "learning_rate": 9.999742941676714e-06, "loss": 1.1386, "step": 1429 }, { "epoch": 0.03, "learning_rate": 9.999739119333786e-06, "loss": 1.1246, "step": 1430 }, { "epoch": 0.03, "learning_rate": 9.999735268782673e-06, "loss": 1.3213, "step": 1431 }, { "epoch": 0.03, "learning_rate": 9.999731390023395e-06, "loss": 0.8746, "step": 1432 }, { "epoch": 0.03, "learning_rate": 9.99972748305597e-06, "loss": 0.9306, "step": 1433 }, { "epoch": 0.03, "learning_rate": 9.999723547880424e-06, "loss": 1.2192, "step": 1434 }, { "epoch": 0.03, "learning_rate": 9.999719584496776e-06, "loss": 1.0624, "step": 1435 }, { "epoch": 0.03, "learning_rate": 9.999715592905053e-06, "loss": 1.3955, "step": 1436 }, { "epoch": 0.03, "learning_rate": 9.999711573105272e-06, "loss": 0.9833, "step": 1437 }, { "epoch": 0.03, "learning_rate": 9.99970752509746e-06, "loss": 0.9675, "step": 1438 }, { "epoch": 0.03, "learning_rate": 9.999703448881638e-06, "loss": 1.0396, "step": 1439 }, { "epoch": 0.03, "learning_rate": 9.99969934445783e-06, "loss": 0.9029, "step": 1440 }, { "epoch": 0.03, "learning_rate": 9.999695211826057e-06, "loss": 1.2313, "step": 1441 }, { "epoch": 0.03, "learning_rate": 9.999691050986342e-06, "loss": 1.5096, "step": 1442 }, { "epoch": 0.03, "learning_rate": 9.999686861938713e-06, "loss": 1.0149, "step": 1443 }, { "epoch": 0.03, "learning_rate": 9.99968264468319e-06, "loss": 1.0689, "step": 1444 }, { "epoch": 0.03, "learning_rate": 9.9996783992198e-06, "loss": 0.8879, "step": 1445 }, { "epoch": 0.03, "learning_rate": 9.99967412554856e-06, "loss": 1.0494, "step": 1446 }, { "epoch": 0.03, "learning_rate": 9.999669823669502e-06, "loss": 0.9881, "step": 1447 }, { "epoch": 0.03, "learning_rate": 9.999665493582645e-06, "loss": 1.2873, "step": 1448 }, { "epoch": 0.03, "learning_rate": 9.999661135288016e-06, "loss": 1.064, "step": 1449 }, { "epoch": 0.03, "learning_rate": 9.99965674878564e-06, "loss": 1.2118, "step": 1450 }, { "epoch": 0.03, "learning_rate": 9.99965233407554e-06, "loss": 1.0484, "step": 1451 }, { "epoch": 0.03, "learning_rate": 9.999647891157741e-06, "loss": 1.014, "step": 1452 }, { "epoch": 0.03, "learning_rate": 9.999643420032269e-06, "loss": 1.0051, "step": 1453 }, { "epoch": 0.03, "learning_rate": 9.999638920699149e-06, "loss": 1.3759, "step": 1454 }, { "epoch": 0.03, "learning_rate": 9.999634393158406e-06, "loss": 1.2153, "step": 1455 }, { "epoch": 0.03, "learning_rate": 9.999629837410066e-06, "loss": 1.1935, "step": 1456 }, { "epoch": 0.03, "learning_rate": 9.999625253454155e-06, "loss": 1.1087, "step": 1457 }, { "epoch": 0.03, "learning_rate": 9.999620641290699e-06, "loss": 1.301, "step": 1458 }, { "epoch": 0.03, "learning_rate": 9.99961600091972e-06, "loss": 0.7773, "step": 1459 }, { "epoch": 0.03, "learning_rate": 9.999611332341251e-06, "loss": 1.4354, "step": 1460 }, { "epoch": 0.03, "learning_rate": 9.999606635555315e-06, "loss": 1.1782, "step": 1461 }, { "epoch": 0.03, "learning_rate": 9.999601910561937e-06, "loss": 1.2528, "step": 1462 }, { "epoch": 0.03, "learning_rate": 9.999597157361146e-06, "loss": 0.9897, "step": 1463 }, { "epoch": 0.03, "learning_rate": 9.999592375952966e-06, "loss": 0.9889, "step": 1464 }, { "epoch": 0.03, "learning_rate": 9.999587566337429e-06, "loss": 1.044, "step": 1465 }, { "epoch": 0.03, "learning_rate": 9.999582728514556e-06, "loss": 1.0474, "step": 1466 }, { "epoch": 0.03, "learning_rate": 9.99957786248438e-06, "loss": 1.2329, "step": 1467 }, { "epoch": 0.03, "learning_rate": 9.999572968246925e-06, "loss": 1.3792, "step": 1468 }, { "epoch": 0.03, "learning_rate": 9.999568045802216e-06, "loss": 1.3008, "step": 1469 }, { "epoch": 0.03, "learning_rate": 9.99956309515029e-06, "loss": 0.9756, "step": 1470 }, { "epoch": 0.03, "learning_rate": 9.999558116291164e-06, "loss": 1.1467, "step": 1471 }, { "epoch": 0.03, "learning_rate": 9.999553109224875e-06, "loss": 1.1403, "step": 1472 }, { "epoch": 0.03, "learning_rate": 9.999548073951446e-06, "loss": 1.2093, "step": 1473 }, { "epoch": 0.03, "learning_rate": 9.999543010470905e-06, "loss": 1.2039, "step": 1474 }, { "epoch": 0.03, "learning_rate": 9.999537918783285e-06, "loss": 1.2725, "step": 1475 }, { "epoch": 0.03, "learning_rate": 9.99953279888861e-06, "loss": 1.2523, "step": 1476 }, { "epoch": 0.03, "learning_rate": 9.999527650786913e-06, "loss": 1.0649, "step": 1477 }, { "epoch": 0.03, "learning_rate": 9.99952247447822e-06, "loss": 0.9872, "step": 1478 }, { "epoch": 0.03, "learning_rate": 9.999517269962561e-06, "loss": 1.0407, "step": 1479 }, { "epoch": 0.03, "learning_rate": 9.999512037239967e-06, "loss": 1.0746, "step": 1480 }, { "epoch": 0.03, "learning_rate": 9.999506776310464e-06, "loss": 1.1165, "step": 1481 }, { "epoch": 0.03, "learning_rate": 9.999501487174085e-06, "loss": 1.2321, "step": 1482 }, { "epoch": 0.03, "learning_rate": 9.999496169830859e-06, "loss": 1.0493, "step": 1483 }, { "epoch": 0.03, "learning_rate": 9.999490824280815e-06, "loss": 1.2225, "step": 1484 }, { "epoch": 0.03, "learning_rate": 9.999485450523984e-06, "loss": 0.882, "step": 1485 }, { "epoch": 0.03, "learning_rate": 9.999480048560397e-06, "loss": 1.0552, "step": 1486 }, { "epoch": 0.03, "learning_rate": 9.999474618390083e-06, "loss": 1.1721, "step": 1487 }, { "epoch": 0.03, "learning_rate": 9.999469160013074e-06, "loss": 1.0574, "step": 1488 }, { "epoch": 0.03, "learning_rate": 9.9994636734294e-06, "loss": 1.5739, "step": 1489 }, { "epoch": 0.03, "learning_rate": 9.999458158639091e-06, "loss": 1.1519, "step": 1490 }, { "epoch": 0.03, "learning_rate": 9.999452615642177e-06, "loss": 1.246, "step": 1491 }, { "epoch": 0.03, "learning_rate": 9.999447044438696e-06, "loss": 1.112, "step": 1492 }, { "epoch": 0.03, "learning_rate": 9.999441445028673e-06, "loss": 1.1036, "step": 1493 }, { "epoch": 0.03, "learning_rate": 9.99943581741214e-06, "loss": 0.9466, "step": 1494 }, { "epoch": 0.03, "learning_rate": 9.999430161589133e-06, "loss": 1.0698, "step": 1495 }, { "epoch": 0.03, "learning_rate": 9.999424477559678e-06, "loss": 1.1112, "step": 1496 }, { "epoch": 0.03, "learning_rate": 9.999418765323811e-06, "loss": 0.8836, "step": 1497 }, { "epoch": 0.03, "learning_rate": 9.999413024881564e-06, "loss": 1.2782, "step": 1498 }, { "epoch": 0.03, "learning_rate": 9.99940725623297e-06, "loss": 1.2625, "step": 1499 }, { "epoch": 0.03, "learning_rate": 9.999401459378059e-06, "loss": 1.2561, "step": 1500 }, { "epoch": 0.03, "learning_rate": 9.999395634316864e-06, "loss": 1.1876, "step": 1501 }, { "epoch": 0.03, "learning_rate": 9.99938978104942e-06, "loss": 1.058, "step": 1502 }, { "epoch": 0.03, "learning_rate": 9.99938389957576e-06, "loss": 1.1447, "step": 1503 }, { "epoch": 0.03, "learning_rate": 9.999377989895914e-06, "loss": 0.9954, "step": 1504 }, { "epoch": 0.03, "learning_rate": 9.99937205200992e-06, "loss": 1.0971, "step": 1505 }, { "epoch": 0.03, "learning_rate": 9.999366085917806e-06, "loss": 1.2141, "step": 1506 }, { "epoch": 0.03, "learning_rate": 9.99936009161961e-06, "loss": 1.2913, "step": 1507 }, { "epoch": 0.03, "learning_rate": 9.999354069115365e-06, "loss": 0.8302, "step": 1508 }, { "epoch": 0.03, "learning_rate": 9.999348018405103e-06, "loss": 0.9804, "step": 1509 }, { "epoch": 0.04, "learning_rate": 9.99934193948886e-06, "loss": 1.0379, "step": 1510 }, { "epoch": 0.04, "learning_rate": 9.999335832366672e-06, "loss": 1.0356, "step": 1511 }, { "epoch": 0.04, "learning_rate": 9.99932969703857e-06, "loss": 1.0204, "step": 1512 }, { "epoch": 0.04, "learning_rate": 9.999323533504588e-06, "loss": 1.3292, "step": 1513 }, { "epoch": 0.04, "learning_rate": 9.999317341764764e-06, "loss": 1.0829, "step": 1514 }, { "epoch": 0.04, "learning_rate": 9.999311121819133e-06, "loss": 0.9661, "step": 1515 }, { "epoch": 0.04, "learning_rate": 9.999304873667726e-06, "loss": 1.3273, "step": 1516 }, { "epoch": 0.04, "learning_rate": 9.999298597310582e-06, "loss": 1.0804, "step": 1517 }, { "epoch": 0.04, "learning_rate": 9.999292292747735e-06, "loss": 1.2142, "step": 1518 }, { "epoch": 0.04, "learning_rate": 9.999285959979222e-06, "loss": 1.0474, "step": 1519 }, { "epoch": 0.04, "learning_rate": 9.999279599005078e-06, "loss": 0.91, "step": 1520 }, { "epoch": 0.04, "learning_rate": 9.999273209825337e-06, "loss": 0.9951, "step": 1521 }, { "epoch": 0.04, "learning_rate": 9.999266792440039e-06, "loss": 1.3073, "step": 1522 }, { "epoch": 0.04, "learning_rate": 9.999260346849216e-06, "loss": 1.0217, "step": 1523 }, { "epoch": 0.04, "learning_rate": 9.999253873052906e-06, "loss": 1.2474, "step": 1524 }, { "epoch": 0.04, "learning_rate": 9.999247371051145e-06, "loss": 1.0721, "step": 1525 }, { "epoch": 0.04, "learning_rate": 9.999240840843974e-06, "loss": 0.9529, "step": 1526 }, { "epoch": 0.04, "learning_rate": 9.999234282431422e-06, "loss": 1.1128, "step": 1527 }, { "epoch": 0.04, "learning_rate": 9.999227695813532e-06, "loss": 1.0448, "step": 1528 }, { "epoch": 0.04, "learning_rate": 9.999221080990341e-06, "loss": 1.131, "step": 1529 }, { "epoch": 0.04, "learning_rate": 9.999214437961881e-06, "loss": 1.0151, "step": 1530 }, { "epoch": 0.04, "learning_rate": 9.999207766728196e-06, "loss": 1.2357, "step": 1531 }, { "epoch": 0.04, "learning_rate": 9.99920106728932e-06, "loss": 1.1626, "step": 1532 }, { "epoch": 0.04, "learning_rate": 9.999194339645292e-06, "loss": 1.1253, "step": 1533 }, { "epoch": 0.04, "learning_rate": 9.999187583796148e-06, "loss": 1.1664, "step": 1534 }, { "epoch": 0.04, "learning_rate": 9.99918079974193e-06, "loss": 1.162, "step": 1535 }, { "epoch": 0.04, "learning_rate": 9.999173987482674e-06, "loss": 1.0028, "step": 1536 }, { "epoch": 0.04, "learning_rate": 9.999167147018416e-06, "loss": 1.0847, "step": 1537 }, { "epoch": 0.04, "learning_rate": 9.999160278349199e-06, "loss": 1.028, "step": 1538 }, { "epoch": 0.04, "learning_rate": 9.99915338147506e-06, "loss": 0.874, "step": 1539 }, { "epoch": 0.04, "learning_rate": 9.999146456396036e-06, "loss": 0.7182, "step": 1540 }, { "epoch": 0.04, "learning_rate": 9.999139503112167e-06, "loss": 1.0405, "step": 1541 }, { "epoch": 0.04, "learning_rate": 9.999132521623495e-06, "loss": 1.336, "step": 1542 }, { "epoch": 0.04, "learning_rate": 9.999125511930056e-06, "loss": 0.9943, "step": 1543 }, { "epoch": 0.04, "learning_rate": 9.999118474031892e-06, "loss": 1.271, "step": 1544 }, { "epoch": 0.04, "learning_rate": 9.999111407929044e-06, "loss": 0.9961, "step": 1545 }, { "epoch": 0.04, "learning_rate": 9.999104313621546e-06, "loss": 1.0706, "step": 1546 }, { "epoch": 0.04, "learning_rate": 9.999097191109441e-06, "loss": 1.2629, "step": 1547 }, { "epoch": 0.04, "learning_rate": 9.999090040392772e-06, "loss": 1.1691, "step": 1548 }, { "epoch": 0.04, "learning_rate": 9.999082861471576e-06, "loss": 0.9404, "step": 1549 }, { "epoch": 0.04, "learning_rate": 9.999075654345895e-06, "loss": 1.0098, "step": 1550 }, { "epoch": 0.04, "learning_rate": 9.999068419015769e-06, "loss": 1.1596, "step": 1551 }, { "epoch": 0.04, "learning_rate": 9.999061155481238e-06, "loss": 1.3724, "step": 1552 }, { "epoch": 0.04, "learning_rate": 9.999053863742344e-06, "loss": 1.22, "step": 1553 }, { "epoch": 0.04, "learning_rate": 9.99904654379913e-06, "loss": 1.3099, "step": 1554 }, { "epoch": 0.04, "learning_rate": 9.999039195651635e-06, "loss": 0.8795, "step": 1555 }, { "epoch": 0.04, "learning_rate": 9.999031819299901e-06, "loss": 1.0775, "step": 1556 }, { "epoch": 0.04, "learning_rate": 9.999024414743968e-06, "loss": 1.4494, "step": 1557 }, { "epoch": 0.04, "learning_rate": 9.99901698198388e-06, "loss": 1.1794, "step": 1558 }, { "epoch": 0.04, "learning_rate": 9.999009521019678e-06, "loss": 1.1071, "step": 1559 }, { "epoch": 0.04, "learning_rate": 9.999002031851404e-06, "loss": 1.231, "step": 1560 }, { "epoch": 0.04, "learning_rate": 9.998994514479102e-06, "loss": 1.1073, "step": 1561 }, { "epoch": 0.04, "learning_rate": 9.998986968902811e-06, "loss": 1.1064, "step": 1562 }, { "epoch": 0.04, "learning_rate": 9.998979395122577e-06, "loss": 1.2494, "step": 1563 }, { "epoch": 0.04, "learning_rate": 9.99897179313844e-06, "loss": 1.1669, "step": 1564 }, { "epoch": 0.04, "learning_rate": 9.998964162950447e-06, "loss": 1.1234, "step": 1565 }, { "epoch": 0.04, "learning_rate": 9.998956504558636e-06, "loss": 1.1257, "step": 1566 }, { "epoch": 0.04, "learning_rate": 9.998948817963052e-06, "loss": 1.2691, "step": 1567 }, { "epoch": 0.04, "learning_rate": 9.99894110316374e-06, "loss": 0.9981, "step": 1568 }, { "epoch": 0.04, "learning_rate": 9.998933360160742e-06, "loss": 1.2396, "step": 1569 }, { "epoch": 0.04, "learning_rate": 9.998925588954102e-06, "loss": 1.2344, "step": 1570 }, { "epoch": 0.04, "learning_rate": 9.998917789543864e-06, "loss": 1.3156, "step": 1571 }, { "epoch": 0.04, "learning_rate": 9.998909961930073e-06, "loss": 1.0232, "step": 1572 }, { "epoch": 0.04, "learning_rate": 9.99890210611277e-06, "loss": 1.139, "step": 1573 }, { "epoch": 0.04, "learning_rate": 9.998894222092002e-06, "loss": 1.2643, "step": 1574 }, { "epoch": 0.04, "learning_rate": 9.998886309867812e-06, "loss": 1.0971, "step": 1575 }, { "epoch": 0.04, "learning_rate": 9.998878369440245e-06, "loss": 1.3685, "step": 1576 }, { "epoch": 0.04, "learning_rate": 9.998870400809348e-06, "loss": 1.1458, "step": 1577 }, { "epoch": 0.04, "learning_rate": 9.998862403975166e-06, "loss": 1.1263, "step": 1578 }, { "epoch": 0.04, "learning_rate": 9.998854378937739e-06, "loss": 1.0671, "step": 1579 }, { "epoch": 0.04, "learning_rate": 9.998846325697117e-06, "loss": 1.3508, "step": 1580 }, { "epoch": 0.04, "learning_rate": 9.998838244253343e-06, "loss": 0.9181, "step": 1581 }, { "epoch": 0.04, "learning_rate": 9.998830134606465e-06, "loss": 1.1851, "step": 1582 }, { "epoch": 0.04, "learning_rate": 9.998821996756526e-06, "loss": 1.4399, "step": 1583 }, { "epoch": 0.04, "learning_rate": 9.998813830703575e-06, "loss": 1.3099, "step": 1584 }, { "epoch": 0.04, "learning_rate": 9.998805636447656e-06, "loss": 1.2465, "step": 1585 }, { "epoch": 0.04, "learning_rate": 9.998797413988815e-06, "loss": 1.266, "step": 1586 }, { "epoch": 0.04, "learning_rate": 9.998789163327098e-06, "loss": 1.0248, "step": 1587 }, { "epoch": 0.04, "learning_rate": 9.998780884462556e-06, "loss": 1.2859, "step": 1588 }, { "epoch": 0.04, "learning_rate": 9.998772577395228e-06, "loss": 1.3001, "step": 1589 }, { "epoch": 0.04, "learning_rate": 9.998764242125167e-06, "loss": 1.1026, "step": 1590 }, { "epoch": 0.04, "learning_rate": 9.99875587865242e-06, "loss": 1.0666, "step": 1591 }, { "epoch": 0.04, "learning_rate": 9.998747486977029e-06, "loss": 1.0155, "step": 1592 }, { "epoch": 0.04, "learning_rate": 9.998739067099048e-06, "loss": 1.5588, "step": 1593 }, { "epoch": 0.04, "learning_rate": 9.99873061901852e-06, "loss": 1.1069, "step": 1594 }, { "epoch": 0.04, "learning_rate": 9.998722142735494e-06, "loss": 1.1992, "step": 1595 }, { "epoch": 0.04, "learning_rate": 9.998713638250016e-06, "loss": 1.1337, "step": 1596 }, { "epoch": 0.04, "learning_rate": 9.998705105562137e-06, "loss": 1.0584, "step": 1597 }, { "epoch": 0.04, "learning_rate": 9.998696544671903e-06, "loss": 1.2517, "step": 1598 }, { "epoch": 0.04, "learning_rate": 9.998687955579363e-06, "loss": 1.2732, "step": 1599 }, { "epoch": 0.04, "learning_rate": 9.998679338284567e-06, "loss": 0.9688, "step": 1600 }, { "epoch": 0.04, "learning_rate": 9.998670692787562e-06, "loss": 1.0138, "step": 1601 }, { "epoch": 0.04, "learning_rate": 9.998662019088396e-06, "loss": 1.047, "step": 1602 }, { "epoch": 0.04, "learning_rate": 9.99865331718712e-06, "loss": 1.2447, "step": 1603 }, { "epoch": 0.04, "learning_rate": 9.99864458708378e-06, "loss": 1.4372, "step": 1604 }, { "epoch": 0.04, "learning_rate": 9.998635828778429e-06, "loss": 1.0406, "step": 1605 }, { "epoch": 0.04, "learning_rate": 9.998627042271115e-06, "loss": 0.9279, "step": 1606 }, { "epoch": 0.04, "learning_rate": 9.998618227561885e-06, "loss": 1.0566, "step": 1607 }, { "epoch": 0.04, "learning_rate": 9.998609384650793e-06, "loss": 1.228, "step": 1608 }, { "epoch": 0.04, "learning_rate": 9.998600513537886e-06, "loss": 1.0301, "step": 1609 }, { "epoch": 0.04, "learning_rate": 9.998591614223216e-06, "loss": 0.9537, "step": 1610 }, { "epoch": 0.04, "learning_rate": 9.99858268670683e-06, "loss": 1.4069, "step": 1611 }, { "epoch": 0.04, "learning_rate": 9.998573730988784e-06, "loss": 1.1853, "step": 1612 }, { "epoch": 0.04, "learning_rate": 9.998564747069122e-06, "loss": 1.2355, "step": 1613 }, { "epoch": 0.04, "learning_rate": 9.998555734947898e-06, "loss": 1.3015, "step": 1614 }, { "epoch": 0.04, "learning_rate": 9.998546694625162e-06, "loss": 1.2664, "step": 1615 }, { "epoch": 0.04, "learning_rate": 9.998537626100968e-06, "loss": 1.119, "step": 1616 }, { "epoch": 0.04, "learning_rate": 9.998528529375362e-06, "loss": 1.1277, "step": 1617 }, { "epoch": 0.04, "learning_rate": 9.9985194044484e-06, "loss": 1.1821, "step": 1618 }, { "epoch": 0.04, "learning_rate": 9.99851025132013e-06, "loss": 1.0787, "step": 1619 }, { "epoch": 0.04, "learning_rate": 9.998501069990607e-06, "loss": 1.5094, "step": 1620 }, { "epoch": 0.04, "learning_rate": 9.99849186045988e-06, "loss": 1.0923, "step": 1621 }, { "epoch": 0.04, "learning_rate": 9.998482622728001e-06, "loss": 1.4623, "step": 1622 }, { "epoch": 0.04, "learning_rate": 9.998473356795025e-06, "loss": 1.229, "step": 1623 }, { "epoch": 0.04, "learning_rate": 9.998464062661001e-06, "loss": 1.2052, "step": 1624 }, { "epoch": 0.04, "learning_rate": 9.998454740325983e-06, "loss": 1.1404, "step": 1625 }, { "epoch": 0.04, "learning_rate": 9.998445389790024e-06, "loss": 1.0561, "step": 1626 }, { "epoch": 0.04, "learning_rate": 9.998436011053176e-06, "loss": 1.1267, "step": 1627 }, { "epoch": 0.04, "learning_rate": 9.99842660411549e-06, "loss": 1.2308, "step": 1628 }, { "epoch": 0.04, "learning_rate": 9.998417168977024e-06, "loss": 1.0422, "step": 1629 }, { "epoch": 0.04, "learning_rate": 9.998407705637825e-06, "loss": 1.0079, "step": 1630 }, { "epoch": 0.04, "learning_rate": 9.998398214097954e-06, "loss": 1.1476, "step": 1631 }, { "epoch": 0.04, "learning_rate": 9.998388694357457e-06, "loss": 0.9895, "step": 1632 }, { "epoch": 0.04, "learning_rate": 9.998379146416392e-06, "loss": 1.3906, "step": 1633 }, { "epoch": 0.04, "learning_rate": 9.99836957027481e-06, "loss": 0.9879, "step": 1634 }, { "epoch": 0.04, "learning_rate": 9.99835996593277e-06, "loss": 1.2213, "step": 1635 }, { "epoch": 0.04, "learning_rate": 9.99835033339032e-06, "loss": 0.9946, "step": 1636 }, { "epoch": 0.04, "learning_rate": 9.99834067264752e-06, "loss": 1.2496, "step": 1637 }, { "epoch": 0.04, "learning_rate": 9.998330983704421e-06, "loss": 1.2481, "step": 1638 }, { "epoch": 0.04, "learning_rate": 9.99832126656108e-06, "loss": 1.0427, "step": 1639 }, { "epoch": 0.04, "learning_rate": 9.998311521217547e-06, "loss": 1.3076, "step": 1640 }, { "epoch": 0.04, "learning_rate": 9.998301747673883e-06, "loss": 1.1115, "step": 1641 }, { "epoch": 0.04, "learning_rate": 9.998291945930142e-06, "loss": 1.048, "step": 1642 }, { "epoch": 0.04, "learning_rate": 9.998282115986374e-06, "loss": 0.8403, "step": 1643 }, { "epoch": 0.04, "learning_rate": 9.99827225784264e-06, "loss": 0.8981, "step": 1644 }, { "epoch": 0.04, "learning_rate": 9.998262371498994e-06, "loss": 0.8763, "step": 1645 }, { "epoch": 0.04, "learning_rate": 9.998252456955492e-06, "loss": 0.9661, "step": 1646 }, { "epoch": 0.04, "learning_rate": 9.998242514212188e-06, "loss": 1.1853, "step": 1647 }, { "epoch": 0.04, "learning_rate": 9.998232543269142e-06, "loss": 1.1617, "step": 1648 }, { "epoch": 0.04, "learning_rate": 9.998222544126405e-06, "loss": 1.0885, "step": 1649 }, { "epoch": 0.04, "learning_rate": 9.99821251678404e-06, "loss": 1.3544, "step": 1650 }, { "epoch": 0.04, "learning_rate": 9.998202461242099e-06, "loss": 1.2349, "step": 1651 }, { "epoch": 0.04, "learning_rate": 9.998192377500638e-06, "loss": 1.3338, "step": 1652 }, { "epoch": 0.04, "learning_rate": 9.998182265559717e-06, "loss": 1.1691, "step": 1653 }, { "epoch": 0.04, "learning_rate": 9.998172125419391e-06, "loss": 1.22, "step": 1654 }, { "epoch": 0.04, "learning_rate": 9.998161957079717e-06, "loss": 1.0377, "step": 1655 }, { "epoch": 0.04, "learning_rate": 9.998151760540756e-06, "loss": 1.0465, "step": 1656 }, { "epoch": 0.04, "learning_rate": 9.998141535802558e-06, "loss": 1.1125, "step": 1657 }, { "epoch": 0.04, "learning_rate": 9.99813128286519e-06, "loss": 1.2892, "step": 1658 }, { "epoch": 0.04, "learning_rate": 9.998121001728705e-06, "loss": 1.0791, "step": 1659 }, { "epoch": 0.04, "learning_rate": 9.99811069239316e-06, "loss": 1.1596, "step": 1660 }, { "epoch": 0.04, "learning_rate": 9.998100354858614e-06, "loss": 0.7355, "step": 1661 }, { "epoch": 0.04, "learning_rate": 9.998089989125126e-06, "loss": 0.996, "step": 1662 }, { "epoch": 0.04, "learning_rate": 9.998079595192753e-06, "loss": 1.129, "step": 1663 }, { "epoch": 0.04, "learning_rate": 9.998069173061557e-06, "loss": 1.2663, "step": 1664 }, { "epoch": 0.04, "learning_rate": 9.998058722731594e-06, "loss": 1.1486, "step": 1665 }, { "epoch": 0.04, "learning_rate": 9.998048244202924e-06, "loss": 1.3347, "step": 1666 }, { "epoch": 0.04, "learning_rate": 9.998037737475606e-06, "loss": 1.1758, "step": 1667 }, { "epoch": 0.04, "learning_rate": 9.998027202549698e-06, "loss": 1.1108, "step": 1668 }, { "epoch": 0.04, "learning_rate": 9.99801663942526e-06, "loss": 1.1711, "step": 1669 }, { "epoch": 0.04, "learning_rate": 9.998006048102354e-06, "loss": 1.0449, "step": 1670 }, { "epoch": 0.04, "learning_rate": 9.997995428581037e-06, "loss": 1.1843, "step": 1671 }, { "epoch": 0.04, "learning_rate": 9.997984780861369e-06, "loss": 1.0682, "step": 1672 }, { "epoch": 0.04, "learning_rate": 9.997974104943412e-06, "loss": 0.84, "step": 1673 }, { "epoch": 0.04, "learning_rate": 9.997963400827224e-06, "loss": 1.1317, "step": 1674 }, { "epoch": 0.04, "learning_rate": 9.997952668512866e-06, "loss": 0.8795, "step": 1675 }, { "epoch": 0.04, "learning_rate": 9.997941908000402e-06, "loss": 1.108, "step": 1676 }, { "epoch": 0.04, "learning_rate": 9.997931119289887e-06, "loss": 0.9631, "step": 1677 }, { "epoch": 0.04, "learning_rate": 9.997920302381385e-06, "loss": 1.167, "step": 1678 }, { "epoch": 0.04, "learning_rate": 9.997909457274957e-06, "loss": 1.2596, "step": 1679 }, { "epoch": 0.04, "learning_rate": 9.997898583970664e-06, "loss": 1.1028, "step": 1680 }, { "epoch": 0.04, "learning_rate": 9.997887682468566e-06, "loss": 1.0209, "step": 1681 }, { "epoch": 0.04, "learning_rate": 9.997876752768726e-06, "loss": 1.1541, "step": 1682 }, { "epoch": 0.04, "learning_rate": 9.997865794871207e-06, "loss": 1.1281, "step": 1683 }, { "epoch": 0.04, "learning_rate": 9.997854808776068e-06, "loss": 1.2324, "step": 1684 }, { "epoch": 0.04, "learning_rate": 9.997843794483373e-06, "loss": 1.0866, "step": 1685 }, { "epoch": 0.04, "learning_rate": 9.997832751993181e-06, "loss": 1.0339, "step": 1686 }, { "epoch": 0.04, "learning_rate": 9.997821681305559e-06, "loss": 1.1833, "step": 1687 }, { "epoch": 0.04, "learning_rate": 9.997810582420564e-06, "loss": 1.0435, "step": 1688 }, { "epoch": 0.04, "learning_rate": 9.997799455338265e-06, "loss": 1.3844, "step": 1689 }, { "epoch": 0.04, "learning_rate": 9.99778830005872e-06, "loss": 1.1712, "step": 1690 }, { "epoch": 0.04, "learning_rate": 9.997777116581993e-06, "loss": 1.0882, "step": 1691 }, { "epoch": 0.04, "learning_rate": 9.997765904908147e-06, "loss": 1.1345, "step": 1692 }, { "epoch": 0.04, "learning_rate": 9.997754665037248e-06, "loss": 1.06, "step": 1693 }, { "epoch": 0.04, "learning_rate": 9.997743396969355e-06, "loss": 1.2851, "step": 1694 }, { "epoch": 0.04, "learning_rate": 9.997732100704535e-06, "loss": 1.1428, "step": 1695 }, { "epoch": 0.04, "learning_rate": 9.99772077624285e-06, "loss": 1.2267, "step": 1696 }, { "epoch": 0.04, "learning_rate": 9.997709423584364e-06, "loss": 1.0831, "step": 1697 }, { "epoch": 0.04, "learning_rate": 9.997698042729142e-06, "loss": 1.2037, "step": 1698 }, { "epoch": 0.04, "learning_rate": 9.997686633677246e-06, "loss": 1.0108, "step": 1699 }, { "epoch": 0.04, "learning_rate": 9.997675196428744e-06, "loss": 1.1723, "step": 1700 }, { "epoch": 0.04, "learning_rate": 9.997663730983697e-06, "loss": 1.0526, "step": 1701 }, { "epoch": 0.04, "learning_rate": 9.997652237342172e-06, "loss": 0.9795, "step": 1702 }, { "epoch": 0.04, "learning_rate": 9.997640715504233e-06, "loss": 1.0566, "step": 1703 }, { "epoch": 0.04, "learning_rate": 9.997629165469944e-06, "loss": 0.8428, "step": 1704 }, { "epoch": 0.04, "learning_rate": 9.997617587239373e-06, "loss": 0.8144, "step": 1705 }, { "epoch": 0.04, "learning_rate": 9.997605980812581e-06, "loss": 1.0512, "step": 1706 }, { "epoch": 0.04, "learning_rate": 9.997594346189639e-06, "loss": 1.089, "step": 1707 }, { "epoch": 0.04, "learning_rate": 9.997582683370608e-06, "loss": 1.2316, "step": 1708 }, { "epoch": 0.04, "learning_rate": 9.997570992355554e-06, "loss": 0.9349, "step": 1709 }, { "epoch": 0.04, "learning_rate": 9.997559273144546e-06, "loss": 0.8211, "step": 1710 }, { "epoch": 0.04, "learning_rate": 9.99754752573765e-06, "loss": 1.3261, "step": 1711 }, { "epoch": 0.04, "learning_rate": 9.997535750134927e-06, "loss": 1.1056, "step": 1712 }, { "epoch": 0.04, "learning_rate": 9.997523946336452e-06, "loss": 1.1943, "step": 1713 }, { "epoch": 0.04, "learning_rate": 9.997512114342282e-06, "loss": 1.0583, "step": 1714 }, { "epoch": 0.04, "learning_rate": 9.997500254152492e-06, "loss": 1.1126, "step": 1715 }, { "epoch": 0.04, "learning_rate": 9.997488365767145e-06, "loss": 1.1053, "step": 1716 }, { "epoch": 0.04, "learning_rate": 9.997476449186307e-06, "loss": 1.0912, "step": 1717 }, { "epoch": 0.04, "learning_rate": 9.997464504410048e-06, "loss": 1.0763, "step": 1718 }, { "epoch": 0.04, "learning_rate": 9.997452531438435e-06, "loss": 1.0993, "step": 1719 }, { "epoch": 0.04, "learning_rate": 9.997440530271532e-06, "loss": 1.0673, "step": 1720 }, { "epoch": 0.04, "learning_rate": 9.997428500909412e-06, "loss": 1.142, "step": 1721 }, { "epoch": 0.04, "learning_rate": 9.99741644335214e-06, "loss": 1.3536, "step": 1722 }, { "epoch": 0.04, "learning_rate": 9.997404357599783e-06, "loss": 1.2241, "step": 1723 }, { "epoch": 0.04, "learning_rate": 9.997392243652412e-06, "loss": 1.1552, "step": 1724 }, { "epoch": 0.04, "learning_rate": 9.997380101510092e-06, "loss": 1.0507, "step": 1725 }, { "epoch": 0.04, "learning_rate": 9.997367931172896e-06, "loss": 1.3327, "step": 1726 }, { "epoch": 0.04, "learning_rate": 9.997355732640887e-06, "loss": 1.3671, "step": 1727 }, { "epoch": 0.04, "learning_rate": 9.99734350591414e-06, "loss": 1.2333, "step": 1728 }, { "epoch": 0.04, "learning_rate": 9.99733125099272e-06, "loss": 0.9654, "step": 1729 }, { "epoch": 0.04, "learning_rate": 9.997318967876696e-06, "loss": 1.2706, "step": 1730 }, { "epoch": 0.04, "learning_rate": 9.997306656566139e-06, "loss": 1.0961, "step": 1731 }, { "epoch": 0.04, "learning_rate": 9.997294317061117e-06, "loss": 1.1718, "step": 1732 }, { "epoch": 0.04, "learning_rate": 9.997281949361701e-06, "loss": 1.1424, "step": 1733 }, { "epoch": 0.04, "learning_rate": 9.99726955346796e-06, "loss": 1.1762, "step": 1734 }, { "epoch": 0.04, "learning_rate": 9.997257129379964e-06, "loss": 1.0383, "step": 1735 }, { "epoch": 0.04, "learning_rate": 9.997244677097784e-06, "loss": 1.4059, "step": 1736 }, { "epoch": 0.04, "learning_rate": 9.997232196621488e-06, "loss": 1.1816, "step": 1737 }, { "epoch": 0.04, "learning_rate": 9.997219687951149e-06, "loss": 1.2414, "step": 1738 }, { "epoch": 0.04, "learning_rate": 9.997207151086836e-06, "loss": 1.3517, "step": 1739 }, { "epoch": 0.04, "learning_rate": 9.99719458602862e-06, "loss": 0.9843, "step": 1740 }, { "epoch": 0.04, "learning_rate": 9.997181992776573e-06, "loss": 1.2251, "step": 1741 }, { "epoch": 0.04, "learning_rate": 9.997169371330764e-06, "loss": 1.0348, "step": 1742 }, { "epoch": 0.04, "learning_rate": 9.997156721691266e-06, "loss": 0.982, "step": 1743 }, { "epoch": 0.04, "learning_rate": 9.99714404385815e-06, "loss": 1.1031, "step": 1744 }, { "epoch": 0.04, "learning_rate": 9.997131337831486e-06, "loss": 1.3597, "step": 1745 }, { "epoch": 0.04, "learning_rate": 9.997118603611347e-06, "loss": 1.1512, "step": 1746 }, { "epoch": 0.04, "learning_rate": 9.997105841197805e-06, "loss": 1.2472, "step": 1747 }, { "epoch": 0.04, "learning_rate": 9.997093050590932e-06, "loss": 1.1115, "step": 1748 }, { "epoch": 0.04, "learning_rate": 9.9970802317908e-06, "loss": 1.2711, "step": 1749 }, { "epoch": 0.04, "learning_rate": 9.99706738479748e-06, "loss": 1.2757, "step": 1750 }, { "epoch": 0.04, "learning_rate": 9.997054509611047e-06, "loss": 1.1823, "step": 1751 }, { "epoch": 0.04, "learning_rate": 9.997041606231572e-06, "loss": 1.1148, "step": 1752 }, { "epoch": 0.04, "learning_rate": 9.99702867465913e-06, "loss": 1.1573, "step": 1753 }, { "epoch": 0.04, "learning_rate": 9.99701571489379e-06, "loss": 1.1023, "step": 1754 }, { "epoch": 0.04, "learning_rate": 9.997002726935627e-06, "loss": 1.1751, "step": 1755 }, { "epoch": 0.04, "learning_rate": 9.996989710784715e-06, "loss": 0.9811, "step": 1756 }, { "epoch": 0.04, "learning_rate": 9.996976666441127e-06, "loss": 1.0377, "step": 1757 }, { "epoch": 0.04, "learning_rate": 9.996963593904938e-06, "loss": 1.3181, "step": 1758 }, { "epoch": 0.04, "learning_rate": 9.996950493176218e-06, "loss": 1.443, "step": 1759 }, { "epoch": 0.04, "learning_rate": 9.996937364255045e-06, "loss": 1.0528, "step": 1760 }, { "epoch": 0.04, "learning_rate": 9.99692420714149e-06, "loss": 1.1089, "step": 1761 }, { "epoch": 0.04, "learning_rate": 9.99691102183563e-06, "loss": 1.1001, "step": 1762 }, { "epoch": 0.04, "learning_rate": 9.996897808337535e-06, "loss": 1.0787, "step": 1763 }, { "epoch": 0.04, "learning_rate": 9.996884566647287e-06, "loss": 1.0052, "step": 1764 }, { "epoch": 0.04, "learning_rate": 9.996871296764952e-06, "loss": 1.2313, "step": 1765 }, { "epoch": 0.04, "learning_rate": 9.99685799869061e-06, "loss": 1.0672, "step": 1766 }, { "epoch": 0.04, "learning_rate": 9.996844672424336e-06, "loss": 1.0775, "step": 1767 }, { "epoch": 0.04, "learning_rate": 9.996831317966204e-06, "loss": 1.1409, "step": 1768 }, { "epoch": 0.04, "learning_rate": 9.99681793531629e-06, "loss": 1.0899, "step": 1769 }, { "epoch": 0.04, "learning_rate": 9.996804524474668e-06, "loss": 1.173, "step": 1770 }, { "epoch": 0.04, "learning_rate": 9.996791085441415e-06, "loss": 1.0265, "step": 1771 }, { "epoch": 0.04, "learning_rate": 9.996777618216608e-06, "loss": 0.9377, "step": 1772 }, { "epoch": 0.04, "learning_rate": 9.99676412280032e-06, "loss": 1.2924, "step": 1773 }, { "epoch": 0.04, "learning_rate": 9.996750599192629e-06, "loss": 1.5154, "step": 1774 }, { "epoch": 0.04, "learning_rate": 9.996737047393613e-06, "loss": 0.9551, "step": 1775 }, { "epoch": 0.04, "learning_rate": 9.996723467403343e-06, "loss": 0.8921, "step": 1776 }, { "epoch": 0.04, "learning_rate": 9.9967098592219e-06, "loss": 1.0487, "step": 1777 }, { "epoch": 0.04, "learning_rate": 9.996696222849362e-06, "loss": 1.0403, "step": 1778 }, { "epoch": 0.04, "learning_rate": 9.996682558285802e-06, "loss": 1.1693, "step": 1779 }, { "epoch": 0.04, "learning_rate": 9.996668865531298e-06, "loss": 1.1696, "step": 1780 }, { "epoch": 0.04, "learning_rate": 9.99665514458593e-06, "loss": 1.1666, "step": 1781 }, { "epoch": 0.04, "learning_rate": 9.996641395449773e-06, "loss": 1.3049, "step": 1782 }, { "epoch": 0.04, "learning_rate": 9.996627618122905e-06, "loss": 1.2274, "step": 1783 }, { "epoch": 0.04, "learning_rate": 9.996613812605404e-06, "loss": 1.349, "step": 1784 }, { "epoch": 0.04, "learning_rate": 9.996599978897348e-06, "loss": 1.0914, "step": 1785 }, { "epoch": 0.04, "learning_rate": 9.996586116998815e-06, "loss": 1.2269, "step": 1786 }, { "epoch": 0.04, "learning_rate": 9.996572226909883e-06, "loss": 0.9203, "step": 1787 }, { "epoch": 0.04, "learning_rate": 9.996558308630629e-06, "loss": 1.2395, "step": 1788 }, { "epoch": 0.04, "learning_rate": 9.996544362161132e-06, "loss": 1.2504, "step": 1789 }, { "epoch": 0.04, "learning_rate": 9.996530387501473e-06, "loss": 1.0333, "step": 1790 }, { "epoch": 0.04, "learning_rate": 9.996516384651731e-06, "loss": 1.5018, "step": 1791 }, { "epoch": 0.04, "learning_rate": 9.996502353611982e-06, "loss": 1.3287, "step": 1792 }, { "epoch": 0.04, "learning_rate": 9.996488294382307e-06, "loss": 1.0323, "step": 1793 }, { "epoch": 0.04, "learning_rate": 9.996474206962782e-06, "loss": 1.0964, "step": 1794 }, { "epoch": 0.04, "learning_rate": 9.996460091353493e-06, "loss": 0.9505, "step": 1795 }, { "epoch": 0.04, "learning_rate": 9.996445947554516e-06, "loss": 1.0012, "step": 1796 }, { "epoch": 0.04, "learning_rate": 9.99643177556593e-06, "loss": 1.2589, "step": 1797 }, { "epoch": 0.04, "learning_rate": 9.996417575387815e-06, "loss": 0.9291, "step": 1798 }, { "epoch": 0.04, "learning_rate": 9.996403347020252e-06, "loss": 1.0675, "step": 1799 }, { "epoch": 0.04, "learning_rate": 9.996389090463322e-06, "loss": 1.2389, "step": 1800 }, { "epoch": 0.04, "learning_rate": 9.996374805717105e-06, "loss": 1.2279, "step": 1801 }, { "epoch": 0.04, "learning_rate": 9.99636049278168e-06, "loss": 0.9271, "step": 1802 }, { "epoch": 0.04, "learning_rate": 9.99634615165713e-06, "loss": 1.0847, "step": 1803 }, { "epoch": 0.04, "learning_rate": 9.996331782343534e-06, "loss": 1.2401, "step": 1804 }, { "epoch": 0.04, "learning_rate": 9.996317384840974e-06, "loss": 1.2019, "step": 1805 }, { "epoch": 0.04, "learning_rate": 9.996302959149532e-06, "loss": 1.1261, "step": 1806 }, { "epoch": 0.04, "learning_rate": 9.996288505269287e-06, "loss": 1.0577, "step": 1807 }, { "epoch": 0.04, "learning_rate": 9.996274023200322e-06, "loss": 1.1432, "step": 1808 }, { "epoch": 0.04, "learning_rate": 9.996259512942721e-06, "loss": 1.163, "step": 1809 }, { "epoch": 0.04, "learning_rate": 9.996244974496562e-06, "loss": 1.1661, "step": 1810 }, { "epoch": 0.04, "learning_rate": 9.996230407861929e-06, "loss": 1.0513, "step": 1811 }, { "epoch": 0.04, "learning_rate": 9.996215813038905e-06, "loss": 1.0899, "step": 1812 }, { "epoch": 0.04, "learning_rate": 9.99620119002757e-06, "loss": 0.8658, "step": 1813 }, { "epoch": 0.04, "learning_rate": 9.996186538828008e-06, "loss": 1.0287, "step": 1814 }, { "epoch": 0.04, "learning_rate": 9.996171859440301e-06, "loss": 0.9841, "step": 1815 }, { "epoch": 0.04, "learning_rate": 9.996157151864532e-06, "loss": 0.9829, "step": 1816 }, { "epoch": 0.04, "learning_rate": 9.996142416100786e-06, "loss": 1.0137, "step": 1817 }, { "epoch": 0.04, "learning_rate": 9.996127652149143e-06, "loss": 1.2009, "step": 1818 }, { "epoch": 0.04, "learning_rate": 9.996112860009689e-06, "loss": 1.1839, "step": 1819 }, { "epoch": 0.04, "learning_rate": 9.996098039682503e-06, "loss": 1.0313, "step": 1820 }, { "epoch": 0.04, "learning_rate": 9.996083191167673e-06, "loss": 1.2684, "step": 1821 }, { "epoch": 0.04, "learning_rate": 9.996068314465283e-06, "loss": 1.1696, "step": 1822 }, { "epoch": 0.04, "learning_rate": 9.996053409575415e-06, "loss": 0.9913, "step": 1823 }, { "epoch": 0.04, "learning_rate": 9.996038476498152e-06, "loss": 1.1932, "step": 1824 }, { "epoch": 0.04, "learning_rate": 9.996023515233582e-06, "loss": 1.2449, "step": 1825 }, { "epoch": 0.04, "learning_rate": 9.996008525781784e-06, "loss": 1.1002, "step": 1826 }, { "epoch": 0.04, "learning_rate": 9.995993508142849e-06, "loss": 0.9011, "step": 1827 }, { "epoch": 0.04, "learning_rate": 9.995978462316856e-06, "loss": 1.159, "step": 1828 }, { "epoch": 0.04, "learning_rate": 9.995963388303894e-06, "loss": 1.0621, "step": 1829 }, { "epoch": 0.04, "learning_rate": 9.995948286104045e-06, "loss": 1.0939, "step": 1830 }, { "epoch": 0.04, "learning_rate": 9.995933155717396e-06, "loss": 1.1561, "step": 1831 }, { "epoch": 0.04, "learning_rate": 9.995917997144033e-06, "loss": 0.9246, "step": 1832 }, { "epoch": 0.04, "learning_rate": 9.99590281038404e-06, "loss": 1.2417, "step": 1833 }, { "epoch": 0.04, "learning_rate": 9.995887595437504e-06, "loss": 1.1474, "step": 1834 }, { "epoch": 0.04, "learning_rate": 9.995872352304508e-06, "loss": 1.384, "step": 1835 }, { "epoch": 0.04, "learning_rate": 9.995857080985141e-06, "loss": 1.2156, "step": 1836 }, { "epoch": 0.04, "learning_rate": 9.995841781479487e-06, "loss": 0.9738, "step": 1837 }, { "epoch": 0.04, "learning_rate": 9.995826453787637e-06, "loss": 1.4743, "step": 1838 }, { "epoch": 0.04, "learning_rate": 9.995811097909668e-06, "loss": 0.9338, "step": 1839 }, { "epoch": 0.04, "learning_rate": 9.995795713845678e-06, "loss": 1.2243, "step": 1840 }, { "epoch": 0.04, "learning_rate": 9.995780301595746e-06, "loss": 1.0983, "step": 1841 }, { "epoch": 0.04, "learning_rate": 9.995764861159963e-06, "loss": 1.0417, "step": 1842 }, { "epoch": 0.04, "learning_rate": 9.995749392538413e-06, "loss": 0.8932, "step": 1843 }, { "epoch": 0.04, "learning_rate": 9.995733895731186e-06, "loss": 1.2428, "step": 1844 }, { "epoch": 0.04, "learning_rate": 9.995718370738366e-06, "loss": 0.9122, "step": 1845 }, { "epoch": 0.04, "learning_rate": 9.995702817560045e-06, "loss": 1.076, "step": 1846 }, { "epoch": 0.04, "learning_rate": 9.995687236196307e-06, "loss": 1.184, "step": 1847 }, { "epoch": 0.04, "learning_rate": 9.995671626647242e-06, "loss": 0.9664, "step": 1848 }, { "epoch": 0.04, "learning_rate": 9.995655988912938e-06, "loss": 1.031, "step": 1849 }, { "epoch": 0.04, "learning_rate": 9.995640322993482e-06, "loss": 1.1795, "step": 1850 }, { "epoch": 0.04, "learning_rate": 9.995624628888963e-06, "loss": 1.1608, "step": 1851 }, { "epoch": 0.04, "learning_rate": 9.99560890659947e-06, "loss": 1.1101, "step": 1852 }, { "epoch": 0.04, "learning_rate": 9.995593156125091e-06, "loss": 1.0451, "step": 1853 }, { "epoch": 0.04, "learning_rate": 9.995577377465916e-06, "loss": 1.1053, "step": 1854 }, { "epoch": 0.04, "learning_rate": 9.995561570622032e-06, "loss": 1.1353, "step": 1855 }, { "epoch": 0.04, "learning_rate": 9.995545735593531e-06, "loss": 1.0726, "step": 1856 }, { "epoch": 0.04, "learning_rate": 9.9955298723805e-06, "loss": 1.1387, "step": 1857 }, { "epoch": 0.04, "learning_rate": 9.995513980983029e-06, "loss": 1.3367, "step": 1858 }, { "epoch": 0.04, "learning_rate": 9.995498061401207e-06, "loss": 1.2795, "step": 1859 }, { "epoch": 0.04, "learning_rate": 9.995482113635127e-06, "loss": 1.0236, "step": 1860 }, { "epoch": 0.04, "learning_rate": 9.995466137684875e-06, "loss": 1.4444, "step": 1861 }, { "epoch": 0.04, "learning_rate": 9.995450133550544e-06, "loss": 1.1237, "step": 1862 }, { "epoch": 0.04, "learning_rate": 9.995434101232222e-06, "loss": 1.3173, "step": 1863 }, { "epoch": 0.04, "learning_rate": 9.995418040730001e-06, "loss": 0.9999, "step": 1864 }, { "epoch": 0.04, "learning_rate": 9.995401952043972e-06, "loss": 1.0887, "step": 1865 }, { "epoch": 0.04, "learning_rate": 9.995385835174223e-06, "loss": 1.2018, "step": 1866 }, { "epoch": 0.04, "learning_rate": 9.995369690120849e-06, "loss": 0.9045, "step": 1867 }, { "epoch": 0.04, "learning_rate": 9.995353516883939e-06, "loss": 1.1763, "step": 1868 }, { "epoch": 0.04, "learning_rate": 9.995337315463583e-06, "loss": 1.1612, "step": 1869 }, { "epoch": 0.04, "learning_rate": 9.995321085859874e-06, "loss": 1.0112, "step": 1870 }, { "epoch": 0.04, "learning_rate": 9.995304828072902e-06, "loss": 1.1033, "step": 1871 }, { "epoch": 0.04, "learning_rate": 9.995288542102763e-06, "loss": 0.949, "step": 1872 }, { "epoch": 0.04, "learning_rate": 9.995272227949543e-06, "loss": 1.2116, "step": 1873 }, { "epoch": 0.04, "learning_rate": 9.995255885613337e-06, "loss": 1.0379, "step": 1874 }, { "epoch": 0.04, "learning_rate": 9.995239515094239e-06, "loss": 1.0963, "step": 1875 }, { "epoch": 0.04, "learning_rate": 9.995223116392339e-06, "loss": 1.3267, "step": 1876 }, { "epoch": 0.04, "learning_rate": 9.99520668950773e-06, "loss": 1.199, "step": 1877 }, { "epoch": 0.04, "learning_rate": 9.995190234440503e-06, "loss": 1.0717, "step": 1878 }, { "epoch": 0.04, "learning_rate": 9.995173751190754e-06, "loss": 0.9125, "step": 1879 }, { "epoch": 0.04, "learning_rate": 9.995157239758574e-06, "loss": 1.0851, "step": 1880 }, { "epoch": 0.04, "learning_rate": 9.995140700144058e-06, "loss": 1.3378, "step": 1881 }, { "epoch": 0.04, "learning_rate": 9.995124132347295e-06, "loss": 1.025, "step": 1882 }, { "epoch": 0.04, "learning_rate": 9.995107536368382e-06, "loss": 1.3211, "step": 1883 }, { "epoch": 0.04, "learning_rate": 9.995090912207414e-06, "loss": 1.1258, "step": 1884 }, { "epoch": 0.04, "learning_rate": 9.995074259864481e-06, "loss": 1.2906, "step": 1885 }, { "epoch": 0.04, "learning_rate": 9.99505757933968e-06, "loss": 1.1542, "step": 1886 }, { "epoch": 0.04, "learning_rate": 9.995040870633104e-06, "loss": 1.2236, "step": 1887 }, { "epoch": 0.04, "learning_rate": 9.995024133744846e-06, "loss": 0.7421, "step": 1888 }, { "epoch": 0.04, "learning_rate": 9.995007368675003e-06, "loss": 0.8333, "step": 1889 }, { "epoch": 0.04, "learning_rate": 9.994990575423667e-06, "loss": 1.1252, "step": 1890 }, { "epoch": 0.04, "learning_rate": 9.994973753990935e-06, "loss": 1.0842, "step": 1891 }, { "epoch": 0.04, "learning_rate": 9.9949569043769e-06, "loss": 0.9036, "step": 1892 }, { "epoch": 0.04, "learning_rate": 9.994940026581658e-06, "loss": 0.9496, "step": 1893 }, { "epoch": 0.04, "learning_rate": 9.994923120605304e-06, "loss": 0.9891, "step": 1894 }, { "epoch": 0.04, "learning_rate": 9.994906186447935e-06, "loss": 1.1851, "step": 1895 }, { "epoch": 0.04, "learning_rate": 9.994889224109642e-06, "loss": 1.0457, "step": 1896 }, { "epoch": 0.04, "learning_rate": 9.994872233590526e-06, "loss": 0.9502, "step": 1897 }, { "epoch": 0.04, "learning_rate": 9.994855214890682e-06, "loss": 1.2144, "step": 1898 }, { "epoch": 0.04, "learning_rate": 9.994838168010202e-06, "loss": 1.1694, "step": 1899 }, { "epoch": 0.04, "learning_rate": 9.994821092949185e-06, "loss": 1.2106, "step": 1900 }, { "epoch": 0.04, "learning_rate": 9.994803989707729e-06, "loss": 1.1402, "step": 1901 }, { "epoch": 0.04, "learning_rate": 9.994786858285927e-06, "loss": 1.1327, "step": 1902 }, { "epoch": 0.04, "learning_rate": 9.994769698683878e-06, "loss": 1.3715, "step": 1903 }, { "epoch": 0.04, "learning_rate": 9.994752510901678e-06, "loss": 1.2256, "step": 1904 }, { "epoch": 0.04, "learning_rate": 9.994735294939422e-06, "loss": 1.34, "step": 1905 }, { "epoch": 0.04, "learning_rate": 9.994718050797212e-06, "loss": 1.1695, "step": 1906 }, { "epoch": 0.04, "learning_rate": 9.994700778475142e-06, "loss": 1.2509, "step": 1907 }, { "epoch": 0.04, "learning_rate": 9.994683477973309e-06, "loss": 1.0569, "step": 1908 }, { "epoch": 0.04, "learning_rate": 9.994666149291811e-06, "loss": 1.2498, "step": 1909 }, { "epoch": 0.04, "learning_rate": 9.99464879243075e-06, "loss": 1.0959, "step": 1910 }, { "epoch": 0.04, "learning_rate": 9.994631407390215e-06, "loss": 1.1604, "step": 1911 }, { "epoch": 0.04, "learning_rate": 9.994613994170313e-06, "loss": 1.3578, "step": 1912 }, { "epoch": 0.04, "learning_rate": 9.994596552771138e-06, "loss": 1.138, "step": 1913 }, { "epoch": 0.04, "learning_rate": 9.994579083192788e-06, "loss": 1.5569, "step": 1914 }, { "epoch": 0.04, "learning_rate": 9.994561585435364e-06, "loss": 1.1807, "step": 1915 }, { "epoch": 0.04, "learning_rate": 9.994544059498963e-06, "loss": 1.0572, "step": 1916 }, { "epoch": 0.04, "learning_rate": 9.994526505383682e-06, "loss": 0.9038, "step": 1917 }, { "epoch": 0.04, "learning_rate": 9.994508923089624e-06, "loss": 1.278, "step": 1918 }, { "epoch": 0.04, "learning_rate": 9.994491312616887e-06, "loss": 1.0921, "step": 1919 }, { "epoch": 0.04, "learning_rate": 9.994473673965568e-06, "loss": 0.9022, "step": 1920 }, { "epoch": 0.04, "learning_rate": 9.994456007135768e-06, "loss": 1.0638, "step": 1921 }, { "epoch": 0.04, "learning_rate": 9.99443831212759e-06, "loss": 1.0533, "step": 1922 }, { "epoch": 0.04, "learning_rate": 9.994420588941129e-06, "loss": 1.3979, "step": 1923 }, { "epoch": 0.04, "learning_rate": 9.994402837576486e-06, "loss": 1.1208, "step": 1924 }, { "epoch": 0.04, "learning_rate": 9.994385058033762e-06, "loss": 1.2388, "step": 1925 }, { "epoch": 0.04, "learning_rate": 9.994367250313057e-06, "loss": 1.2068, "step": 1926 }, { "epoch": 0.04, "learning_rate": 9.994349414414474e-06, "loss": 1.0933, "step": 1927 }, { "epoch": 0.04, "learning_rate": 9.99433155033811e-06, "loss": 1.1899, "step": 1928 }, { "epoch": 0.04, "learning_rate": 9.994313658084067e-06, "loss": 1.0026, "step": 1929 }, { "epoch": 0.04, "learning_rate": 9.994295737652443e-06, "loss": 1.0185, "step": 1930 }, { "epoch": 0.04, "learning_rate": 9.994277789043348e-06, "loss": 1.2305, "step": 1931 }, { "epoch": 0.04, "learning_rate": 9.994259812256874e-06, "loss": 0.9932, "step": 1932 }, { "epoch": 0.04, "learning_rate": 9.994241807293126e-06, "loss": 1.2554, "step": 1933 }, { "epoch": 0.04, "learning_rate": 9.994223774152206e-06, "loss": 1.1399, "step": 1934 }, { "epoch": 0.04, "learning_rate": 9.994205712834214e-06, "loss": 0.8776, "step": 1935 }, { "epoch": 0.04, "learning_rate": 9.994187623339255e-06, "loss": 1.0796, "step": 1936 }, { "epoch": 0.04, "learning_rate": 9.994169505667428e-06, "loss": 1.0299, "step": 1937 }, { "epoch": 0.04, "learning_rate": 9.994151359818836e-06, "loss": 1.0449, "step": 1938 }, { "epoch": 0.04, "learning_rate": 9.994133185793582e-06, "loss": 1.3916, "step": 1939 }, { "epoch": 0.04, "learning_rate": 9.994114983591768e-06, "loss": 0.756, "step": 1940 }, { "epoch": 0.05, "learning_rate": 9.994096753213498e-06, "loss": 1.0101, "step": 1941 }, { "epoch": 0.05, "learning_rate": 9.994078494658874e-06, "loss": 1.0675, "step": 1942 }, { "epoch": 0.05, "learning_rate": 9.994060207927998e-06, "loss": 1.0577, "step": 1943 }, { "epoch": 0.05, "learning_rate": 9.994041893020973e-06, "loss": 1.2699, "step": 1944 }, { "epoch": 0.05, "learning_rate": 9.994023549937905e-06, "loss": 1.2352, "step": 1945 }, { "epoch": 0.05, "learning_rate": 9.994005178678895e-06, "loss": 1.2628, "step": 1946 }, { "epoch": 0.05, "learning_rate": 9.993986779244048e-06, "loss": 1.161, "step": 1947 }, { "epoch": 0.05, "learning_rate": 9.993968351633467e-06, "loss": 0.9045, "step": 1948 }, { "epoch": 0.05, "learning_rate": 9.993949895847256e-06, "loss": 1.2757, "step": 1949 }, { "epoch": 0.05, "learning_rate": 9.99393141188552e-06, "loss": 1.4167, "step": 1950 }, { "epoch": 0.05, "learning_rate": 9.993912899748362e-06, "loss": 1.0599, "step": 1951 }, { "epoch": 0.05, "learning_rate": 9.993894359435888e-06, "loss": 0.8049, "step": 1952 }, { "epoch": 0.05, "learning_rate": 9.9938757909482e-06, "loss": 0.8213, "step": 1953 }, { "epoch": 0.05, "learning_rate": 9.993857194285406e-06, "loss": 1.1746, "step": 1954 }, { "epoch": 0.05, "learning_rate": 9.993838569447609e-06, "loss": 1.0356, "step": 1955 }, { "epoch": 0.05, "learning_rate": 9.993819916434915e-06, "loss": 0.8958, "step": 1956 }, { "epoch": 0.05, "learning_rate": 9.993801235247428e-06, "loss": 1.2381, "step": 1957 }, { "epoch": 0.05, "learning_rate": 9.993782525885254e-06, "loss": 1.0052, "step": 1958 }, { "epoch": 0.05, "learning_rate": 9.993763788348498e-06, "loss": 1.0044, "step": 1959 }, { "epoch": 0.05, "learning_rate": 9.99374502263727e-06, "loss": 1.3164, "step": 1960 }, { "epoch": 0.05, "learning_rate": 9.993726228751668e-06, "loss": 1.0679, "step": 1961 }, { "epoch": 0.05, "learning_rate": 9.993707406691804e-06, "loss": 0.8509, "step": 1962 }, { "epoch": 0.05, "learning_rate": 9.993688556457782e-06, "loss": 1.044, "step": 1963 }, { "epoch": 0.05, "learning_rate": 9.993669678049709e-06, "loss": 1.2671, "step": 1964 }, { "epoch": 0.05, "learning_rate": 9.993650771467692e-06, "loss": 1.1239, "step": 1965 }, { "epoch": 0.05, "learning_rate": 9.993631836711837e-06, "loss": 1.2872, "step": 1966 }, { "epoch": 0.05, "learning_rate": 9.993612873782251e-06, "loss": 1.2605, "step": 1967 }, { "epoch": 0.05, "learning_rate": 9.99359388267904e-06, "loss": 0.9449, "step": 1968 }, { "epoch": 0.05, "learning_rate": 9.99357486340231e-06, "loss": 1.3128, "step": 1969 }, { "epoch": 0.05, "learning_rate": 9.993555815952173e-06, "loss": 0.7963, "step": 1970 }, { "epoch": 0.05, "learning_rate": 9.993536740328734e-06, "loss": 1.2249, "step": 1971 }, { "epoch": 0.05, "learning_rate": 9.9935176365321e-06, "loss": 1.1477, "step": 1972 }, { "epoch": 0.05, "learning_rate": 9.993498504562378e-06, "loss": 1.1306, "step": 1973 }, { "epoch": 0.05, "learning_rate": 9.993479344419679e-06, "loss": 1.2001, "step": 1974 }, { "epoch": 0.05, "learning_rate": 9.993460156104107e-06, "loss": 1.1193, "step": 1975 }, { "epoch": 0.05, "learning_rate": 9.993440939615774e-06, "loss": 0.9083, "step": 1976 }, { "epoch": 0.05, "learning_rate": 9.993421694954786e-06, "loss": 1.0803, "step": 1977 }, { "epoch": 0.05, "learning_rate": 9.993402422121253e-06, "loss": 1.1623, "step": 1978 }, { "epoch": 0.05, "learning_rate": 9.993383121115283e-06, "loss": 1.3604, "step": 1979 }, { "epoch": 0.05, "learning_rate": 9.993363791936985e-06, "loss": 1.1272, "step": 1980 }, { "epoch": 0.05, "learning_rate": 9.99334443458647e-06, "loss": 1.1441, "step": 1981 }, { "epoch": 0.05, "learning_rate": 9.993325049063843e-06, "loss": 1.0917, "step": 1982 }, { "epoch": 0.05, "learning_rate": 9.993305635369216e-06, "loss": 1.1146, "step": 1983 }, { "epoch": 0.05, "learning_rate": 9.993286193502698e-06, "loss": 1.1194, "step": 1984 }, { "epoch": 0.05, "learning_rate": 9.9932667234644e-06, "loss": 1.2163, "step": 1985 }, { "epoch": 0.05, "learning_rate": 9.99324722525443e-06, "loss": 0.9606, "step": 1986 }, { "epoch": 0.05, "learning_rate": 9.993227698872899e-06, "loss": 1.2377, "step": 1987 }, { "epoch": 0.05, "learning_rate": 9.993208144319918e-06, "loss": 0.8312, "step": 1988 }, { "epoch": 0.05, "learning_rate": 9.993188561595595e-06, "loss": 1.2628, "step": 1989 }, { "epoch": 0.05, "learning_rate": 9.993168950700041e-06, "loss": 1.0521, "step": 1990 }, { "epoch": 0.05, "learning_rate": 9.993149311633369e-06, "loss": 1.3335, "step": 1991 }, { "epoch": 0.05, "learning_rate": 9.993129644395687e-06, "loss": 0.8724, "step": 1992 }, { "epoch": 0.05, "learning_rate": 9.993109948987109e-06, "loss": 0.9841, "step": 1993 }, { "epoch": 0.05, "learning_rate": 9.993090225407743e-06, "loss": 0.8383, "step": 1994 }, { "epoch": 0.05, "learning_rate": 9.993070473657702e-06, "loss": 1.1362, "step": 1995 }, { "epoch": 0.05, "learning_rate": 9.993050693737096e-06, "loss": 1.1529, "step": 1996 }, { "epoch": 0.05, "learning_rate": 9.99303088564604e-06, "loss": 1.2843, "step": 1997 }, { "epoch": 0.05, "learning_rate": 9.99301104938464e-06, "loss": 1.1596, "step": 1998 }, { "epoch": 0.05, "learning_rate": 9.992991184953013e-06, "loss": 1.0519, "step": 1999 }, { "epoch": 0.05, "learning_rate": 9.99297129235127e-06, "loss": 1.154, "step": 2000 }, { "epoch": 0.05, "learning_rate": 9.992951371579522e-06, "loss": 1.1055, "step": 2001 }, { "epoch": 0.05, "learning_rate": 9.992931422637882e-06, "loss": 1.0284, "step": 2002 }, { "epoch": 0.05, "learning_rate": 9.992911445526463e-06, "loss": 0.9887, "step": 2003 }, { "epoch": 0.05, "learning_rate": 9.992891440245377e-06, "loss": 0.9823, "step": 2004 }, { "epoch": 0.05, "learning_rate": 9.992871406794737e-06, "loss": 1.0888, "step": 2005 }, { "epoch": 0.05, "learning_rate": 9.992851345174657e-06, "loss": 0.9502, "step": 2006 }, { "epoch": 0.05, "learning_rate": 9.992831255385247e-06, "loss": 1.0603, "step": 2007 }, { "epoch": 0.05, "learning_rate": 9.992811137426624e-06, "loss": 1.0717, "step": 2008 }, { "epoch": 0.05, "learning_rate": 9.9927909912989e-06, "loss": 1.3487, "step": 2009 }, { "epoch": 0.05, "learning_rate": 9.99277081700219e-06, "loss": 1.2958, "step": 2010 }, { "epoch": 0.05, "learning_rate": 9.992750614536606e-06, "loss": 1.1667, "step": 2011 }, { "epoch": 0.05, "learning_rate": 9.992730383902263e-06, "loss": 1.064, "step": 2012 }, { "epoch": 0.05, "learning_rate": 9.992710125099273e-06, "loss": 1.1557, "step": 2013 }, { "epoch": 0.05, "learning_rate": 9.992689838127754e-06, "loss": 0.9379, "step": 2014 }, { "epoch": 0.05, "learning_rate": 9.992669522987817e-06, "loss": 1.2097, "step": 2015 }, { "epoch": 0.05, "learning_rate": 9.992649179679578e-06, "loss": 1.1774, "step": 2016 }, { "epoch": 0.05, "learning_rate": 9.992628808203153e-06, "loss": 1.0527, "step": 2017 }, { "epoch": 0.05, "learning_rate": 9.992608408558658e-06, "loss": 0.8915, "step": 2018 }, { "epoch": 0.05, "learning_rate": 9.992587980746203e-06, "loss": 1.0963, "step": 2019 }, { "epoch": 0.05, "learning_rate": 9.992567524765906e-06, "loss": 0.7738, "step": 2020 }, { "epoch": 0.05, "learning_rate": 9.992547040617884e-06, "loss": 0.9813, "step": 2021 }, { "epoch": 0.05, "learning_rate": 9.992526528302251e-06, "loss": 1.3223, "step": 2022 }, { "epoch": 0.05, "learning_rate": 9.992505987819122e-06, "loss": 1.2647, "step": 2023 }, { "epoch": 0.05, "learning_rate": 9.992485419168613e-06, "loss": 1.1395, "step": 2024 }, { "epoch": 0.05, "learning_rate": 9.992464822350844e-06, "loss": 1.2276, "step": 2025 }, { "epoch": 0.05, "learning_rate": 9.992444197365925e-06, "loss": 1.2221, "step": 2026 }, { "epoch": 0.05, "learning_rate": 9.992423544213978e-06, "loss": 1.225, "step": 2027 }, { "epoch": 0.05, "learning_rate": 9.992402862895115e-06, "loss": 0.9969, "step": 2028 }, { "epoch": 0.05, "learning_rate": 9.992382153409456e-06, "loss": 1.1601, "step": 2029 }, { "epoch": 0.05, "learning_rate": 9.992361415757116e-06, "loss": 1.2298, "step": 2030 }, { "epoch": 0.05, "learning_rate": 9.992340649938213e-06, "loss": 1.4933, "step": 2031 }, { "epoch": 0.05, "learning_rate": 9.992319855952861e-06, "loss": 0.9225, "step": 2032 }, { "epoch": 0.05, "learning_rate": 9.992299033801183e-06, "loss": 1.2912, "step": 2033 }, { "epoch": 0.05, "learning_rate": 9.992278183483293e-06, "loss": 1.1703, "step": 2034 }, { "epoch": 0.05, "learning_rate": 9.992257304999307e-06, "loss": 1.2394, "step": 2035 }, { "epoch": 0.05, "learning_rate": 9.992236398349347e-06, "loss": 1.1373, "step": 2036 }, { "epoch": 0.05, "learning_rate": 9.992215463533527e-06, "loss": 0.9021, "step": 2037 }, { "epoch": 0.05, "learning_rate": 9.992194500551968e-06, "loss": 1.0109, "step": 2038 }, { "epoch": 0.05, "learning_rate": 9.992173509404788e-06, "loss": 1.1587, "step": 2039 }, { "epoch": 0.05, "learning_rate": 9.992152490092104e-06, "loss": 0.9716, "step": 2040 }, { "epoch": 0.05, "learning_rate": 9.992131442614034e-06, "loss": 0.958, "step": 2041 }, { "epoch": 0.05, "learning_rate": 9.9921103669707e-06, "loss": 1.115, "step": 2042 }, { "epoch": 0.05, "learning_rate": 9.992089263162217e-06, "loss": 1.042, "step": 2043 }, { "epoch": 0.05, "learning_rate": 9.992068131188708e-06, "loss": 0.7266, "step": 2044 }, { "epoch": 0.05, "learning_rate": 9.992046971050288e-06, "loss": 1.2457, "step": 2045 }, { "epoch": 0.05, "learning_rate": 9.992025782747079e-06, "loss": 0.9046, "step": 2046 }, { "epoch": 0.05, "learning_rate": 9.9920045662792e-06, "loss": 1.326, "step": 2047 }, { "epoch": 0.05, "learning_rate": 9.991983321646773e-06, "loss": 1.3182, "step": 2048 }, { "epoch": 0.05, "learning_rate": 9.991962048849914e-06, "loss": 1.0877, "step": 2049 }, { "epoch": 0.05, "learning_rate": 9.991940747888745e-06, "loss": 1.1882, "step": 2050 }, { "epoch": 0.05, "learning_rate": 9.991919418763386e-06, "loss": 0.8664, "step": 2051 }, { "epoch": 0.05, "learning_rate": 9.991898061473956e-06, "loss": 1.2978, "step": 2052 }, { "epoch": 0.05, "learning_rate": 9.991876676020577e-06, "loss": 1.0102, "step": 2053 }, { "epoch": 0.05, "learning_rate": 9.991855262403369e-06, "loss": 1.115, "step": 2054 }, { "epoch": 0.05, "learning_rate": 9.991833820622455e-06, "loss": 1.0636, "step": 2055 }, { "epoch": 0.05, "learning_rate": 9.991812350677953e-06, "loss": 1.0674, "step": 2056 }, { "epoch": 0.05, "learning_rate": 9.991790852569985e-06, "loss": 1.1631, "step": 2057 }, { "epoch": 0.05, "learning_rate": 9.991769326298672e-06, "loss": 1.3359, "step": 2058 }, { "epoch": 0.05, "learning_rate": 9.991747771864138e-06, "loss": 1.2151, "step": 2059 }, { "epoch": 0.05, "learning_rate": 9.991726189266502e-06, "loss": 0.9383, "step": 2060 }, { "epoch": 0.05, "learning_rate": 9.991704578505885e-06, "loss": 1.0464, "step": 2061 }, { "epoch": 0.05, "learning_rate": 9.991682939582412e-06, "loss": 1.0672, "step": 2062 }, { "epoch": 0.05, "learning_rate": 9.991661272496203e-06, "loss": 0.8612, "step": 2063 }, { "epoch": 0.05, "learning_rate": 9.99163957724738e-06, "loss": 1.2698, "step": 2064 }, { "epoch": 0.05, "learning_rate": 9.991617853836066e-06, "loss": 0.939, "step": 2065 }, { "epoch": 0.05, "learning_rate": 9.991596102262384e-06, "loss": 0.8037, "step": 2066 }, { "epoch": 0.05, "learning_rate": 9.991574322526456e-06, "loss": 1.2209, "step": 2067 }, { "epoch": 0.05, "learning_rate": 9.991552514628406e-06, "loss": 1.0281, "step": 2068 }, { "epoch": 0.05, "learning_rate": 9.991530678568355e-06, "loss": 0.9021, "step": 2069 }, { "epoch": 0.05, "learning_rate": 9.991508814346428e-06, "loss": 1.2871, "step": 2070 }, { "epoch": 0.05, "learning_rate": 9.991486921962748e-06, "loss": 0.9722, "step": 2071 }, { "epoch": 0.05, "learning_rate": 9.991465001417437e-06, "loss": 1.2363, "step": 2072 }, { "epoch": 0.05, "learning_rate": 9.991443052710621e-06, "loss": 1.1228, "step": 2073 }, { "epoch": 0.05, "learning_rate": 9.991421075842425e-06, "loss": 1.0646, "step": 2074 }, { "epoch": 0.05, "learning_rate": 9.991399070812969e-06, "loss": 1.0453, "step": 2075 }, { "epoch": 0.05, "learning_rate": 9.991377037622377e-06, "loss": 0.804, "step": 2076 }, { "epoch": 0.05, "learning_rate": 9.991354976270778e-06, "loss": 1.1507, "step": 2077 }, { "epoch": 0.05, "learning_rate": 9.991332886758292e-06, "loss": 1.1822, "step": 2078 }, { "epoch": 0.05, "learning_rate": 9.991310769085046e-06, "loss": 0.8814, "step": 2079 }, { "epoch": 0.05, "learning_rate": 9.991288623251165e-06, "loss": 1.2203, "step": 2080 }, { "epoch": 0.05, "learning_rate": 9.99126644925677e-06, "loss": 1.1361, "step": 2081 }, { "epoch": 0.05, "learning_rate": 9.991244247101993e-06, "loss": 1.1301, "step": 2082 }, { "epoch": 0.05, "learning_rate": 9.991222016786955e-06, "loss": 1.1419, "step": 2083 }, { "epoch": 0.05, "learning_rate": 9.99119975831178e-06, "loss": 1.0344, "step": 2084 }, { "epoch": 0.05, "learning_rate": 9.991177471676596e-06, "loss": 1.0829, "step": 2085 }, { "epoch": 0.05, "learning_rate": 9.991155156881529e-06, "loss": 1.0765, "step": 2086 }, { "epoch": 0.05, "learning_rate": 9.991132813926704e-06, "loss": 0.9184, "step": 2087 }, { "epoch": 0.05, "learning_rate": 9.991110442812246e-06, "loss": 1.055, "step": 2088 }, { "epoch": 0.05, "learning_rate": 9.991088043538283e-06, "loss": 1.1061, "step": 2089 }, { "epoch": 0.05, "learning_rate": 9.991065616104943e-06, "loss": 1.2927, "step": 2090 }, { "epoch": 0.05, "learning_rate": 9.991043160512348e-06, "loss": 1.2675, "step": 2091 }, { "epoch": 0.05, "learning_rate": 9.991020676760625e-06, "loss": 1.2052, "step": 2092 }, { "epoch": 0.05, "learning_rate": 9.990998164849905e-06, "loss": 1.2036, "step": 2093 }, { "epoch": 0.05, "learning_rate": 9.990975624780314e-06, "loss": 0.9615, "step": 2094 }, { "epoch": 0.05, "learning_rate": 9.990953056551978e-06, "loss": 1.0458, "step": 2095 }, { "epoch": 0.05, "learning_rate": 9.990930460165023e-06, "loss": 1.352, "step": 2096 }, { "epoch": 0.05, "learning_rate": 9.990907835619577e-06, "loss": 1.105, "step": 2097 }, { "epoch": 0.05, "learning_rate": 9.99088518291577e-06, "loss": 0.9112, "step": 2098 }, { "epoch": 0.05, "learning_rate": 9.990862502053728e-06, "loss": 1.2023, "step": 2099 }, { "epoch": 0.05, "learning_rate": 9.990839793033578e-06, "loss": 1.2435, "step": 2100 }, { "epoch": 0.05, "learning_rate": 9.99081705585545e-06, "loss": 1.0922, "step": 2101 }, { "epoch": 0.05, "learning_rate": 9.990794290519473e-06, "loss": 1.2501, "step": 2102 }, { "epoch": 0.05, "learning_rate": 9.990771497025772e-06, "loss": 1.0168, "step": 2103 }, { "epoch": 0.05, "learning_rate": 9.99074867537448e-06, "loss": 1.2843, "step": 2104 }, { "epoch": 0.05, "learning_rate": 9.990725825565723e-06, "loss": 1.1295, "step": 2105 }, { "epoch": 0.05, "learning_rate": 9.990702947599629e-06, "loss": 1.3312, "step": 2106 }, { "epoch": 0.05, "learning_rate": 9.99068004147633e-06, "loss": 0.8271, "step": 2107 }, { "epoch": 0.05, "learning_rate": 9.990657107195951e-06, "loss": 0.9828, "step": 2108 }, { "epoch": 0.05, "learning_rate": 9.990634144758627e-06, "loss": 0.9523, "step": 2109 }, { "epoch": 0.05, "learning_rate": 9.990611154164483e-06, "loss": 0.9791, "step": 2110 }, { "epoch": 0.05, "learning_rate": 9.99058813541365e-06, "loss": 1.392, "step": 2111 }, { "epoch": 0.05, "learning_rate": 9.99056508850626e-06, "loss": 1.089, "step": 2112 }, { "epoch": 0.05, "learning_rate": 9.99054201344244e-06, "loss": 1.0258, "step": 2113 }, { "epoch": 0.05, "learning_rate": 9.990518910222323e-06, "loss": 1.3651, "step": 2114 }, { "epoch": 0.05, "learning_rate": 9.990495778846036e-06, "loss": 1.2203, "step": 2115 }, { "epoch": 0.05, "learning_rate": 9.990472619313712e-06, "loss": 1.0976, "step": 2116 }, { "epoch": 0.05, "learning_rate": 9.99044943162548e-06, "loss": 1.0162, "step": 2117 }, { "epoch": 0.05, "learning_rate": 9.990426215781472e-06, "loss": 1.4532, "step": 2118 }, { "epoch": 0.05, "learning_rate": 9.990402971781819e-06, "loss": 1.3014, "step": 2119 }, { "epoch": 0.05, "learning_rate": 9.990379699626652e-06, "loss": 1.2458, "step": 2120 }, { "epoch": 0.05, "learning_rate": 9.990356399316102e-06, "loss": 1.238, "step": 2121 }, { "epoch": 0.05, "learning_rate": 9.990333070850301e-06, "loss": 1.0954, "step": 2122 }, { "epoch": 0.05, "learning_rate": 9.99030971422938e-06, "loss": 0.9196, "step": 2123 }, { "epoch": 0.05, "learning_rate": 9.990286329453472e-06, "loss": 1.1249, "step": 2124 }, { "epoch": 0.05, "learning_rate": 9.990262916522706e-06, "loss": 1.2564, "step": 2125 }, { "epoch": 0.05, "learning_rate": 9.990239475437218e-06, "loss": 1.3184, "step": 2126 }, { "epoch": 0.05, "learning_rate": 9.990216006197137e-06, "loss": 1.186, "step": 2127 }, { "epoch": 0.05, "learning_rate": 9.990192508802596e-06, "loss": 1.1165, "step": 2128 }, { "epoch": 0.05, "learning_rate": 9.990168983253732e-06, "loss": 1.439, "step": 2129 }, { "epoch": 0.05, "learning_rate": 9.990145429550671e-06, "loss": 1.069, "step": 2130 }, { "epoch": 0.05, "learning_rate": 9.990121847693548e-06, "loss": 1.1704, "step": 2131 }, { "epoch": 0.05, "learning_rate": 9.990098237682499e-06, "loss": 1.0587, "step": 2132 }, { "epoch": 0.05, "learning_rate": 9.990074599517653e-06, "loss": 1.1624, "step": 2133 }, { "epoch": 0.05, "learning_rate": 9.990050933199149e-06, "loss": 1.0966, "step": 2134 }, { "epoch": 0.05, "learning_rate": 9.990027238727115e-06, "loss": 1.0902, "step": 2135 }, { "epoch": 0.05, "learning_rate": 9.990003516101687e-06, "loss": 1.2735, "step": 2136 }, { "epoch": 0.05, "learning_rate": 9.989979765322998e-06, "loss": 1.4112, "step": 2137 }, { "epoch": 0.05, "learning_rate": 9.989955986391183e-06, "loss": 1.1263, "step": 2138 }, { "epoch": 0.05, "learning_rate": 9.989932179306377e-06, "loss": 0.9585, "step": 2139 }, { "epoch": 0.05, "learning_rate": 9.989908344068711e-06, "loss": 1.0561, "step": 2140 }, { "epoch": 0.05, "learning_rate": 9.989884480678323e-06, "loss": 1.1685, "step": 2141 }, { "epoch": 0.05, "learning_rate": 9.989860589135345e-06, "loss": 0.9246, "step": 2142 }, { "epoch": 0.05, "learning_rate": 9.989836669439914e-06, "loss": 1.2927, "step": 2143 }, { "epoch": 0.05, "learning_rate": 9.989812721592162e-06, "loss": 1.1858, "step": 2144 }, { "epoch": 0.05, "learning_rate": 9.989788745592228e-06, "loss": 0.738, "step": 2145 }, { "epoch": 0.05, "learning_rate": 9.989764741440245e-06, "loss": 0.9414, "step": 2146 }, { "epoch": 0.05, "learning_rate": 9.989740709136349e-06, "loss": 1.3666, "step": 2147 }, { "epoch": 0.05, "learning_rate": 9.989716648680674e-06, "loss": 1.1209, "step": 2148 }, { "epoch": 0.05, "learning_rate": 9.989692560073359e-06, "loss": 1.0699, "step": 2149 }, { "epoch": 0.05, "learning_rate": 9.989668443314537e-06, "loss": 1.117, "step": 2150 }, { "epoch": 0.05, "learning_rate": 9.989644298404344e-06, "loss": 1.1267, "step": 2151 }, { "epoch": 0.05, "learning_rate": 9.989620125342919e-06, "loss": 1.1558, "step": 2152 }, { "epoch": 0.05, "learning_rate": 9.989595924130396e-06, "loss": 1.0646, "step": 2153 }, { "epoch": 0.05, "learning_rate": 9.98957169476691e-06, "loss": 1.1583, "step": 2154 }, { "epoch": 0.05, "learning_rate": 9.989547437252602e-06, "loss": 1.4519, "step": 2155 }, { "epoch": 0.05, "learning_rate": 9.989523151587608e-06, "loss": 1.1126, "step": 2156 }, { "epoch": 0.05, "learning_rate": 9.989498837772063e-06, "loss": 1.3033, "step": 2157 }, { "epoch": 0.05, "learning_rate": 9.989474495806104e-06, "loss": 1.1168, "step": 2158 }, { "epoch": 0.05, "learning_rate": 9.98945012568987e-06, "loss": 1.0378, "step": 2159 }, { "epoch": 0.05, "learning_rate": 9.989425727423496e-06, "loss": 0.8394, "step": 2160 }, { "epoch": 0.05, "learning_rate": 9.989401301007124e-06, "loss": 1.0173, "step": 2161 }, { "epoch": 0.05, "learning_rate": 9.989376846440889e-06, "loss": 1.3838, "step": 2162 }, { "epoch": 0.05, "learning_rate": 9.989352363724926e-06, "loss": 1.3411, "step": 2163 }, { "epoch": 0.05, "learning_rate": 9.98932785285938e-06, "loss": 1.3437, "step": 2164 }, { "epoch": 0.05, "learning_rate": 9.989303313844383e-06, "loss": 0.9162, "step": 2165 }, { "epoch": 0.05, "learning_rate": 9.989278746680078e-06, "loss": 1.281, "step": 2166 }, { "epoch": 0.05, "learning_rate": 9.9892541513666e-06, "loss": 1.135, "step": 2167 }, { "epoch": 0.05, "learning_rate": 9.989229527904093e-06, "loss": 0.9913, "step": 2168 }, { "epoch": 0.05, "learning_rate": 9.98920487629269e-06, "loss": 1.154, "step": 2169 }, { "epoch": 0.05, "learning_rate": 9.989180196532531e-06, "loss": 1.2621, "step": 2170 }, { "epoch": 0.05, "learning_rate": 9.989155488623759e-06, "loss": 1.0669, "step": 2171 }, { "epoch": 0.05, "learning_rate": 9.98913075256651e-06, "loss": 1.2744, "step": 2172 }, { "epoch": 0.05, "learning_rate": 9.989105988360924e-06, "loss": 0.9135, "step": 2173 }, { "epoch": 0.05, "learning_rate": 9.989081196007143e-06, "loss": 1.1341, "step": 2174 }, { "epoch": 0.05, "learning_rate": 9.989056375505303e-06, "loss": 0.8783, "step": 2175 }, { "epoch": 0.05, "learning_rate": 9.989031526855549e-06, "loss": 0.9665, "step": 2176 }, { "epoch": 0.05, "learning_rate": 9.989006650058016e-06, "loss": 1.2025, "step": 2177 }, { "epoch": 0.05, "learning_rate": 9.988981745112849e-06, "loss": 0.9414, "step": 2178 }, { "epoch": 0.05, "learning_rate": 9.988956812020185e-06, "loss": 1.0292, "step": 2179 }, { "epoch": 0.05, "learning_rate": 9.988931850780165e-06, "loss": 1.214, "step": 2180 }, { "epoch": 0.05, "learning_rate": 9.988906861392932e-06, "loss": 0.9958, "step": 2181 }, { "epoch": 0.05, "learning_rate": 9.988881843858628e-06, "loss": 1.0734, "step": 2182 }, { "epoch": 0.05, "learning_rate": 9.98885679817739e-06, "loss": 1.2502, "step": 2183 }, { "epoch": 0.05, "learning_rate": 9.98883172434936e-06, "loss": 1.3073, "step": 2184 }, { "epoch": 0.05, "learning_rate": 9.988806622374683e-06, "loss": 1.2212, "step": 2185 }, { "epoch": 0.05, "learning_rate": 9.988781492253497e-06, "loss": 0.9822, "step": 2186 }, { "epoch": 0.05, "learning_rate": 9.988756333985946e-06, "loss": 0.8694, "step": 2187 }, { "epoch": 0.05, "learning_rate": 9.98873114757217e-06, "loss": 1.3646, "step": 2188 }, { "epoch": 0.05, "learning_rate": 9.988705933012314e-06, "loss": 1.2899, "step": 2189 }, { "epoch": 0.05, "learning_rate": 9.988680690306517e-06, "loss": 1.019, "step": 2190 }, { "epoch": 0.05, "learning_rate": 9.988655419454922e-06, "loss": 0.9521, "step": 2191 }, { "epoch": 0.05, "learning_rate": 9.988630120457673e-06, "loss": 1.0041, "step": 2192 }, { "epoch": 0.05, "learning_rate": 9.988604793314914e-06, "loss": 1.0015, "step": 2193 }, { "epoch": 0.05, "learning_rate": 9.988579438026787e-06, "loss": 1.2266, "step": 2194 }, { "epoch": 0.05, "learning_rate": 9.98855405459343e-06, "loss": 0.818, "step": 2195 }, { "epoch": 0.05, "learning_rate": 9.988528643014993e-06, "loss": 0.9354, "step": 2196 }, { "epoch": 0.05, "learning_rate": 9.988503203291617e-06, "loss": 1.0926, "step": 2197 }, { "epoch": 0.05, "learning_rate": 9.988477735423442e-06, "loss": 1.1617, "step": 2198 }, { "epoch": 0.05, "learning_rate": 9.98845223941062e-06, "loss": 1.0702, "step": 2199 }, { "epoch": 0.05, "learning_rate": 9.988426715253286e-06, "loss": 1.1743, "step": 2200 }, { "epoch": 0.05, "learning_rate": 9.988401162951589e-06, "loss": 1.2286, "step": 2201 }, { "epoch": 0.05, "learning_rate": 9.988375582505672e-06, "loss": 1.2883, "step": 2202 }, { "epoch": 0.05, "learning_rate": 9.988349973915679e-06, "loss": 1.2083, "step": 2203 }, { "epoch": 0.05, "learning_rate": 9.988324337181756e-06, "loss": 1.1226, "step": 2204 }, { "epoch": 0.05, "learning_rate": 9.988298672304045e-06, "loss": 1.5318, "step": 2205 }, { "epoch": 0.05, "learning_rate": 9.988272979282692e-06, "loss": 1.0463, "step": 2206 }, { "epoch": 0.05, "learning_rate": 9.988247258117843e-06, "loss": 0.8812, "step": 2207 }, { "epoch": 0.05, "learning_rate": 9.988221508809642e-06, "loss": 1.2252, "step": 2208 }, { "epoch": 0.05, "learning_rate": 9.988195731358233e-06, "loss": 1.0078, "step": 2209 }, { "epoch": 0.05, "learning_rate": 9.988169925763764e-06, "loss": 0.9337, "step": 2210 }, { "epoch": 0.05, "learning_rate": 9.988144092026381e-06, "loss": 0.9269, "step": 2211 }, { "epoch": 0.05, "learning_rate": 9.988118230146227e-06, "loss": 0.9093, "step": 2212 }, { "epoch": 0.05, "learning_rate": 9.988092340123449e-06, "loss": 1.0001, "step": 2213 }, { "epoch": 0.05, "learning_rate": 9.988066421958194e-06, "loss": 1.0032, "step": 2214 }, { "epoch": 0.05, "learning_rate": 9.988040475650609e-06, "loss": 1.1717, "step": 2215 }, { "epoch": 0.05, "learning_rate": 9.988014501200836e-06, "loss": 1.2825, "step": 2216 }, { "epoch": 0.05, "learning_rate": 9.987988498609026e-06, "loss": 1.2846, "step": 2217 }, { "epoch": 0.05, "learning_rate": 9.987962467875326e-06, "loss": 1.02, "step": 2218 }, { "epoch": 0.05, "learning_rate": 9.987936408999877e-06, "loss": 1.0649, "step": 2219 }, { "epoch": 0.05, "learning_rate": 9.987910321982833e-06, "loss": 1.1716, "step": 2220 }, { "epoch": 0.05, "learning_rate": 9.987884206824337e-06, "loss": 1.069, "step": 2221 }, { "epoch": 0.05, "learning_rate": 9.987858063524538e-06, "loss": 1.1989, "step": 2222 }, { "epoch": 0.05, "learning_rate": 9.987831892083583e-06, "loss": 1.1075, "step": 2223 }, { "epoch": 0.05, "learning_rate": 9.98780569250162e-06, "loss": 1.4452, "step": 2224 }, { "epoch": 0.05, "learning_rate": 9.987779464778795e-06, "loss": 1.2067, "step": 2225 }, { "epoch": 0.05, "learning_rate": 9.98775320891526e-06, "loss": 1.2002, "step": 2226 }, { "epoch": 0.05, "learning_rate": 9.98772692491116e-06, "loss": 1.0792, "step": 2227 }, { "epoch": 0.05, "learning_rate": 9.987700612766642e-06, "loss": 0.9657, "step": 2228 }, { "epoch": 0.05, "learning_rate": 9.987674272481858e-06, "loss": 1.131, "step": 2229 }, { "epoch": 0.05, "learning_rate": 9.987647904056955e-06, "loss": 1.1859, "step": 2230 }, { "epoch": 0.05, "learning_rate": 9.987621507492082e-06, "loss": 1.0028, "step": 2231 }, { "epoch": 0.05, "learning_rate": 9.987595082787386e-06, "loss": 0.8901, "step": 2232 }, { "epoch": 0.05, "learning_rate": 9.98756862994302e-06, "loss": 1.2033, "step": 2233 }, { "epoch": 0.05, "learning_rate": 9.987542148959131e-06, "loss": 1.0831, "step": 2234 }, { "epoch": 0.05, "learning_rate": 9.987515639835868e-06, "loss": 1.1178, "step": 2235 }, { "epoch": 0.05, "learning_rate": 9.98748910257338e-06, "loss": 1.0828, "step": 2236 }, { "epoch": 0.05, "learning_rate": 9.987462537171819e-06, "loss": 0.8755, "step": 2237 }, { "epoch": 0.05, "learning_rate": 9.987435943631332e-06, "loss": 1.0443, "step": 2238 }, { "epoch": 0.05, "learning_rate": 9.987409321952072e-06, "loss": 1.0456, "step": 2239 }, { "epoch": 0.05, "learning_rate": 9.987382672134187e-06, "loss": 1.0416, "step": 2240 }, { "epoch": 0.05, "learning_rate": 9.98735599417783e-06, "loss": 1.2289, "step": 2241 }, { "epoch": 0.05, "learning_rate": 9.987329288083147e-06, "loss": 1.3939, "step": 2242 }, { "epoch": 0.05, "learning_rate": 9.987302553850293e-06, "loss": 1.0642, "step": 2243 }, { "epoch": 0.05, "learning_rate": 9.987275791479417e-06, "loss": 1.1195, "step": 2244 }, { "epoch": 0.05, "learning_rate": 9.987249000970672e-06, "loss": 1.1071, "step": 2245 }, { "epoch": 0.05, "learning_rate": 9.987222182324204e-06, "loss": 1.2755, "step": 2246 }, { "epoch": 0.05, "learning_rate": 9.98719533554017e-06, "loss": 1.1686, "step": 2247 }, { "epoch": 0.05, "learning_rate": 9.987168460618718e-06, "loss": 1.2379, "step": 2248 }, { "epoch": 0.05, "learning_rate": 9.98714155756e-06, "loss": 1.1024, "step": 2249 }, { "epoch": 0.05, "learning_rate": 9.987114626364172e-06, "loss": 1.1361, "step": 2250 }, { "epoch": 0.05, "learning_rate": 9.987087667031379e-06, "loss": 1.0036, "step": 2251 }, { "epoch": 0.05, "learning_rate": 9.987060679561777e-06, "loss": 1.4775, "step": 2252 }, { "epoch": 0.05, "learning_rate": 9.98703366395552e-06, "loss": 1.0545, "step": 2253 }, { "epoch": 0.05, "learning_rate": 9.987006620212756e-06, "loss": 1.2083, "step": 2254 }, { "epoch": 0.05, "learning_rate": 9.986979548333641e-06, "loss": 1.0806, "step": 2255 }, { "epoch": 0.05, "learning_rate": 9.986952448318328e-06, "loss": 0.9677, "step": 2256 }, { "epoch": 0.05, "learning_rate": 9.986925320166968e-06, "loss": 1.291, "step": 2257 }, { "epoch": 0.05, "learning_rate": 9.986898163879712e-06, "loss": 1.2301, "step": 2258 }, { "epoch": 0.05, "learning_rate": 9.986870979456718e-06, "loss": 1.0597, "step": 2259 }, { "epoch": 0.05, "learning_rate": 9.986843766898135e-06, "loss": 0.917, "step": 2260 }, { "epoch": 0.05, "learning_rate": 9.986816526204122e-06, "loss": 1.0553, "step": 2261 }, { "epoch": 0.05, "learning_rate": 9.986789257374827e-06, "loss": 1.2151, "step": 2262 }, { "epoch": 0.05, "learning_rate": 9.986761960410407e-06, "loss": 1.1897, "step": 2263 }, { "epoch": 0.05, "learning_rate": 9.986734635311014e-06, "loss": 1.0441, "step": 2264 }, { "epoch": 0.05, "learning_rate": 9.986707282076804e-06, "loss": 1.0477, "step": 2265 }, { "epoch": 0.05, "learning_rate": 9.986679900707932e-06, "loss": 1.3181, "step": 2266 }, { "epoch": 0.05, "learning_rate": 9.986652491204551e-06, "loss": 0.8965, "step": 2267 }, { "epoch": 0.05, "learning_rate": 9.986625053566814e-06, "loss": 1.3058, "step": 2268 }, { "epoch": 0.05, "learning_rate": 9.98659758779488e-06, "loss": 1.4388, "step": 2269 }, { "epoch": 0.05, "learning_rate": 9.9865700938889e-06, "loss": 1.1121, "step": 2270 }, { "epoch": 0.05, "learning_rate": 9.98654257184903e-06, "loss": 1.1005, "step": 2271 }, { "epoch": 0.05, "learning_rate": 9.986515021675427e-06, "loss": 1.091, "step": 2272 }, { "epoch": 0.05, "learning_rate": 9.986487443368245e-06, "loss": 1.177, "step": 2273 }, { "epoch": 0.05, "learning_rate": 9.986459836927642e-06, "loss": 1.2011, "step": 2274 }, { "epoch": 0.05, "learning_rate": 9.98643220235377e-06, "loss": 1.0338, "step": 2275 }, { "epoch": 0.05, "learning_rate": 9.986404539646787e-06, "loss": 1.0997, "step": 2276 }, { "epoch": 0.05, "learning_rate": 9.986376848806849e-06, "loss": 1.0236, "step": 2277 }, { "epoch": 0.05, "learning_rate": 9.986349129834112e-06, "loss": 0.9718, "step": 2278 }, { "epoch": 0.05, "learning_rate": 9.986321382728732e-06, "loss": 1.0226, "step": 2279 }, { "epoch": 0.05, "learning_rate": 9.986293607490865e-06, "loss": 1.1595, "step": 2280 }, { "epoch": 0.05, "learning_rate": 9.98626580412067e-06, "loss": 1.2961, "step": 2281 }, { "epoch": 0.05, "learning_rate": 9.986237972618303e-06, "loss": 1.2581, "step": 2282 }, { "epoch": 0.05, "learning_rate": 9.986210112983919e-06, "loss": 1.4602, "step": 2283 }, { "epoch": 0.05, "learning_rate": 9.986182225217677e-06, "loss": 1.0229, "step": 2284 }, { "epoch": 0.05, "learning_rate": 9.986154309319736e-06, "loss": 1.0998, "step": 2285 }, { "epoch": 0.05, "learning_rate": 9.98612636529025e-06, "loss": 1.1305, "step": 2286 }, { "epoch": 0.05, "learning_rate": 9.986098393129377e-06, "loss": 1.2375, "step": 2287 }, { "epoch": 0.05, "learning_rate": 9.986070392837278e-06, "loss": 1.1374, "step": 2288 }, { "epoch": 0.05, "learning_rate": 9.986042364414108e-06, "loss": 1.1584, "step": 2289 }, { "epoch": 0.05, "learning_rate": 9.986014307860026e-06, "loss": 0.8862, "step": 2290 }, { "epoch": 0.05, "learning_rate": 9.98598622317519e-06, "loss": 1.2594, "step": 2291 }, { "epoch": 0.05, "learning_rate": 9.98595811035976e-06, "loss": 1.2049, "step": 2292 }, { "epoch": 0.05, "learning_rate": 9.985929969413893e-06, "loss": 1.2638, "step": 2293 }, { "epoch": 0.05, "learning_rate": 9.98590180033775e-06, "loss": 1.2705, "step": 2294 }, { "epoch": 0.05, "learning_rate": 9.985873603131485e-06, "loss": 0.9941, "step": 2295 }, { "epoch": 0.05, "learning_rate": 9.985845377795263e-06, "loss": 1.0282, "step": 2296 }, { "epoch": 0.05, "learning_rate": 9.985817124329238e-06, "loss": 1.2861, "step": 2297 }, { "epoch": 0.05, "learning_rate": 9.985788842733573e-06, "loss": 1.0244, "step": 2298 }, { "epoch": 0.05, "learning_rate": 9.985760533008429e-06, "loss": 1.1807, "step": 2299 }, { "epoch": 0.05, "learning_rate": 9.98573219515396e-06, "loss": 1.0446, "step": 2300 }, { "epoch": 0.05, "learning_rate": 9.98570382917033e-06, "loss": 1.115, "step": 2301 }, { "epoch": 0.05, "learning_rate": 9.985675435057697e-06, "loss": 1.4262, "step": 2302 }, { "epoch": 0.05, "learning_rate": 9.985647012816223e-06, "loss": 1.1526, "step": 2303 }, { "epoch": 0.05, "learning_rate": 9.98561856244607e-06, "loss": 1.2397, "step": 2304 }, { "epoch": 0.05, "learning_rate": 9.985590083947395e-06, "loss": 1.0023, "step": 2305 }, { "epoch": 0.05, "learning_rate": 9.985561577320358e-06, "loss": 1.0868, "step": 2306 }, { "epoch": 0.05, "learning_rate": 9.985533042565123e-06, "loss": 1.16, "step": 2307 }, { "epoch": 0.05, "learning_rate": 9.98550447968185e-06, "loss": 1.1772, "step": 2308 }, { "epoch": 0.05, "learning_rate": 9.9854758886707e-06, "loss": 1.0108, "step": 2309 }, { "epoch": 0.05, "learning_rate": 9.985447269531835e-06, "loss": 1.0498, "step": 2310 }, { "epoch": 0.05, "learning_rate": 9.985418622265413e-06, "loss": 0.8253, "step": 2311 }, { "epoch": 0.05, "learning_rate": 9.985389946871598e-06, "loss": 1.0529, "step": 2312 }, { "epoch": 0.05, "learning_rate": 9.985361243350554e-06, "loss": 1.6077, "step": 2313 }, { "epoch": 0.05, "learning_rate": 9.98533251170244e-06, "loss": 1.1605, "step": 2314 }, { "epoch": 0.05, "learning_rate": 9.98530375192742e-06, "loss": 1.33, "step": 2315 }, { "epoch": 0.05, "learning_rate": 9.985274964025656e-06, "loss": 1.0651, "step": 2316 }, { "epoch": 0.05, "learning_rate": 9.985246147997308e-06, "loss": 1.0416, "step": 2317 }, { "epoch": 0.05, "learning_rate": 9.98521730384254e-06, "loss": 1.2812, "step": 2318 }, { "epoch": 0.05, "learning_rate": 9.985188431561517e-06, "loss": 1.045, "step": 2319 }, { "epoch": 0.05, "learning_rate": 9.985159531154398e-06, "loss": 1.1599, "step": 2320 }, { "epoch": 0.05, "learning_rate": 9.98513060262135e-06, "loss": 1.5345, "step": 2321 }, { "epoch": 0.05, "learning_rate": 9.985101645962535e-06, "loss": 1.2292, "step": 2322 }, { "epoch": 0.05, "learning_rate": 9.985072661178112e-06, "loss": 1.275, "step": 2323 }, { "epoch": 0.05, "learning_rate": 9.98504364826825e-06, "loss": 1.0327, "step": 2324 }, { "epoch": 0.05, "learning_rate": 9.98501460723311e-06, "loss": 0.8698, "step": 2325 }, { "epoch": 0.05, "learning_rate": 9.984985538072857e-06, "loss": 1.145, "step": 2326 }, { "epoch": 0.05, "learning_rate": 9.984956440787656e-06, "loss": 0.9847, "step": 2327 }, { "epoch": 0.05, "learning_rate": 9.98492731537767e-06, "loss": 1.1448, "step": 2328 }, { "epoch": 0.05, "learning_rate": 9.984898161843062e-06, "loss": 1.3686, "step": 2329 }, { "epoch": 0.05, "learning_rate": 9.984868980183996e-06, "loss": 0.8199, "step": 2330 }, { "epoch": 0.05, "learning_rate": 9.984839770400641e-06, "loss": 1.1165, "step": 2331 }, { "epoch": 0.05, "learning_rate": 9.984810532493158e-06, "loss": 0.8773, "step": 2332 }, { "epoch": 0.05, "learning_rate": 9.984781266461714e-06, "loss": 1.171, "step": 2333 }, { "epoch": 0.05, "learning_rate": 9.984751972306473e-06, "loss": 1.1222, "step": 2334 }, { "epoch": 0.05, "learning_rate": 9.984722650027598e-06, "loss": 0.8129, "step": 2335 }, { "epoch": 0.05, "learning_rate": 9.98469329962526e-06, "loss": 0.9442, "step": 2336 }, { "epoch": 0.05, "learning_rate": 9.98466392109962e-06, "loss": 1.2394, "step": 2337 }, { "epoch": 0.05, "learning_rate": 9.984634514450847e-06, "loss": 0.9242, "step": 2338 }, { "epoch": 0.05, "learning_rate": 9.984605079679101e-06, "loss": 1.0999, "step": 2339 }, { "epoch": 0.05, "learning_rate": 9.984575616784555e-06, "loss": 1.2313, "step": 2340 }, { "epoch": 0.05, "learning_rate": 9.984546125767372e-06, "loss": 0.953, "step": 2341 }, { "epoch": 0.05, "learning_rate": 9.984516606627719e-06, "loss": 0.7515, "step": 2342 }, { "epoch": 0.05, "learning_rate": 9.984487059365763e-06, "loss": 1.1735, "step": 2343 }, { "epoch": 0.05, "learning_rate": 9.98445748398167e-06, "loss": 1.1985, "step": 2344 }, { "epoch": 0.05, "learning_rate": 9.984427880475605e-06, "loss": 1.1607, "step": 2345 }, { "epoch": 0.05, "learning_rate": 9.98439824884774e-06, "loss": 0.9735, "step": 2346 }, { "epoch": 0.05, "learning_rate": 9.984368589098236e-06, "loss": 1.0603, "step": 2347 }, { "epoch": 0.05, "learning_rate": 9.984338901227265e-06, "loss": 0.9975, "step": 2348 }, { "epoch": 0.05, "learning_rate": 9.984309185234992e-06, "loss": 1.3774, "step": 2349 }, { "epoch": 0.05, "learning_rate": 9.984279441121587e-06, "loss": 1.1408, "step": 2350 }, { "epoch": 0.05, "learning_rate": 9.984249668887216e-06, "loss": 0.9636, "step": 2351 }, { "epoch": 0.05, "learning_rate": 9.984219868532047e-06, "loss": 0.8673, "step": 2352 }, { "epoch": 0.05, "learning_rate": 9.984190040056247e-06, "loss": 0.8809, "step": 2353 }, { "epoch": 0.05, "learning_rate": 9.984160183459988e-06, "loss": 0.8419, "step": 2354 }, { "epoch": 0.05, "learning_rate": 9.984130298743437e-06, "loss": 1.1866, "step": 2355 }, { "epoch": 0.05, "learning_rate": 9.98410038590676e-06, "loss": 0.9695, "step": 2356 }, { "epoch": 0.05, "learning_rate": 9.984070444950128e-06, "loss": 1.0325, "step": 2357 }, { "epoch": 0.05, "learning_rate": 9.98404047587371e-06, "loss": 1.0889, "step": 2358 }, { "epoch": 0.05, "learning_rate": 9.984010478677675e-06, "loss": 1.3555, "step": 2359 }, { "epoch": 0.05, "learning_rate": 9.983980453362191e-06, "loss": 1.3076, "step": 2360 }, { "epoch": 0.05, "learning_rate": 9.983950399927429e-06, "loss": 0.9057, "step": 2361 }, { "epoch": 0.05, "learning_rate": 9.983920318373556e-06, "loss": 1.0779, "step": 2362 }, { "epoch": 0.05, "learning_rate": 9.983890208700746e-06, "loss": 1.2174, "step": 2363 }, { "epoch": 0.05, "learning_rate": 9.983860070909167e-06, "loss": 1.4052, "step": 2364 }, { "epoch": 0.05, "learning_rate": 9.983829904998985e-06, "loss": 1.3082, "step": 2365 }, { "epoch": 0.05, "learning_rate": 9.983799710970377e-06, "loss": 1.1248, "step": 2366 }, { "epoch": 0.05, "learning_rate": 9.983769488823508e-06, "loss": 0.9204, "step": 2367 }, { "epoch": 0.05, "learning_rate": 9.983739238558551e-06, "loss": 1.1409, "step": 2368 }, { "epoch": 0.05, "learning_rate": 9.983708960175677e-06, "loss": 1.1843, "step": 2369 }, { "epoch": 0.05, "learning_rate": 9.983678653675055e-06, "loss": 0.9184, "step": 2370 }, { "epoch": 0.05, "learning_rate": 9.983648319056857e-06, "loss": 1.2719, "step": 2371 }, { "epoch": 0.06, "learning_rate": 9.983617956321257e-06, "loss": 0.9942, "step": 2372 }, { "epoch": 0.06, "learning_rate": 9.98358756546842e-06, "loss": 1.0063, "step": 2373 }, { "epoch": 0.06, "learning_rate": 9.983557146498522e-06, "loss": 1.4426, "step": 2374 }, { "epoch": 0.06, "learning_rate": 9.983526699411735e-06, "loss": 1.036, "step": 2375 }, { "epoch": 0.06, "learning_rate": 9.983496224208226e-06, "loss": 1.2325, "step": 2376 }, { "epoch": 0.06, "learning_rate": 9.983465720888174e-06, "loss": 1.2367, "step": 2377 }, { "epoch": 0.06, "learning_rate": 9.983435189451745e-06, "loss": 1.1442, "step": 2378 }, { "epoch": 0.06, "learning_rate": 9.983404629899113e-06, "loss": 1.0926, "step": 2379 }, { "epoch": 0.06, "learning_rate": 9.983374042230454e-06, "loss": 1.2003, "step": 2380 }, { "epoch": 0.06, "learning_rate": 9.983343426445934e-06, "loss": 1.2898, "step": 2381 }, { "epoch": 0.06, "learning_rate": 9.983312782545733e-06, "loss": 0.9453, "step": 2382 }, { "epoch": 0.06, "learning_rate": 9.98328211053002e-06, "loss": 0.8981, "step": 2383 }, { "epoch": 0.06, "learning_rate": 9.983251410398966e-06, "loss": 1.1897, "step": 2384 }, { "epoch": 0.06, "learning_rate": 9.983220682152747e-06, "loss": 1.1089, "step": 2385 }, { "epoch": 0.06, "learning_rate": 9.983189925791537e-06, "loss": 1.1253, "step": 2386 }, { "epoch": 0.06, "learning_rate": 9.983159141315507e-06, "loss": 0.9213, "step": 2387 }, { "epoch": 0.06, "learning_rate": 9.983128328724833e-06, "loss": 1.1722, "step": 2388 }, { "epoch": 0.06, "learning_rate": 9.983097488019687e-06, "loss": 1.1483, "step": 2389 }, { "epoch": 0.06, "learning_rate": 9.983066619200246e-06, "loss": 1.0174, "step": 2390 }, { "epoch": 0.06, "learning_rate": 9.983035722266681e-06, "loss": 1.057, "step": 2391 }, { "epoch": 0.06, "learning_rate": 9.983004797219167e-06, "loss": 1.3196, "step": 2392 }, { "epoch": 0.06, "learning_rate": 9.982973844057876e-06, "loss": 0.8766, "step": 2393 }, { "epoch": 0.06, "learning_rate": 9.98294286278299e-06, "loss": 0.9491, "step": 2394 }, { "epoch": 0.06, "learning_rate": 9.982911853394679e-06, "loss": 1.0283, "step": 2395 }, { "epoch": 0.06, "learning_rate": 9.982880815893117e-06, "loss": 0.9938, "step": 2396 }, { "epoch": 0.06, "learning_rate": 9.98284975027848e-06, "loss": 1.3123, "step": 2397 }, { "epoch": 0.06, "learning_rate": 9.982818656550943e-06, "loss": 1.1633, "step": 2398 }, { "epoch": 0.06, "learning_rate": 9.982787534710685e-06, "loss": 0.911, "step": 2399 }, { "epoch": 0.06, "learning_rate": 9.982756384757876e-06, "loss": 1.2579, "step": 2400 }, { "epoch": 0.06, "learning_rate": 9.982725206692695e-06, "loss": 1.2414, "step": 2401 }, { "epoch": 0.06, "learning_rate": 9.982694000515318e-06, "loss": 1.0447, "step": 2402 }, { "epoch": 0.06, "learning_rate": 9.982662766225919e-06, "loss": 1.2388, "step": 2403 }, { "epoch": 0.06, "learning_rate": 9.982631503824677e-06, "loss": 0.8602, "step": 2404 }, { "epoch": 0.06, "learning_rate": 9.982600213311766e-06, "loss": 1.2129, "step": 2405 }, { "epoch": 0.06, "learning_rate": 9.982568894687364e-06, "loss": 1.2247, "step": 2406 }, { "epoch": 0.06, "learning_rate": 9.982537547951647e-06, "loss": 0.8765, "step": 2407 }, { "epoch": 0.06, "learning_rate": 9.982506173104794e-06, "loss": 1.1826, "step": 2408 }, { "epoch": 0.06, "learning_rate": 9.982474770146977e-06, "loss": 1.1856, "step": 2409 }, { "epoch": 0.06, "learning_rate": 9.982443339078379e-06, "loss": 1.4174, "step": 2410 }, { "epoch": 0.06, "learning_rate": 9.982411879899172e-06, "loss": 1.2374, "step": 2411 }, { "epoch": 0.06, "learning_rate": 9.982380392609537e-06, "loss": 1.225, "step": 2412 }, { "epoch": 0.06, "learning_rate": 9.98234887720965e-06, "loss": 0.9399, "step": 2413 }, { "epoch": 0.06, "learning_rate": 9.982317333699691e-06, "loss": 1.0874, "step": 2414 }, { "epoch": 0.06, "learning_rate": 9.982285762079837e-06, "loss": 1.211, "step": 2415 }, { "epoch": 0.06, "learning_rate": 9.982254162350265e-06, "loss": 1.1417, "step": 2416 }, { "epoch": 0.06, "learning_rate": 9.982222534511154e-06, "loss": 1.046, "step": 2417 }, { "epoch": 0.06, "learning_rate": 9.982190878562682e-06, "loss": 1.0932, "step": 2418 }, { "epoch": 0.06, "learning_rate": 9.982159194505028e-06, "loss": 1.2213, "step": 2419 }, { "epoch": 0.06, "learning_rate": 9.98212748233837e-06, "loss": 1.0062, "step": 2420 }, { "epoch": 0.06, "learning_rate": 9.982095742062887e-06, "loss": 1.013, "step": 2421 }, { "epoch": 0.06, "learning_rate": 9.98206397367876e-06, "loss": 1.2222, "step": 2422 }, { "epoch": 0.06, "learning_rate": 9.982032177186166e-06, "loss": 0.9153, "step": 2423 }, { "epoch": 0.06, "learning_rate": 9.982000352585288e-06, "loss": 1.1592, "step": 2424 }, { "epoch": 0.06, "learning_rate": 9.981968499876302e-06, "loss": 1.1635, "step": 2425 }, { "epoch": 0.06, "learning_rate": 9.981936619059386e-06, "loss": 1.052, "step": 2426 }, { "epoch": 0.06, "learning_rate": 9.981904710134724e-06, "loss": 1.4237, "step": 2427 }, { "epoch": 0.06, "learning_rate": 9.981872773102496e-06, "loss": 1.1575, "step": 2428 }, { "epoch": 0.06, "learning_rate": 9.98184080796288e-06, "loss": 1.2441, "step": 2429 }, { "epoch": 0.06, "learning_rate": 9.981808814716055e-06, "loss": 1.0599, "step": 2430 }, { "epoch": 0.06, "learning_rate": 9.981776793362206e-06, "loss": 1.0447, "step": 2431 }, { "epoch": 0.06, "learning_rate": 9.981744743901509e-06, "loss": 0.9695, "step": 2432 }, { "epoch": 0.06, "learning_rate": 9.981712666334147e-06, "loss": 1.1146, "step": 2433 }, { "epoch": 0.06, "learning_rate": 9.981680560660303e-06, "loss": 1.0788, "step": 2434 }, { "epoch": 0.06, "learning_rate": 9.981648426880156e-06, "loss": 1.1188, "step": 2435 }, { "epoch": 0.06, "learning_rate": 9.981616264993885e-06, "loss": 1.0908, "step": 2436 }, { "epoch": 0.06, "learning_rate": 9.981584075001676e-06, "loss": 1.2538, "step": 2437 }, { "epoch": 0.06, "learning_rate": 9.981551856903709e-06, "loss": 1.0485, "step": 2438 }, { "epoch": 0.06, "learning_rate": 9.981519610700163e-06, "loss": 1.0094, "step": 2439 }, { "epoch": 0.06, "learning_rate": 9.981487336391224e-06, "loss": 0.953, "step": 2440 }, { "epoch": 0.06, "learning_rate": 9.981455033977073e-06, "loss": 0.9958, "step": 2441 }, { "epoch": 0.06, "learning_rate": 9.98142270345789e-06, "loss": 1.2796, "step": 2442 }, { "epoch": 0.06, "learning_rate": 9.981390344833859e-06, "loss": 1.1912, "step": 2443 }, { "epoch": 0.06, "learning_rate": 9.981357958105162e-06, "loss": 1.0768, "step": 2444 }, { "epoch": 0.06, "learning_rate": 9.981325543271983e-06, "loss": 1.2219, "step": 2445 }, { "epoch": 0.06, "learning_rate": 9.981293100334505e-06, "loss": 1.2298, "step": 2446 }, { "epoch": 0.06, "learning_rate": 9.981260629292909e-06, "loss": 1.3473, "step": 2447 }, { "epoch": 0.06, "learning_rate": 9.98122813014738e-06, "loss": 1.4179, "step": 2448 }, { "epoch": 0.06, "learning_rate": 9.981195602898099e-06, "loss": 1.0085, "step": 2449 }, { "epoch": 0.06, "learning_rate": 9.981163047545254e-06, "loss": 1.0379, "step": 2450 }, { "epoch": 0.06, "learning_rate": 9.981130464089024e-06, "loss": 0.9443, "step": 2451 }, { "epoch": 0.06, "learning_rate": 9.981097852529595e-06, "loss": 0.9804, "step": 2452 }, { "epoch": 0.06, "learning_rate": 9.981065212867151e-06, "loss": 1.0661, "step": 2453 }, { "epoch": 0.06, "learning_rate": 9.981032545101876e-06, "loss": 0.8813, "step": 2454 }, { "epoch": 0.06, "learning_rate": 9.980999849233954e-06, "loss": 1.1556, "step": 2455 }, { "epoch": 0.06, "learning_rate": 9.98096712526357e-06, "loss": 1.1164, "step": 2456 }, { "epoch": 0.06, "learning_rate": 9.980934373190908e-06, "loss": 1.1501, "step": 2457 }, { "epoch": 0.06, "learning_rate": 9.980901593016153e-06, "loss": 1.0962, "step": 2458 }, { "epoch": 0.06, "learning_rate": 9.98086878473949e-06, "loss": 0.7874, "step": 2459 }, { "epoch": 0.06, "learning_rate": 9.980835948361103e-06, "loss": 1.0508, "step": 2460 }, { "epoch": 0.06, "learning_rate": 9.98080308388118e-06, "loss": 0.9481, "step": 2461 }, { "epoch": 0.06, "learning_rate": 9.980770191299905e-06, "loss": 0.9292, "step": 2462 }, { "epoch": 0.06, "learning_rate": 9.980737270617462e-06, "loss": 1.1313, "step": 2463 }, { "epoch": 0.06, "learning_rate": 9.980704321834041e-06, "loss": 0.7389, "step": 2464 }, { "epoch": 0.06, "learning_rate": 9.980671344949822e-06, "loss": 0.8956, "step": 2465 }, { "epoch": 0.06, "learning_rate": 9.980638339964994e-06, "loss": 0.9041, "step": 2466 }, { "epoch": 0.06, "learning_rate": 9.980605306879745e-06, "loss": 0.9605, "step": 2467 }, { "epoch": 0.06, "learning_rate": 9.980572245694258e-06, "loss": 0.7356, "step": 2468 }, { "epoch": 0.06, "learning_rate": 9.980539156408722e-06, "loss": 1.0341, "step": 2469 }, { "epoch": 0.06, "learning_rate": 9.980506039023323e-06, "loss": 1.2517, "step": 2470 }, { "epoch": 0.06, "learning_rate": 9.980472893538248e-06, "loss": 1.2268, "step": 2471 }, { "epoch": 0.06, "learning_rate": 9.980439719953684e-06, "loss": 1.1745, "step": 2472 }, { "epoch": 0.06, "learning_rate": 9.980406518269816e-06, "loss": 1.2685, "step": 2473 }, { "epoch": 0.06, "learning_rate": 9.980373288486835e-06, "loss": 1.1124, "step": 2474 }, { "epoch": 0.06, "learning_rate": 9.980340030604924e-06, "loss": 1.2576, "step": 2475 }, { "epoch": 0.06, "learning_rate": 9.980306744624277e-06, "loss": 1.1884, "step": 2476 }, { "epoch": 0.06, "learning_rate": 9.980273430545076e-06, "loss": 0.9859, "step": 2477 }, { "epoch": 0.06, "learning_rate": 9.980240088367513e-06, "loss": 1.124, "step": 2478 }, { "epoch": 0.06, "learning_rate": 9.980206718091772e-06, "loss": 1.1025, "step": 2479 }, { "epoch": 0.06, "learning_rate": 9.980173319718043e-06, "loss": 0.7661, "step": 2480 }, { "epoch": 0.06, "learning_rate": 9.980139893246517e-06, "loss": 1.0839, "step": 2481 }, { "epoch": 0.06, "learning_rate": 9.98010643867738e-06, "loss": 1.5159, "step": 2482 }, { "epoch": 0.06, "learning_rate": 9.98007295601082e-06, "loss": 1.0282, "step": 2483 }, { "epoch": 0.06, "learning_rate": 9.980039445247027e-06, "loss": 1.0842, "step": 2484 }, { "epoch": 0.06, "learning_rate": 9.98000590638619e-06, "loss": 1.0829, "step": 2485 }, { "epoch": 0.06, "learning_rate": 9.9799723394285e-06, "loss": 1.0799, "step": 2486 }, { "epoch": 0.06, "learning_rate": 9.979938744374144e-06, "loss": 0.8933, "step": 2487 }, { "epoch": 0.06, "learning_rate": 9.979905121223313e-06, "loss": 1.073, "step": 2488 }, { "epoch": 0.06, "learning_rate": 9.979871469976197e-06, "loss": 0.8732, "step": 2489 }, { "epoch": 0.06, "learning_rate": 9.979837790632982e-06, "loss": 0.9502, "step": 2490 }, { "epoch": 0.06, "learning_rate": 9.979804083193863e-06, "loss": 1.0758, "step": 2491 }, { "epoch": 0.06, "learning_rate": 9.979770347659029e-06, "loss": 1.047, "step": 2492 }, { "epoch": 0.06, "learning_rate": 9.979736584028667e-06, "loss": 0.9486, "step": 2493 }, { "epoch": 0.06, "learning_rate": 9.97970279230297e-06, "loss": 1.0163, "step": 2494 }, { "epoch": 0.06, "learning_rate": 9.97966897248213e-06, "loss": 1.4455, "step": 2495 }, { "epoch": 0.06, "learning_rate": 9.979635124566336e-06, "loss": 1.1417, "step": 2496 }, { "epoch": 0.06, "learning_rate": 9.979601248555779e-06, "loss": 1.3064, "step": 2497 }, { "epoch": 0.06, "learning_rate": 9.97956734445065e-06, "loss": 1.1803, "step": 2498 }, { "epoch": 0.06, "learning_rate": 9.97953341225114e-06, "loss": 1.255, "step": 2499 }, { "epoch": 0.06, "learning_rate": 9.979499451957443e-06, "loss": 1.0026, "step": 2500 }, { "epoch": 0.06, "learning_rate": 9.979465463569749e-06, "loss": 1.0873, "step": 2501 }, { "epoch": 0.06, "learning_rate": 9.97943144708825e-06, "loss": 1.2869, "step": 2502 }, { "epoch": 0.06, "learning_rate": 9.979397402513136e-06, "loss": 1.0276, "step": 2503 }, { "epoch": 0.06, "learning_rate": 9.9793633298446e-06, "loss": 1.1679, "step": 2504 }, { "epoch": 0.06, "learning_rate": 9.979329229082836e-06, "loss": 0.9919, "step": 2505 }, { "epoch": 0.06, "learning_rate": 9.979295100228034e-06, "loss": 0.9996, "step": 2506 }, { "epoch": 0.06, "learning_rate": 9.979260943280388e-06, "loss": 1.1078, "step": 2507 }, { "epoch": 0.06, "learning_rate": 9.979226758240093e-06, "loss": 1.0279, "step": 2508 }, { "epoch": 0.06, "learning_rate": 9.979192545107337e-06, "loss": 1.1624, "step": 2509 }, { "epoch": 0.06, "learning_rate": 9.979158303882315e-06, "loss": 1.2805, "step": 2510 }, { "epoch": 0.06, "learning_rate": 9.979124034565222e-06, "loss": 1.1838, "step": 2511 }, { "epoch": 0.06, "learning_rate": 9.979089737156249e-06, "loss": 1.0757, "step": 2512 }, { "epoch": 0.06, "learning_rate": 9.97905541165559e-06, "loss": 1.1318, "step": 2513 }, { "epoch": 0.06, "learning_rate": 9.97902105806344e-06, "loss": 1.0279, "step": 2514 }, { "epoch": 0.06, "learning_rate": 9.978986676379992e-06, "loss": 1.081, "step": 2515 }, { "epoch": 0.06, "learning_rate": 9.978952266605439e-06, "loss": 1.0409, "step": 2516 }, { "epoch": 0.06, "learning_rate": 9.978917828739975e-06, "loss": 0.9796, "step": 2517 }, { "epoch": 0.06, "learning_rate": 9.978883362783798e-06, "loss": 1.2283, "step": 2518 }, { "epoch": 0.06, "learning_rate": 9.978848868737099e-06, "loss": 1.2233, "step": 2519 }, { "epoch": 0.06, "learning_rate": 9.978814346600071e-06, "loss": 1.1014, "step": 2520 }, { "epoch": 0.06, "learning_rate": 9.978779796372914e-06, "loss": 0.9544, "step": 2521 }, { "epoch": 0.06, "learning_rate": 9.978745218055818e-06, "loss": 1.1055, "step": 2522 }, { "epoch": 0.06, "learning_rate": 9.97871061164898e-06, "loss": 1.1376, "step": 2523 }, { "epoch": 0.06, "learning_rate": 9.978675977152598e-06, "loss": 1.2044, "step": 2524 }, { "epoch": 0.06, "learning_rate": 9.978641314566863e-06, "loss": 1.1036, "step": 2525 }, { "epoch": 0.06, "learning_rate": 9.978606623891973e-06, "loss": 0.9997, "step": 2526 }, { "epoch": 0.06, "learning_rate": 9.978571905128122e-06, "loss": 1.323, "step": 2527 }, { "epoch": 0.06, "learning_rate": 9.978537158275508e-06, "loss": 1.0966, "step": 2528 }, { "epoch": 0.06, "learning_rate": 9.978502383334325e-06, "loss": 1.0959, "step": 2529 }, { "epoch": 0.06, "learning_rate": 9.97846758030477e-06, "loss": 1.1724, "step": 2530 }, { "epoch": 0.06, "learning_rate": 9.97843274918704e-06, "loss": 1.0393, "step": 2531 }, { "epoch": 0.06, "learning_rate": 9.978397889981332e-06, "loss": 1.1252, "step": 2532 }, { "epoch": 0.06, "learning_rate": 9.97836300268784e-06, "loss": 1.2466, "step": 2533 }, { "epoch": 0.06, "learning_rate": 9.978328087306765e-06, "loss": 1.1072, "step": 2534 }, { "epoch": 0.06, "learning_rate": 9.9782931438383e-06, "loss": 1.0111, "step": 2535 }, { "epoch": 0.06, "learning_rate": 9.978258172282643e-06, "loss": 1.0677, "step": 2536 }, { "epoch": 0.06, "learning_rate": 9.978223172639994e-06, "loss": 0.9246, "step": 2537 }, { "epoch": 0.06, "learning_rate": 9.978188144910547e-06, "loss": 1.1921, "step": 2538 }, { "epoch": 0.06, "learning_rate": 9.978153089094502e-06, "loss": 1.1901, "step": 2539 }, { "epoch": 0.06, "learning_rate": 9.978118005192054e-06, "loss": 0.9476, "step": 2540 }, { "epoch": 0.06, "learning_rate": 9.978082893203405e-06, "loss": 0.9612, "step": 2541 }, { "epoch": 0.06, "learning_rate": 9.97804775312875e-06, "loss": 1.3081, "step": 2542 }, { "epoch": 0.06, "learning_rate": 9.978012584968288e-06, "loss": 1.1531, "step": 2543 }, { "epoch": 0.06, "learning_rate": 9.977977388722217e-06, "loss": 1.0469, "step": 2544 }, { "epoch": 0.06, "learning_rate": 9.977942164390738e-06, "loss": 1.0955, "step": 2545 }, { "epoch": 0.06, "learning_rate": 9.977906911974046e-06, "loss": 1.3647, "step": 2546 }, { "epoch": 0.06, "learning_rate": 9.977871631472343e-06, "loss": 1.0695, "step": 2547 }, { "epoch": 0.06, "learning_rate": 9.977836322885827e-06, "loss": 1.073, "step": 2548 }, { "epoch": 0.06, "learning_rate": 9.977800986214697e-06, "loss": 1.166, "step": 2549 }, { "epoch": 0.06, "learning_rate": 9.977765621459153e-06, "loss": 1.2651, "step": 2550 }, { "epoch": 0.06, "learning_rate": 9.977730228619391e-06, "loss": 1.132, "step": 2551 }, { "epoch": 0.06, "learning_rate": 9.977694807695617e-06, "loss": 1.1822, "step": 2552 }, { "epoch": 0.06, "learning_rate": 9.977659358688025e-06, "loss": 1.0577, "step": 2553 }, { "epoch": 0.06, "learning_rate": 9.977623881596818e-06, "loss": 1.2185, "step": 2554 }, { "epoch": 0.06, "learning_rate": 9.977588376422199e-06, "loss": 0.8814, "step": 2555 }, { "epoch": 0.06, "learning_rate": 9.977552843164361e-06, "loss": 1.1163, "step": 2556 }, { "epoch": 0.06, "learning_rate": 9.97751728182351e-06, "loss": 0.7689, "step": 2557 }, { "epoch": 0.06, "learning_rate": 9.977481692399844e-06, "loss": 1.0452, "step": 2558 }, { "epoch": 0.06, "learning_rate": 9.977446074893567e-06, "loss": 1.2044, "step": 2559 }, { "epoch": 0.06, "learning_rate": 9.977410429304874e-06, "loss": 1.4217, "step": 2560 }, { "epoch": 0.06, "learning_rate": 9.977374755633973e-06, "loss": 0.8754, "step": 2561 }, { "epoch": 0.06, "learning_rate": 9.977339053881062e-06, "loss": 1.16, "step": 2562 }, { "epoch": 0.06, "learning_rate": 9.977303324046342e-06, "loss": 1.1556, "step": 2563 }, { "epoch": 0.06, "learning_rate": 9.977267566130015e-06, "loss": 1.0347, "step": 2564 }, { "epoch": 0.06, "learning_rate": 9.977231780132284e-06, "loss": 1.1905, "step": 2565 }, { "epoch": 0.06, "learning_rate": 9.97719596605335e-06, "loss": 0.9431, "step": 2566 }, { "epoch": 0.06, "learning_rate": 9.977160123893412e-06, "loss": 0.9091, "step": 2567 }, { "epoch": 0.06, "learning_rate": 9.977124253652678e-06, "loss": 1.0472, "step": 2568 }, { "epoch": 0.06, "learning_rate": 9.977088355331347e-06, "loss": 1.0319, "step": 2569 }, { "epoch": 0.06, "learning_rate": 9.97705242892962e-06, "loss": 1.0799, "step": 2570 }, { "epoch": 0.06, "learning_rate": 9.977016474447704e-06, "loss": 0.9922, "step": 2571 }, { "epoch": 0.06, "learning_rate": 9.9769804918858e-06, "loss": 0.87, "step": 2572 }, { "epoch": 0.06, "learning_rate": 9.97694448124411e-06, "loss": 1.37, "step": 2573 }, { "epoch": 0.06, "learning_rate": 9.976908442522837e-06, "loss": 0.9154, "step": 2574 }, { "epoch": 0.06, "learning_rate": 9.976872375722185e-06, "loss": 1.0029, "step": 2575 }, { "epoch": 0.06, "learning_rate": 9.976836280842358e-06, "loss": 1.3845, "step": 2576 }, { "epoch": 0.06, "learning_rate": 9.976800157883559e-06, "loss": 1.0114, "step": 2577 }, { "epoch": 0.06, "learning_rate": 9.976764006845994e-06, "loss": 0.9927, "step": 2578 }, { "epoch": 0.06, "learning_rate": 9.976727827729862e-06, "loss": 1.241, "step": 2579 }, { "epoch": 0.06, "learning_rate": 9.976691620535372e-06, "loss": 0.9885, "step": 2580 }, { "epoch": 0.06, "learning_rate": 9.976655385262725e-06, "loss": 1.1419, "step": 2581 }, { "epoch": 0.06, "learning_rate": 9.97661912191213e-06, "loss": 1.1456, "step": 2582 }, { "epoch": 0.06, "learning_rate": 9.976582830483785e-06, "loss": 1.1823, "step": 2583 }, { "epoch": 0.06, "learning_rate": 9.976546510977898e-06, "loss": 1.1577, "step": 2584 }, { "epoch": 0.06, "learning_rate": 9.976510163394677e-06, "loss": 0.9172, "step": 2585 }, { "epoch": 0.06, "learning_rate": 9.976473787734322e-06, "loss": 1.0379, "step": 2586 }, { "epoch": 0.06, "learning_rate": 9.976437383997041e-06, "loss": 0.9258, "step": 2587 }, { "epoch": 0.06, "learning_rate": 9.976400952183038e-06, "loss": 1.2037, "step": 2588 }, { "epoch": 0.06, "learning_rate": 9.976364492292521e-06, "loss": 0.7991, "step": 2589 }, { "epoch": 0.06, "learning_rate": 9.976328004325694e-06, "loss": 1.2188, "step": 2590 }, { "epoch": 0.06, "learning_rate": 9.976291488282761e-06, "loss": 1.1756, "step": 2591 }, { "epoch": 0.06, "learning_rate": 9.97625494416393e-06, "loss": 1.0473, "step": 2592 }, { "epoch": 0.06, "learning_rate": 9.976218371969408e-06, "loss": 0.9732, "step": 2593 }, { "epoch": 0.06, "learning_rate": 9.9761817716994e-06, "loss": 1.1907, "step": 2594 }, { "epoch": 0.06, "learning_rate": 9.976145143354115e-06, "loss": 0.7972, "step": 2595 }, { "epoch": 0.06, "learning_rate": 9.976108486933755e-06, "loss": 1.2905, "step": 2596 }, { "epoch": 0.06, "learning_rate": 9.97607180243853e-06, "loss": 1.1636, "step": 2597 }, { "epoch": 0.06, "learning_rate": 9.976035089868647e-06, "loss": 0.9982, "step": 2598 }, { "epoch": 0.06, "learning_rate": 9.975998349224312e-06, "loss": 1.1735, "step": 2599 }, { "epoch": 0.06, "learning_rate": 9.975961580505734e-06, "loss": 1.2002, "step": 2600 }, { "epoch": 0.06, "learning_rate": 9.975924783713117e-06, "loss": 1.1099, "step": 2601 }, { "epoch": 0.06, "learning_rate": 9.975887958846673e-06, "loss": 1.0986, "step": 2602 }, { "epoch": 0.06, "learning_rate": 9.975851105906606e-06, "loss": 1.3815, "step": 2603 }, { "epoch": 0.06, "learning_rate": 9.975814224893126e-06, "loss": 1.2087, "step": 2604 }, { "epoch": 0.06, "learning_rate": 9.97577731580644e-06, "loss": 1.0909, "step": 2605 }, { "epoch": 0.06, "learning_rate": 9.975740378646758e-06, "loss": 0.77, "step": 2606 }, { "epoch": 0.06, "learning_rate": 9.975703413414286e-06, "loss": 1.2479, "step": 2607 }, { "epoch": 0.06, "learning_rate": 9.975666420109235e-06, "loss": 1.3397, "step": 2608 }, { "epoch": 0.06, "learning_rate": 9.975629398731813e-06, "loss": 0.9701, "step": 2609 }, { "epoch": 0.06, "learning_rate": 9.975592349282226e-06, "loss": 1.2868, "step": 2610 }, { "epoch": 0.06, "learning_rate": 9.975555271760687e-06, "loss": 1.126, "step": 2611 }, { "epoch": 0.06, "learning_rate": 9.975518166167404e-06, "loss": 1.1516, "step": 2612 }, { "epoch": 0.06, "learning_rate": 9.975481032502585e-06, "loss": 1.0802, "step": 2613 }, { "epoch": 0.06, "learning_rate": 9.975443870766441e-06, "loss": 1.3031, "step": 2614 }, { "epoch": 0.06, "learning_rate": 9.975406680959181e-06, "loss": 1.1384, "step": 2615 }, { "epoch": 0.06, "learning_rate": 9.975369463081015e-06, "loss": 0.9396, "step": 2616 }, { "epoch": 0.06, "learning_rate": 9.975332217132153e-06, "loss": 1.0089, "step": 2617 }, { "epoch": 0.06, "learning_rate": 9.975294943112805e-06, "loss": 1.2618, "step": 2618 }, { "epoch": 0.06, "learning_rate": 9.975257641023182e-06, "loss": 1.1794, "step": 2619 }, { "epoch": 0.06, "learning_rate": 9.97522031086349e-06, "loss": 0.986, "step": 2620 }, { "epoch": 0.06, "learning_rate": 9.975182952633949e-06, "loss": 1.044, "step": 2621 }, { "epoch": 0.06, "learning_rate": 9.97514556633476e-06, "loss": 1.1346, "step": 2622 }, { "epoch": 0.06, "learning_rate": 9.975108151966141e-06, "loss": 1.1021, "step": 2623 }, { "epoch": 0.06, "learning_rate": 9.975070709528299e-06, "loss": 1.1847, "step": 2624 }, { "epoch": 0.06, "learning_rate": 9.975033239021446e-06, "loss": 0.9984, "step": 2625 }, { "epoch": 0.06, "learning_rate": 9.974995740445794e-06, "loss": 1.23, "step": 2626 }, { "epoch": 0.06, "learning_rate": 9.974958213801555e-06, "loss": 1.0948, "step": 2627 }, { "epoch": 0.06, "learning_rate": 9.97492065908894e-06, "loss": 1.031, "step": 2628 }, { "epoch": 0.06, "learning_rate": 9.97488307630816e-06, "loss": 0.9692, "step": 2629 }, { "epoch": 0.06, "learning_rate": 9.974845465459429e-06, "loss": 0.8888, "step": 2630 }, { "epoch": 0.06, "learning_rate": 9.974807826542958e-06, "loss": 0.8682, "step": 2631 }, { "epoch": 0.06, "learning_rate": 9.97477015955896e-06, "loss": 1.0413, "step": 2632 }, { "epoch": 0.06, "learning_rate": 9.974732464507648e-06, "loss": 1.4472, "step": 2633 }, { "epoch": 0.06, "learning_rate": 9.974694741389233e-06, "loss": 1.3341, "step": 2634 }, { "epoch": 0.06, "learning_rate": 9.974656990203929e-06, "loss": 0.7686, "step": 2635 }, { "epoch": 0.06, "learning_rate": 9.974619210951947e-06, "loss": 1.3847, "step": 2636 }, { "epoch": 0.06, "learning_rate": 9.974581403633502e-06, "loss": 1.112, "step": 2637 }, { "epoch": 0.06, "learning_rate": 9.974543568248809e-06, "loss": 1.1618, "step": 2638 }, { "epoch": 0.06, "learning_rate": 9.974505704798078e-06, "loss": 0.9664, "step": 2639 }, { "epoch": 0.06, "learning_rate": 9.974467813281526e-06, "loss": 1.1241, "step": 2640 }, { "epoch": 0.06, "learning_rate": 9.974429893699363e-06, "loss": 1.1294, "step": 2641 }, { "epoch": 0.06, "learning_rate": 9.974391946051806e-06, "loss": 0.8548, "step": 2642 }, { "epoch": 0.06, "learning_rate": 9.974353970339068e-06, "loss": 1.1058, "step": 2643 }, { "epoch": 0.06, "learning_rate": 9.974315966561363e-06, "loss": 1.3466, "step": 2644 }, { "epoch": 0.06, "learning_rate": 9.974277934718905e-06, "loss": 1.3913, "step": 2645 }, { "epoch": 0.06, "learning_rate": 9.97423987481191e-06, "loss": 0.9315, "step": 2646 }, { "epoch": 0.06, "learning_rate": 9.974201786840592e-06, "loss": 1.2875, "step": 2647 }, { "epoch": 0.06, "learning_rate": 9.974163670805167e-06, "loss": 0.9647, "step": 2648 }, { "epoch": 0.06, "learning_rate": 9.974125526705846e-06, "loss": 1.145, "step": 2649 }, { "epoch": 0.06, "learning_rate": 9.974087354542848e-06, "loss": 1.1659, "step": 2650 }, { "epoch": 0.06, "learning_rate": 9.974049154316388e-06, "loss": 1.3151, "step": 2651 }, { "epoch": 0.06, "learning_rate": 9.974010926026681e-06, "loss": 1.0622, "step": 2652 }, { "epoch": 0.06, "learning_rate": 9.973972669673943e-06, "loss": 1.3992, "step": 2653 }, { "epoch": 0.06, "learning_rate": 9.97393438525839e-06, "loss": 1.5295, "step": 2654 }, { "epoch": 0.06, "learning_rate": 9.973896072780237e-06, "loss": 1.1111, "step": 2655 }, { "epoch": 0.06, "learning_rate": 9.9738577322397e-06, "loss": 1.1341, "step": 2656 }, { "epoch": 0.06, "learning_rate": 9.973819363636997e-06, "loss": 0.8523, "step": 2657 }, { "epoch": 0.06, "learning_rate": 9.973780966972343e-06, "loss": 1.069, "step": 2658 }, { "epoch": 0.06, "learning_rate": 9.973742542245955e-06, "loss": 1.2015, "step": 2659 }, { "epoch": 0.06, "learning_rate": 9.97370408945805e-06, "loss": 0.9228, "step": 2660 }, { "epoch": 0.06, "learning_rate": 9.973665608608844e-06, "loss": 0.8225, "step": 2661 }, { "epoch": 0.06, "learning_rate": 9.973627099698557e-06, "loss": 1.2587, "step": 2662 }, { "epoch": 0.06, "learning_rate": 9.973588562727403e-06, "loss": 1.1453, "step": 2663 }, { "epoch": 0.06, "learning_rate": 9.973549997695602e-06, "loss": 1.3107, "step": 2664 }, { "epoch": 0.06, "learning_rate": 9.973511404603368e-06, "loss": 0.952, "step": 2665 }, { "epoch": 0.06, "learning_rate": 9.973472783450921e-06, "loss": 1.0667, "step": 2666 }, { "epoch": 0.06, "learning_rate": 9.97343413423848e-06, "loss": 1.0926, "step": 2667 }, { "epoch": 0.06, "learning_rate": 9.973395456966262e-06, "loss": 1.0915, "step": 2668 }, { "epoch": 0.06, "learning_rate": 9.973356751634484e-06, "loss": 1.0205, "step": 2669 }, { "epoch": 0.06, "learning_rate": 9.973318018243366e-06, "loss": 1.1349, "step": 2670 }, { "epoch": 0.06, "learning_rate": 9.973279256793126e-06, "loss": 1.1246, "step": 2671 }, { "epoch": 0.06, "learning_rate": 9.973240467283985e-06, "loss": 1.0404, "step": 2672 }, { "epoch": 0.06, "learning_rate": 9.973201649716155e-06, "loss": 1.0429, "step": 2673 }, { "epoch": 0.06, "learning_rate": 9.973162804089863e-06, "loss": 1.0954, "step": 2674 }, { "epoch": 0.06, "learning_rate": 9.973123930405324e-06, "loss": 1.0698, "step": 2675 }, { "epoch": 0.06, "learning_rate": 9.973085028662758e-06, "loss": 1.1731, "step": 2676 }, { "epoch": 0.06, "learning_rate": 9.973046098862384e-06, "loss": 1.058, "step": 2677 }, { "epoch": 0.06, "learning_rate": 9.973007141004423e-06, "loss": 1.0562, "step": 2678 }, { "epoch": 0.06, "learning_rate": 9.972968155089093e-06, "loss": 1.0737, "step": 2679 }, { "epoch": 0.06, "learning_rate": 9.972929141116616e-06, "loss": 1.1596, "step": 2680 }, { "epoch": 0.06, "learning_rate": 9.972890099087212e-06, "loss": 1.1078, "step": 2681 }, { "epoch": 0.06, "learning_rate": 9.972851029001099e-06, "loss": 1.1613, "step": 2682 }, { "epoch": 0.06, "learning_rate": 9.972811930858496e-06, "loss": 0.9003, "step": 2683 }, { "epoch": 0.06, "learning_rate": 9.97277280465963e-06, "loss": 1.2046, "step": 2684 }, { "epoch": 0.06, "learning_rate": 9.972733650404718e-06, "loss": 1.0442, "step": 2685 }, { "epoch": 0.06, "learning_rate": 9.97269446809398e-06, "loss": 1.3595, "step": 2686 }, { "epoch": 0.06, "learning_rate": 9.972655257727637e-06, "loss": 0.8567, "step": 2687 }, { "epoch": 0.06, "learning_rate": 9.972616019305913e-06, "loss": 1.1863, "step": 2688 }, { "epoch": 0.06, "learning_rate": 9.972576752829025e-06, "loss": 1.0518, "step": 2689 }, { "epoch": 0.06, "learning_rate": 9.972537458297201e-06, "loss": 0.8447, "step": 2690 }, { "epoch": 0.06, "learning_rate": 9.972498135710658e-06, "loss": 1.2537, "step": 2691 }, { "epoch": 0.06, "learning_rate": 9.972458785069616e-06, "loss": 1.2187, "step": 2692 }, { "epoch": 0.06, "learning_rate": 9.972419406374304e-06, "loss": 1.1564, "step": 2693 }, { "epoch": 0.06, "learning_rate": 9.972379999624935e-06, "loss": 1.0199, "step": 2694 }, { "epoch": 0.06, "learning_rate": 9.97234056482174e-06, "loss": 1.189, "step": 2695 }, { "epoch": 0.06, "learning_rate": 9.972301101964936e-06, "loss": 1.1444, "step": 2696 }, { "epoch": 0.06, "learning_rate": 9.972261611054748e-06, "loss": 1.2147, "step": 2697 }, { "epoch": 0.06, "learning_rate": 9.9722220920914e-06, "loss": 1.176, "step": 2698 }, { "epoch": 0.06, "learning_rate": 9.97218254507511e-06, "loss": 1.2612, "step": 2699 }, { "epoch": 0.06, "learning_rate": 9.972142970006106e-06, "loss": 1.1503, "step": 2700 }, { "epoch": 0.06, "learning_rate": 9.972103366884609e-06, "loss": 1.3114, "step": 2701 }, { "epoch": 0.06, "learning_rate": 9.972063735710844e-06, "loss": 0.9019, "step": 2702 }, { "epoch": 0.06, "learning_rate": 9.972024076485031e-06, "loss": 1.131, "step": 2703 }, { "epoch": 0.06, "learning_rate": 9.971984389207399e-06, "loss": 0.9381, "step": 2704 }, { "epoch": 0.06, "learning_rate": 9.971944673878168e-06, "loss": 1.0423, "step": 2705 }, { "epoch": 0.06, "learning_rate": 9.971904930497564e-06, "loss": 1.0887, "step": 2706 }, { "epoch": 0.06, "learning_rate": 9.97186515906581e-06, "loss": 0.968, "step": 2707 }, { "epoch": 0.06, "learning_rate": 9.971825359583132e-06, "loss": 0.9431, "step": 2708 }, { "epoch": 0.06, "learning_rate": 9.971785532049752e-06, "loss": 1.0646, "step": 2709 }, { "epoch": 0.06, "learning_rate": 9.971745676465898e-06, "loss": 0.9873, "step": 2710 }, { "epoch": 0.06, "learning_rate": 9.971705792831792e-06, "loss": 1.0495, "step": 2711 }, { "epoch": 0.06, "learning_rate": 9.97166588114766e-06, "loss": 1.0989, "step": 2712 }, { "epoch": 0.06, "learning_rate": 9.971625941413727e-06, "loss": 0.803, "step": 2713 }, { "epoch": 0.06, "learning_rate": 9.97158597363022e-06, "loss": 1.2178, "step": 2714 }, { "epoch": 0.06, "learning_rate": 9.97154597779736e-06, "loss": 1.3769, "step": 2715 }, { "epoch": 0.06, "learning_rate": 9.97150595391538e-06, "loss": 1.0159, "step": 2716 }, { "epoch": 0.06, "learning_rate": 9.9714659019845e-06, "loss": 1.0505, "step": 2717 }, { "epoch": 0.06, "learning_rate": 9.971425822004946e-06, "loss": 1.1729, "step": 2718 }, { "epoch": 0.06, "learning_rate": 9.971385713976946e-06, "loss": 0.9478, "step": 2719 }, { "epoch": 0.06, "learning_rate": 9.971345577900729e-06, "loss": 1.0774, "step": 2720 }, { "epoch": 0.06, "learning_rate": 9.971305413776516e-06, "loss": 1.1951, "step": 2721 }, { "epoch": 0.06, "learning_rate": 9.971265221604536e-06, "loss": 0.9978, "step": 2722 }, { "epoch": 0.06, "learning_rate": 9.971225001385014e-06, "loss": 1.0904, "step": 2723 }, { "epoch": 0.06, "learning_rate": 9.971184753118181e-06, "loss": 1.0563, "step": 2724 }, { "epoch": 0.06, "learning_rate": 9.971144476804262e-06, "loss": 1.0125, "step": 2725 }, { "epoch": 0.06, "learning_rate": 9.971104172443483e-06, "loss": 0.9815, "step": 2726 }, { "epoch": 0.06, "learning_rate": 9.971063840036073e-06, "loss": 0.9796, "step": 2727 }, { "epoch": 0.06, "learning_rate": 9.971023479582258e-06, "loss": 1.0834, "step": 2728 }, { "epoch": 0.06, "learning_rate": 9.970983091082268e-06, "loss": 1.1239, "step": 2729 }, { "epoch": 0.06, "learning_rate": 9.970942674536329e-06, "loss": 1.17, "step": 2730 }, { "epoch": 0.06, "learning_rate": 9.97090222994467e-06, "loss": 0.9696, "step": 2731 }, { "epoch": 0.06, "learning_rate": 9.970861757307518e-06, "loss": 1.5185, "step": 2732 }, { "epoch": 0.06, "learning_rate": 9.970821256625101e-06, "loss": 1.2965, "step": 2733 }, { "epoch": 0.06, "learning_rate": 9.97078072789765e-06, "loss": 1.0771, "step": 2734 }, { "epoch": 0.06, "learning_rate": 9.970740171125392e-06, "loss": 1.2006, "step": 2735 }, { "epoch": 0.06, "learning_rate": 9.970699586308557e-06, "loss": 1.0772, "step": 2736 }, { "epoch": 0.06, "learning_rate": 9.970658973447371e-06, "loss": 0.9525, "step": 2737 }, { "epoch": 0.06, "learning_rate": 9.970618332542067e-06, "loss": 1.0964, "step": 2738 }, { "epoch": 0.06, "learning_rate": 9.970577663592871e-06, "loss": 1.2048, "step": 2739 }, { "epoch": 0.06, "learning_rate": 9.970536966600015e-06, "loss": 0.8698, "step": 2740 }, { "epoch": 0.06, "learning_rate": 9.970496241563727e-06, "loss": 1.0175, "step": 2741 }, { "epoch": 0.06, "learning_rate": 9.970455488484239e-06, "loss": 1.048, "step": 2742 }, { "epoch": 0.06, "learning_rate": 9.970414707361777e-06, "loss": 1.1473, "step": 2743 }, { "epoch": 0.06, "learning_rate": 9.970373898196575e-06, "loss": 1.1951, "step": 2744 }, { "epoch": 0.06, "learning_rate": 9.97033306098886e-06, "loss": 0.9742, "step": 2745 }, { "epoch": 0.06, "learning_rate": 9.970292195738865e-06, "loss": 1.2297, "step": 2746 }, { "epoch": 0.06, "learning_rate": 9.970251302446818e-06, "loss": 1.0903, "step": 2747 }, { "epoch": 0.06, "learning_rate": 9.970210381112953e-06, "loss": 1.134, "step": 2748 }, { "epoch": 0.06, "learning_rate": 9.970169431737498e-06, "loss": 0.9185, "step": 2749 }, { "epoch": 0.06, "learning_rate": 9.970128454320685e-06, "loss": 0.9885, "step": 2750 }, { "epoch": 0.06, "learning_rate": 9.970087448862746e-06, "loss": 0.9676, "step": 2751 }, { "epoch": 0.06, "learning_rate": 9.970046415363912e-06, "loss": 1.1045, "step": 2752 }, { "epoch": 0.06, "learning_rate": 9.970005353824415e-06, "loss": 1.1452, "step": 2753 }, { "epoch": 0.06, "learning_rate": 9.969964264244482e-06, "loss": 0.839, "step": 2754 }, { "epoch": 0.06, "learning_rate": 9.969923146624353e-06, "loss": 0.8753, "step": 2755 }, { "epoch": 0.06, "learning_rate": 9.969882000964254e-06, "loss": 1.0915, "step": 2756 }, { "epoch": 0.06, "learning_rate": 9.969840827264418e-06, "loss": 1.1627, "step": 2757 }, { "epoch": 0.06, "learning_rate": 9.96979962552508e-06, "loss": 1.2522, "step": 2758 }, { "epoch": 0.06, "learning_rate": 9.969758395746469e-06, "loss": 1.0509, "step": 2759 }, { "epoch": 0.06, "learning_rate": 9.96971713792882e-06, "loss": 0.9786, "step": 2760 }, { "epoch": 0.06, "learning_rate": 9.969675852072365e-06, "loss": 1.119, "step": 2761 }, { "epoch": 0.06, "learning_rate": 9.969634538177335e-06, "loss": 0.9841, "step": 2762 }, { "epoch": 0.06, "learning_rate": 9.969593196243967e-06, "loss": 1.1842, "step": 2763 }, { "epoch": 0.06, "learning_rate": 9.969551826272493e-06, "loss": 1.0877, "step": 2764 }, { "epoch": 0.06, "learning_rate": 9.969510428263142e-06, "loss": 1.2268, "step": 2765 }, { "epoch": 0.06, "learning_rate": 9.969469002216155e-06, "loss": 0.9413, "step": 2766 }, { "epoch": 0.06, "learning_rate": 9.96942754813176e-06, "loss": 1.2997, "step": 2767 }, { "epoch": 0.06, "learning_rate": 9.969386066010192e-06, "loss": 1.2059, "step": 2768 }, { "epoch": 0.06, "learning_rate": 9.969344555851687e-06, "loss": 0.9987, "step": 2769 }, { "epoch": 0.06, "learning_rate": 9.96930301765648e-06, "loss": 1.0131, "step": 2770 }, { "epoch": 0.06, "learning_rate": 9.969261451424801e-06, "loss": 1.0771, "step": 2771 }, { "epoch": 0.06, "learning_rate": 9.969219857156886e-06, "loss": 0.9272, "step": 2772 }, { "epoch": 0.06, "learning_rate": 9.969178234852972e-06, "loss": 1.0062, "step": 2773 }, { "epoch": 0.06, "learning_rate": 9.969136584513292e-06, "loss": 1.1797, "step": 2774 }, { "epoch": 0.06, "learning_rate": 9.96909490613808e-06, "loss": 1.1895, "step": 2775 }, { "epoch": 0.06, "learning_rate": 9.969053199727576e-06, "loss": 0.9343, "step": 2776 }, { "epoch": 0.06, "learning_rate": 9.96901146528201e-06, "loss": 1.1935, "step": 2777 }, { "epoch": 0.06, "learning_rate": 9.96896970280162e-06, "loss": 1.0947, "step": 2778 }, { "epoch": 0.06, "learning_rate": 9.96892791228664e-06, "loss": 1.5579, "step": 2779 }, { "epoch": 0.06, "learning_rate": 9.968886093737306e-06, "loss": 1.1753, "step": 2780 }, { "epoch": 0.06, "learning_rate": 9.968844247153857e-06, "loss": 1.2305, "step": 2781 }, { "epoch": 0.06, "learning_rate": 9.968802372536526e-06, "loss": 0.9322, "step": 2782 }, { "epoch": 0.06, "learning_rate": 9.968760469885548e-06, "loss": 1.1037, "step": 2783 }, { "epoch": 0.06, "learning_rate": 9.968718539201163e-06, "loss": 1.088, "step": 2784 }, { "epoch": 0.06, "learning_rate": 9.968676580483606e-06, "loss": 1.0788, "step": 2785 }, { "epoch": 0.06, "learning_rate": 9.968634593733112e-06, "loss": 0.9158, "step": 2786 }, { "epoch": 0.06, "learning_rate": 9.968592578949923e-06, "loss": 0.9796, "step": 2787 }, { "epoch": 0.06, "learning_rate": 9.96855053613427e-06, "loss": 1.0303, "step": 2788 }, { "epoch": 0.06, "learning_rate": 9.968508465286394e-06, "loss": 0.9284, "step": 2789 }, { "epoch": 0.06, "learning_rate": 9.96846636640653e-06, "loss": 0.9966, "step": 2790 }, { "epoch": 0.06, "learning_rate": 9.968424239494918e-06, "loss": 1.2073, "step": 2791 }, { "epoch": 0.06, "learning_rate": 9.968382084551793e-06, "loss": 1.0397, "step": 2792 }, { "epoch": 0.06, "learning_rate": 9.968339901577396e-06, "loss": 1.054, "step": 2793 }, { "epoch": 0.06, "learning_rate": 9.968297690571961e-06, "loss": 0.9733, "step": 2794 }, { "epoch": 0.06, "learning_rate": 9.968255451535732e-06, "loss": 1.2082, "step": 2795 }, { "epoch": 0.06, "learning_rate": 9.96821318446894e-06, "loss": 1.3153, "step": 2796 }, { "epoch": 0.06, "learning_rate": 9.968170889371828e-06, "loss": 1.0755, "step": 2797 }, { "epoch": 0.06, "learning_rate": 9.968128566244634e-06, "loss": 1.0827, "step": 2798 }, { "epoch": 0.06, "learning_rate": 9.968086215087598e-06, "loss": 1.1515, "step": 2799 }, { "epoch": 0.06, "learning_rate": 9.968043835900955e-06, "loss": 0.8988, "step": 2800 }, { "epoch": 0.06, "learning_rate": 9.96800142868495e-06, "loss": 0.8549, "step": 2801 }, { "epoch": 0.06, "learning_rate": 9.967958993439816e-06, "loss": 1.1154, "step": 2802 }, { "epoch": 0.07, "learning_rate": 9.967916530165796e-06, "loss": 1.1419, "step": 2803 }, { "epoch": 0.07, "learning_rate": 9.967874038863129e-06, "loss": 0.9983, "step": 2804 }, { "epoch": 0.07, "learning_rate": 9.967831519532054e-06, "loss": 1.1789, "step": 2805 }, { "epoch": 0.07, "learning_rate": 9.967788972172812e-06, "loss": 1.0586, "step": 2806 }, { "epoch": 0.07, "learning_rate": 9.967746396785642e-06, "loss": 1.0396, "step": 2807 }, { "epoch": 0.07, "learning_rate": 9.967703793370787e-06, "loss": 0.907, "step": 2808 }, { "epoch": 0.07, "learning_rate": 9.967661161928482e-06, "loss": 0.9443, "step": 2809 }, { "epoch": 0.07, "learning_rate": 9.967618502458974e-06, "loss": 1.2855, "step": 2810 }, { "epoch": 0.07, "learning_rate": 9.967575814962497e-06, "loss": 1.0475, "step": 2811 }, { "epoch": 0.07, "learning_rate": 9.967533099439297e-06, "loss": 1.1292, "step": 2812 }, { "epoch": 0.07, "learning_rate": 9.967490355889612e-06, "loss": 1.2231, "step": 2813 }, { "epoch": 0.07, "learning_rate": 9.967447584313685e-06, "loss": 1.1379, "step": 2814 }, { "epoch": 0.07, "learning_rate": 9.967404784711756e-06, "loss": 0.6811, "step": 2815 }, { "epoch": 0.07, "learning_rate": 9.967361957084068e-06, "loss": 1.1875, "step": 2816 }, { "epoch": 0.07, "learning_rate": 9.967319101430861e-06, "loss": 1.2684, "step": 2817 }, { "epoch": 0.07, "learning_rate": 9.967276217752377e-06, "loss": 1.2484, "step": 2818 }, { "epoch": 0.07, "learning_rate": 9.96723330604886e-06, "loss": 0.9992, "step": 2819 }, { "epoch": 0.07, "learning_rate": 9.967190366320551e-06, "loss": 1.0438, "step": 2820 }, { "epoch": 0.07, "learning_rate": 9.967147398567689e-06, "loss": 1.3211, "step": 2821 }, { "epoch": 0.07, "learning_rate": 9.967104402790522e-06, "loss": 1.1998, "step": 2822 }, { "epoch": 0.07, "learning_rate": 9.96706137898929e-06, "loss": 1.0783, "step": 2823 }, { "epoch": 0.07, "learning_rate": 9.967018327164233e-06, "loss": 1.1844, "step": 2824 }, { "epoch": 0.07, "learning_rate": 9.966975247315599e-06, "loss": 1.1842, "step": 2825 }, { "epoch": 0.07, "learning_rate": 9.966932139443626e-06, "loss": 1.0491, "step": 2826 }, { "epoch": 0.07, "learning_rate": 9.96688900354856e-06, "loss": 1.1972, "step": 2827 }, { "epoch": 0.07, "learning_rate": 9.966845839630646e-06, "loss": 0.9771, "step": 2828 }, { "epoch": 0.07, "learning_rate": 9.966802647690124e-06, "loss": 0.9874, "step": 2829 }, { "epoch": 0.07, "learning_rate": 9.96675942772724e-06, "loss": 1.1699, "step": 2830 }, { "epoch": 0.07, "learning_rate": 9.966716179742237e-06, "loss": 1.0117, "step": 2831 }, { "epoch": 0.07, "learning_rate": 9.96667290373536e-06, "loss": 0.9277, "step": 2832 }, { "epoch": 0.07, "learning_rate": 9.966629599706851e-06, "loss": 1.0862, "step": 2833 }, { "epoch": 0.07, "learning_rate": 9.966586267656957e-06, "loss": 1.2417, "step": 2834 }, { "epoch": 0.07, "learning_rate": 9.966542907585922e-06, "loss": 1.0501, "step": 2835 }, { "epoch": 0.07, "learning_rate": 9.966499519493986e-06, "loss": 1.0434, "step": 2836 }, { "epoch": 0.07, "learning_rate": 9.9664561033814e-06, "loss": 1.1122, "step": 2837 }, { "epoch": 0.07, "learning_rate": 9.966412659248405e-06, "loss": 1.3256, "step": 2838 }, { "epoch": 0.07, "learning_rate": 9.96636918709525e-06, "loss": 1.1135, "step": 2839 }, { "epoch": 0.07, "learning_rate": 9.966325686922177e-06, "loss": 1.017, "step": 2840 }, { "epoch": 0.07, "learning_rate": 9.966282158729431e-06, "loss": 1.169, "step": 2841 }, { "epoch": 0.07, "learning_rate": 9.96623860251726e-06, "loss": 1.4241, "step": 2842 }, { "epoch": 0.07, "learning_rate": 9.966195018285907e-06, "loss": 1.1124, "step": 2843 }, { "epoch": 0.07, "learning_rate": 9.966151406035622e-06, "loss": 1.0136, "step": 2844 }, { "epoch": 0.07, "learning_rate": 9.966107765766646e-06, "loss": 1.2189, "step": 2845 }, { "epoch": 0.07, "learning_rate": 9.96606409747923e-06, "loss": 1.0696, "step": 2846 }, { "epoch": 0.07, "learning_rate": 9.966020401173617e-06, "loss": 1.0948, "step": 2847 }, { "epoch": 0.07, "learning_rate": 9.965976676850056e-06, "loss": 1.2643, "step": 2848 }, { "epoch": 0.07, "learning_rate": 9.965932924508793e-06, "loss": 1.132, "step": 2849 }, { "epoch": 0.07, "learning_rate": 9.965889144150072e-06, "loss": 1.0823, "step": 2850 }, { "epoch": 0.07, "learning_rate": 9.965845335774142e-06, "loss": 0.8347, "step": 2851 }, { "epoch": 0.07, "learning_rate": 9.965801499381252e-06, "loss": 1.0629, "step": 2852 }, { "epoch": 0.07, "learning_rate": 9.965757634971647e-06, "loss": 0.8783, "step": 2853 }, { "epoch": 0.07, "learning_rate": 9.965713742545574e-06, "loss": 1.1555, "step": 2854 }, { "epoch": 0.07, "learning_rate": 9.965669822103284e-06, "loss": 1.0851, "step": 2855 }, { "epoch": 0.07, "learning_rate": 9.96562587364502e-06, "loss": 0.9688, "step": 2856 }, { "epoch": 0.07, "learning_rate": 9.965581897171034e-06, "loss": 1.1772, "step": 2857 }, { "epoch": 0.07, "learning_rate": 9.965537892681573e-06, "loss": 1.3468, "step": 2858 }, { "epoch": 0.07, "learning_rate": 9.965493860176887e-06, "loss": 1.2476, "step": 2859 }, { "epoch": 0.07, "learning_rate": 9.965449799657219e-06, "loss": 1.2074, "step": 2860 }, { "epoch": 0.07, "learning_rate": 9.965405711122823e-06, "loss": 0.9548, "step": 2861 }, { "epoch": 0.07, "learning_rate": 9.965361594573943e-06, "loss": 1.2655, "step": 2862 }, { "epoch": 0.07, "learning_rate": 9.965317450010833e-06, "loss": 1.1382, "step": 2863 }, { "epoch": 0.07, "learning_rate": 9.96527327743374e-06, "loss": 1.1281, "step": 2864 }, { "epoch": 0.07, "learning_rate": 9.965229076842912e-06, "loss": 1.0105, "step": 2865 }, { "epoch": 0.07, "learning_rate": 9.965184848238599e-06, "loss": 1.1446, "step": 2866 }, { "epoch": 0.07, "learning_rate": 9.965140591621051e-06, "loss": 1.225, "step": 2867 }, { "epoch": 0.07, "learning_rate": 9.965096306990518e-06, "loss": 0.8851, "step": 2868 }, { "epoch": 0.07, "learning_rate": 9.96505199434725e-06, "loss": 1.0971, "step": 2869 }, { "epoch": 0.07, "learning_rate": 9.965007653691495e-06, "loss": 0.7563, "step": 2870 }, { "epoch": 0.07, "learning_rate": 9.964963285023506e-06, "loss": 1.2661, "step": 2871 }, { "epoch": 0.07, "learning_rate": 9.964918888343531e-06, "loss": 1.1042, "step": 2872 }, { "epoch": 0.07, "learning_rate": 9.964874463651821e-06, "loss": 1.1374, "step": 2873 }, { "epoch": 0.07, "learning_rate": 9.964830010948628e-06, "loss": 0.7578, "step": 2874 }, { "epoch": 0.07, "learning_rate": 9.9647855302342e-06, "loss": 1.1209, "step": 2875 }, { "epoch": 0.07, "learning_rate": 9.96474102150879e-06, "loss": 1.0472, "step": 2876 }, { "epoch": 0.07, "learning_rate": 9.96469648477265e-06, "loss": 0.9054, "step": 2877 }, { "epoch": 0.07, "learning_rate": 9.964651920026029e-06, "loss": 1.0213, "step": 2878 }, { "epoch": 0.07, "learning_rate": 9.96460732726918e-06, "loss": 0.9993, "step": 2879 }, { "epoch": 0.07, "learning_rate": 9.964562706502357e-06, "loss": 1.0339, "step": 2880 }, { "epoch": 0.07, "learning_rate": 9.964518057725805e-06, "loss": 1.1011, "step": 2881 }, { "epoch": 0.07, "learning_rate": 9.96447338093978e-06, "loss": 0.9429, "step": 2882 }, { "epoch": 0.07, "learning_rate": 9.964428676144537e-06, "loss": 1.0307, "step": 2883 }, { "epoch": 0.07, "learning_rate": 9.964383943340323e-06, "loss": 1.1108, "step": 2884 }, { "epoch": 0.07, "learning_rate": 9.964339182527393e-06, "loss": 1.012, "step": 2885 }, { "epoch": 0.07, "learning_rate": 9.964294393705998e-06, "loss": 1.0091, "step": 2886 }, { "epoch": 0.07, "learning_rate": 9.964249576876392e-06, "loss": 1.0461, "step": 2887 }, { "epoch": 0.07, "learning_rate": 9.964204732038829e-06, "loss": 1.0997, "step": 2888 }, { "epoch": 0.07, "learning_rate": 9.964159859193558e-06, "loss": 0.8836, "step": 2889 }, { "epoch": 0.07, "learning_rate": 9.964114958340837e-06, "loss": 0.9475, "step": 2890 }, { "epoch": 0.07, "learning_rate": 9.964070029480917e-06, "loss": 1.1458, "step": 2891 }, { "epoch": 0.07, "learning_rate": 9.964025072614049e-06, "loss": 0.9036, "step": 2892 }, { "epoch": 0.07, "learning_rate": 9.963980087740492e-06, "loss": 1.0127, "step": 2893 }, { "epoch": 0.07, "learning_rate": 9.963935074860496e-06, "loss": 1.1895, "step": 2894 }, { "epoch": 0.07, "learning_rate": 9.963890033974316e-06, "loss": 1.0623, "step": 2895 }, { "epoch": 0.07, "learning_rate": 9.963844965082206e-06, "loss": 0.8595, "step": 2896 }, { "epoch": 0.07, "learning_rate": 9.96379986818442e-06, "loss": 1.2882, "step": 2897 }, { "epoch": 0.07, "learning_rate": 9.963754743281213e-06, "loss": 1.2777, "step": 2898 }, { "epoch": 0.07, "learning_rate": 9.96370959037284e-06, "loss": 0.9052, "step": 2899 }, { "epoch": 0.07, "learning_rate": 9.963664409459554e-06, "loss": 0.952, "step": 2900 }, { "epoch": 0.07, "learning_rate": 9.963619200541612e-06, "loss": 1.1131, "step": 2901 }, { "epoch": 0.07, "learning_rate": 9.963573963619269e-06, "loss": 1.1293, "step": 2902 }, { "epoch": 0.07, "learning_rate": 9.963528698692777e-06, "loss": 1.0981, "step": 2903 }, { "epoch": 0.07, "learning_rate": 9.963483405762396e-06, "loss": 1.2644, "step": 2904 }, { "epoch": 0.07, "learning_rate": 9.963438084828377e-06, "loss": 1.1331, "step": 2905 }, { "epoch": 0.07, "learning_rate": 9.96339273589098e-06, "loss": 1.1452, "step": 2906 }, { "epoch": 0.07, "learning_rate": 9.963347358950457e-06, "loss": 1.1721, "step": 2907 }, { "epoch": 0.07, "learning_rate": 9.963301954007067e-06, "loss": 1.1049, "step": 2908 }, { "epoch": 0.07, "learning_rate": 9.963256521061064e-06, "loss": 1.028, "step": 2909 }, { "epoch": 0.07, "learning_rate": 9.963211060112707e-06, "loss": 0.9328, "step": 2910 }, { "epoch": 0.07, "learning_rate": 9.96316557116225e-06, "loss": 1.0133, "step": 2911 }, { "epoch": 0.07, "learning_rate": 9.963120054209949e-06, "loss": 1.2584, "step": 2912 }, { "epoch": 0.07, "learning_rate": 9.963074509256062e-06, "loss": 0.9941, "step": 2913 }, { "epoch": 0.07, "learning_rate": 9.96302893630085e-06, "loss": 1.0131, "step": 2914 }, { "epoch": 0.07, "learning_rate": 9.962983335344563e-06, "loss": 1.2125, "step": 2915 }, { "epoch": 0.07, "learning_rate": 9.962937706387463e-06, "loss": 1.1661, "step": 2916 }, { "epoch": 0.07, "learning_rate": 9.962892049429806e-06, "loss": 0.9681, "step": 2917 }, { "epoch": 0.07, "learning_rate": 9.962846364471848e-06, "loss": 0.9382, "step": 2918 }, { "epoch": 0.07, "learning_rate": 9.96280065151385e-06, "loss": 1.1396, "step": 2919 }, { "epoch": 0.07, "learning_rate": 9.962754910556068e-06, "loss": 0.8761, "step": 2920 }, { "epoch": 0.07, "learning_rate": 9.96270914159876e-06, "loss": 1.0562, "step": 2921 }, { "epoch": 0.07, "learning_rate": 9.962663344642184e-06, "loss": 0.9429, "step": 2922 }, { "epoch": 0.07, "learning_rate": 9.962617519686602e-06, "loss": 1.1535, "step": 2923 }, { "epoch": 0.07, "learning_rate": 9.962571666732266e-06, "loss": 1.1152, "step": 2924 }, { "epoch": 0.07, "learning_rate": 9.96252578577944e-06, "loss": 0.8888, "step": 2925 }, { "epoch": 0.07, "learning_rate": 9.96247987682838e-06, "loss": 0.953, "step": 2926 }, { "epoch": 0.07, "learning_rate": 9.962433939879347e-06, "loss": 1.1428, "step": 2927 }, { "epoch": 0.07, "learning_rate": 9.962387974932599e-06, "loss": 1.2241, "step": 2928 }, { "epoch": 0.07, "learning_rate": 9.962341981988394e-06, "loss": 1.0592, "step": 2929 }, { "epoch": 0.07, "learning_rate": 9.962295961046996e-06, "loss": 1.0958, "step": 2930 }, { "epoch": 0.07, "learning_rate": 9.96224991210866e-06, "loss": 1.4402, "step": 2931 }, { "epoch": 0.07, "learning_rate": 9.962203835173648e-06, "loss": 0.9723, "step": 2932 }, { "epoch": 0.07, "learning_rate": 9.962157730242218e-06, "loss": 1.0259, "step": 2933 }, { "epoch": 0.07, "learning_rate": 9.962111597314635e-06, "loss": 1.0878, "step": 2934 }, { "epoch": 0.07, "learning_rate": 9.962065436391152e-06, "loss": 1.077, "step": 2935 }, { "epoch": 0.07, "learning_rate": 9.962019247472037e-06, "loss": 1.2034, "step": 2936 }, { "epoch": 0.07, "learning_rate": 9.961973030557545e-06, "loss": 1.3878, "step": 2937 }, { "epoch": 0.07, "learning_rate": 9.961926785647939e-06, "loss": 1.1743, "step": 2938 }, { "epoch": 0.07, "learning_rate": 9.961880512743479e-06, "loss": 0.9301, "step": 2939 }, { "epoch": 0.07, "learning_rate": 9.961834211844427e-06, "loss": 1.0308, "step": 2940 }, { "epoch": 0.07, "learning_rate": 9.961787882951043e-06, "loss": 1.2607, "step": 2941 }, { "epoch": 0.07, "learning_rate": 9.96174152606359e-06, "loss": 0.9544, "step": 2942 }, { "epoch": 0.07, "learning_rate": 9.96169514118233e-06, "loss": 1.1336, "step": 2943 }, { "epoch": 0.07, "learning_rate": 9.961648728307523e-06, "loss": 0.9916, "step": 2944 }, { "epoch": 0.07, "learning_rate": 9.96160228743943e-06, "loss": 1.0949, "step": 2945 }, { "epoch": 0.07, "learning_rate": 9.961555818578315e-06, "loss": 1.0613, "step": 2946 }, { "epoch": 0.07, "learning_rate": 9.96150932172444e-06, "loss": 0.89, "step": 2947 }, { "epoch": 0.07, "learning_rate": 9.961462796878067e-06, "loss": 0.9789, "step": 2948 }, { "epoch": 0.07, "learning_rate": 9.961416244039458e-06, "loss": 1.3122, "step": 2949 }, { "epoch": 0.07, "learning_rate": 9.961369663208876e-06, "loss": 0.9101, "step": 2950 }, { "epoch": 0.07, "learning_rate": 9.961323054386585e-06, "loss": 1.2856, "step": 2951 }, { "epoch": 0.07, "learning_rate": 9.961276417572845e-06, "loss": 0.946, "step": 2952 }, { "epoch": 0.07, "learning_rate": 9.961229752767921e-06, "loss": 1.1908, "step": 2953 }, { "epoch": 0.07, "learning_rate": 9.961183059972078e-06, "loss": 1.02, "step": 2954 }, { "epoch": 0.07, "learning_rate": 9.961136339185576e-06, "loss": 0.9994, "step": 2955 }, { "epoch": 0.07, "learning_rate": 9.961089590408681e-06, "loss": 1.1445, "step": 2956 }, { "epoch": 0.07, "learning_rate": 9.961042813641655e-06, "loss": 0.9636, "step": 2957 }, { "epoch": 0.07, "learning_rate": 9.960996008884765e-06, "loss": 1.1892, "step": 2958 }, { "epoch": 0.07, "learning_rate": 9.96094917613827e-06, "loss": 0.9033, "step": 2959 }, { "epoch": 0.07, "learning_rate": 9.960902315402439e-06, "loss": 0.9875, "step": 2960 }, { "epoch": 0.07, "learning_rate": 9.960855426677533e-06, "loss": 0.9763, "step": 2961 }, { "epoch": 0.07, "learning_rate": 9.96080850996382e-06, "loss": 1.0534, "step": 2962 }, { "epoch": 0.07, "learning_rate": 9.960761565261564e-06, "loss": 0.9247, "step": 2963 }, { "epoch": 0.07, "learning_rate": 9.960714592571025e-06, "loss": 1.177, "step": 2964 }, { "epoch": 0.07, "learning_rate": 9.960667591892474e-06, "loss": 0.9652, "step": 2965 }, { "epoch": 0.07, "learning_rate": 9.960620563226175e-06, "loss": 0.8642, "step": 2966 }, { "epoch": 0.07, "learning_rate": 9.960573506572391e-06, "loss": 1.0465, "step": 2967 }, { "epoch": 0.07, "learning_rate": 9.960526421931387e-06, "loss": 1.2409, "step": 2968 }, { "epoch": 0.07, "learning_rate": 9.960479309303432e-06, "loss": 1.1202, "step": 2969 }, { "epoch": 0.07, "learning_rate": 9.96043216868879e-06, "loss": 0.8549, "step": 2970 }, { "epoch": 0.07, "learning_rate": 9.960385000087727e-06, "loss": 1.116, "step": 2971 }, { "epoch": 0.07, "learning_rate": 9.960337803500509e-06, "loss": 1.1178, "step": 2972 }, { "epoch": 0.07, "learning_rate": 9.960290578927403e-06, "loss": 1.264, "step": 2973 }, { "epoch": 0.07, "learning_rate": 9.960243326368675e-06, "loss": 1.1258, "step": 2974 }, { "epoch": 0.07, "learning_rate": 9.96019604582459e-06, "loss": 0.9445, "step": 2975 }, { "epoch": 0.07, "learning_rate": 9.960148737295419e-06, "loss": 1.143, "step": 2976 }, { "epoch": 0.07, "learning_rate": 9.960101400781424e-06, "loss": 0.9604, "step": 2977 }, { "epoch": 0.07, "learning_rate": 9.960054036282875e-06, "loss": 1.2557, "step": 2978 }, { "epoch": 0.07, "learning_rate": 9.96000664380004e-06, "loss": 1.15, "step": 2979 }, { "epoch": 0.07, "learning_rate": 9.959959223333182e-06, "loss": 1.043, "step": 2980 }, { "epoch": 0.07, "learning_rate": 9.959911774882573e-06, "loss": 0.8682, "step": 2981 }, { "epoch": 0.07, "learning_rate": 9.95986429844848e-06, "loss": 1.0188, "step": 2982 }, { "epoch": 0.07, "learning_rate": 9.959816794031168e-06, "loss": 0.9987, "step": 2983 }, { "epoch": 0.07, "learning_rate": 9.95976926163091e-06, "loss": 1.092, "step": 2984 }, { "epoch": 0.07, "learning_rate": 9.959721701247968e-06, "loss": 0.8709, "step": 2985 }, { "epoch": 0.07, "learning_rate": 9.959674112882615e-06, "loss": 1.0719, "step": 2986 }, { "epoch": 0.07, "learning_rate": 9.959626496535118e-06, "loss": 1.1022, "step": 2987 }, { "epoch": 0.07, "learning_rate": 9.959578852205745e-06, "loss": 1.3001, "step": 2988 }, { "epoch": 0.07, "learning_rate": 9.959531179894766e-06, "loss": 1.0335, "step": 2989 }, { "epoch": 0.07, "learning_rate": 9.95948347960245e-06, "loss": 1.1263, "step": 2990 }, { "epoch": 0.07, "learning_rate": 9.959435751329065e-06, "loss": 1.0214, "step": 2991 }, { "epoch": 0.07, "learning_rate": 9.95938799507488e-06, "loss": 1.0712, "step": 2992 }, { "epoch": 0.07, "learning_rate": 9.959340210840166e-06, "loss": 1.205, "step": 2993 }, { "epoch": 0.07, "learning_rate": 9.959292398625192e-06, "loss": 1.3157, "step": 2994 }, { "epoch": 0.07, "learning_rate": 9.959244558430228e-06, "loss": 1.1355, "step": 2995 }, { "epoch": 0.07, "learning_rate": 9.959196690255543e-06, "loss": 1.2313, "step": 2996 }, { "epoch": 0.07, "learning_rate": 9.959148794101408e-06, "loss": 0.917, "step": 2997 }, { "epoch": 0.07, "learning_rate": 9.959100869968093e-06, "loss": 0.8391, "step": 2998 }, { "epoch": 0.07, "learning_rate": 9.959052917855867e-06, "loss": 1.06, "step": 2999 }, { "epoch": 0.07, "learning_rate": 9.959004937765002e-06, "loss": 0.9317, "step": 3000 }, { "epoch": 0.07, "learning_rate": 9.958956929695769e-06, "loss": 1.1585, "step": 3001 }, { "epoch": 0.07, "learning_rate": 9.958908893648437e-06, "loss": 0.8373, "step": 3002 }, { "epoch": 0.07, "learning_rate": 9.95886082962328e-06, "loss": 0.9265, "step": 3003 }, { "epoch": 0.07, "learning_rate": 9.958812737620566e-06, "loss": 1.2138, "step": 3004 }, { "epoch": 0.07, "learning_rate": 9.95876461764057e-06, "loss": 1.0519, "step": 3005 }, { "epoch": 0.07, "learning_rate": 9.958716469683561e-06, "loss": 1.2323, "step": 3006 }, { "epoch": 0.07, "learning_rate": 9.958668293749809e-06, "loss": 1.0977, "step": 3007 }, { "epoch": 0.07, "learning_rate": 9.95862008983959e-06, "loss": 0.76, "step": 3008 }, { "epoch": 0.07, "learning_rate": 9.958571857953173e-06, "loss": 1.3398, "step": 3009 }, { "epoch": 0.07, "learning_rate": 9.95852359809083e-06, "loss": 1.412, "step": 3010 }, { "epoch": 0.07, "learning_rate": 9.958475310252835e-06, "loss": 0.8011, "step": 3011 }, { "epoch": 0.07, "learning_rate": 9.958426994439459e-06, "loss": 1.1456, "step": 3012 }, { "epoch": 0.07, "learning_rate": 9.958378650650975e-06, "loss": 0.7487, "step": 3013 }, { "epoch": 0.07, "learning_rate": 9.958330278887656e-06, "loss": 1.0336, "step": 3014 }, { "epoch": 0.07, "learning_rate": 9.958281879149776e-06, "loss": 1.2714, "step": 3015 }, { "epoch": 0.07, "learning_rate": 9.958233451437606e-06, "loss": 1.1417, "step": 3016 }, { "epoch": 0.07, "learning_rate": 9.95818499575142e-06, "loss": 0.9339, "step": 3017 }, { "epoch": 0.07, "learning_rate": 9.958136512091492e-06, "loss": 1.1374, "step": 3018 }, { "epoch": 0.07, "learning_rate": 9.958088000458095e-06, "loss": 1.1836, "step": 3019 }, { "epoch": 0.07, "learning_rate": 9.958039460851503e-06, "loss": 1.073, "step": 3020 }, { "epoch": 0.07, "learning_rate": 9.957990893271987e-06, "loss": 1.0966, "step": 3021 }, { "epoch": 0.07, "learning_rate": 9.957942297719828e-06, "loss": 1.2596, "step": 3022 }, { "epoch": 0.07, "learning_rate": 9.957893674195292e-06, "loss": 1.2954, "step": 3023 }, { "epoch": 0.07, "learning_rate": 9.95784502269866e-06, "loss": 1.2294, "step": 3024 }, { "epoch": 0.07, "learning_rate": 9.957796343230202e-06, "loss": 1.0741, "step": 3025 }, { "epoch": 0.07, "learning_rate": 9.957747635790194e-06, "loss": 1.0519, "step": 3026 }, { "epoch": 0.07, "learning_rate": 9.957698900378912e-06, "loss": 1.0312, "step": 3027 }, { "epoch": 0.07, "learning_rate": 9.957650136996628e-06, "loss": 1.1859, "step": 3028 }, { "epoch": 0.07, "learning_rate": 9.95760134564362e-06, "loss": 1.0138, "step": 3029 }, { "epoch": 0.07, "learning_rate": 9.957552526320164e-06, "loss": 1.0734, "step": 3030 }, { "epoch": 0.07, "learning_rate": 9.957503679026534e-06, "loss": 0.9175, "step": 3031 }, { "epoch": 0.07, "learning_rate": 9.957454803763004e-06, "loss": 1.2111, "step": 3032 }, { "epoch": 0.07, "learning_rate": 9.957405900529853e-06, "loss": 1.2051, "step": 3033 }, { "epoch": 0.07, "learning_rate": 9.957356969327353e-06, "loss": 1.0755, "step": 3034 }, { "epoch": 0.07, "learning_rate": 9.957308010155783e-06, "loss": 1.0619, "step": 3035 }, { "epoch": 0.07, "learning_rate": 9.957259023015418e-06, "loss": 1.2832, "step": 3036 }, { "epoch": 0.07, "learning_rate": 9.957210007906537e-06, "loss": 0.9624, "step": 3037 }, { "epoch": 0.07, "learning_rate": 9.957160964829412e-06, "loss": 0.9581, "step": 3038 }, { "epoch": 0.07, "learning_rate": 9.957111893784321e-06, "loss": 1.1117, "step": 3039 }, { "epoch": 0.07, "learning_rate": 9.957062794771544e-06, "loss": 1.2023, "step": 3040 }, { "epoch": 0.07, "learning_rate": 9.957013667791355e-06, "loss": 1.1022, "step": 3041 }, { "epoch": 0.07, "learning_rate": 9.956964512844034e-06, "loss": 1.2515, "step": 3042 }, { "epoch": 0.07, "learning_rate": 9.956915329929854e-06, "loss": 1.0144, "step": 3043 }, { "epoch": 0.07, "learning_rate": 9.956866119049095e-06, "loss": 1.039, "step": 3044 }, { "epoch": 0.07, "learning_rate": 9.956816880202036e-06, "loss": 1.001, "step": 3045 }, { "epoch": 0.07, "learning_rate": 9.956767613388952e-06, "loss": 1.2469, "step": 3046 }, { "epoch": 0.07, "learning_rate": 9.956718318610123e-06, "loss": 0.8078, "step": 3047 }, { "epoch": 0.07, "learning_rate": 9.956668995865826e-06, "loss": 1.146, "step": 3048 }, { "epoch": 0.07, "learning_rate": 9.95661964515634e-06, "loss": 1.017, "step": 3049 }, { "epoch": 0.07, "learning_rate": 9.956570266481942e-06, "loss": 1.0664, "step": 3050 }, { "epoch": 0.07, "learning_rate": 9.956520859842915e-06, "loss": 1.2891, "step": 3051 }, { "epoch": 0.07, "learning_rate": 9.956471425239531e-06, "loss": 0.9773, "step": 3052 }, { "epoch": 0.07, "learning_rate": 9.956421962672073e-06, "loss": 1.0643, "step": 3053 }, { "epoch": 0.07, "learning_rate": 9.95637247214082e-06, "loss": 1.0416, "step": 3054 }, { "epoch": 0.07, "learning_rate": 9.956322953646052e-06, "loss": 1.1851, "step": 3055 }, { "epoch": 0.07, "learning_rate": 9.956273407188044e-06, "loss": 0.9893, "step": 3056 }, { "epoch": 0.07, "learning_rate": 9.95622383276708e-06, "loss": 0.8108, "step": 3057 }, { "epoch": 0.07, "learning_rate": 9.95617423038344e-06, "loss": 1.1059, "step": 3058 }, { "epoch": 0.07, "learning_rate": 9.9561246000374e-06, "loss": 0.7584, "step": 3059 }, { "epoch": 0.07, "learning_rate": 9.956074941729242e-06, "loss": 0.7989, "step": 3060 }, { "epoch": 0.07, "learning_rate": 9.956025255459248e-06, "loss": 1.0377, "step": 3061 }, { "epoch": 0.07, "learning_rate": 9.955975541227694e-06, "loss": 1.1566, "step": 3062 }, { "epoch": 0.07, "learning_rate": 9.955925799034865e-06, "loss": 0.9823, "step": 3063 }, { "epoch": 0.07, "learning_rate": 9.95587602888104e-06, "loss": 1.0208, "step": 3064 }, { "epoch": 0.07, "learning_rate": 9.955826230766498e-06, "loss": 1.1326, "step": 3065 }, { "epoch": 0.07, "learning_rate": 9.955776404691524e-06, "loss": 1.0083, "step": 3066 }, { "epoch": 0.07, "learning_rate": 9.955726550656395e-06, "loss": 1.4223, "step": 3067 }, { "epoch": 0.07, "learning_rate": 9.955676668661395e-06, "loss": 1.0555, "step": 3068 }, { "epoch": 0.07, "learning_rate": 9.955626758706802e-06, "loss": 1.2306, "step": 3069 }, { "epoch": 0.07, "learning_rate": 9.955576820792901e-06, "loss": 1.2554, "step": 3070 }, { "epoch": 0.07, "learning_rate": 9.955526854919972e-06, "loss": 1.1856, "step": 3071 }, { "epoch": 0.07, "learning_rate": 9.9554768610883e-06, "loss": 0.9552, "step": 3072 }, { "epoch": 0.07, "learning_rate": 9.955426839298162e-06, "loss": 1.277, "step": 3073 }, { "epoch": 0.07, "learning_rate": 9.955376789549845e-06, "loss": 1.4045, "step": 3074 }, { "epoch": 0.07, "learning_rate": 9.955326711843626e-06, "loss": 1.2215, "step": 3075 }, { "epoch": 0.07, "learning_rate": 9.955276606179795e-06, "loss": 0.8933, "step": 3076 }, { "epoch": 0.07, "learning_rate": 9.955226472558628e-06, "loss": 1.0532, "step": 3077 }, { "epoch": 0.07, "learning_rate": 9.95517631098041e-06, "loss": 0.9837, "step": 3078 }, { "epoch": 0.07, "learning_rate": 9.955126121445426e-06, "loss": 1.2378, "step": 3079 }, { "epoch": 0.07, "learning_rate": 9.955075903953955e-06, "loss": 0.9021, "step": 3080 }, { "epoch": 0.07, "learning_rate": 9.955025658506285e-06, "loss": 1.1464, "step": 3081 }, { "epoch": 0.07, "learning_rate": 9.954975385102696e-06, "loss": 0.8869, "step": 3082 }, { "epoch": 0.07, "learning_rate": 9.954925083743474e-06, "loss": 1.0763, "step": 3083 }, { "epoch": 0.07, "learning_rate": 9.954874754428901e-06, "loss": 0.924, "step": 3084 }, { "epoch": 0.07, "learning_rate": 9.954824397159262e-06, "loss": 1.2556, "step": 3085 }, { "epoch": 0.07, "learning_rate": 9.95477401193484e-06, "loss": 0.9966, "step": 3086 }, { "epoch": 0.07, "learning_rate": 9.95472359875592e-06, "loss": 1.192, "step": 3087 }, { "epoch": 0.07, "learning_rate": 9.954673157622787e-06, "loss": 0.8498, "step": 3088 }, { "epoch": 0.07, "learning_rate": 9.954622688535725e-06, "loss": 1.3019, "step": 3089 }, { "epoch": 0.07, "learning_rate": 9.95457219149502e-06, "loss": 0.9489, "step": 3090 }, { "epoch": 0.07, "learning_rate": 9.954521666500953e-06, "loss": 1.0436, "step": 3091 }, { "epoch": 0.07, "learning_rate": 9.954471113553815e-06, "loss": 1.0207, "step": 3092 }, { "epoch": 0.07, "learning_rate": 9.954420532653886e-06, "loss": 0.881, "step": 3093 }, { "epoch": 0.07, "learning_rate": 9.954369923801453e-06, "loss": 1.157, "step": 3094 }, { "epoch": 0.07, "learning_rate": 9.954319286996803e-06, "loss": 0.8697, "step": 3095 }, { "epoch": 0.07, "learning_rate": 9.95426862224022e-06, "loss": 0.8003, "step": 3096 }, { "epoch": 0.07, "learning_rate": 9.954217929531991e-06, "loss": 1.1647, "step": 3097 }, { "epoch": 0.07, "learning_rate": 9.9541672088724e-06, "loss": 1.1124, "step": 3098 }, { "epoch": 0.07, "learning_rate": 9.954116460261738e-06, "loss": 0.8071, "step": 3099 }, { "epoch": 0.07, "learning_rate": 9.954065683700285e-06, "loss": 0.9379, "step": 3100 }, { "epoch": 0.07, "learning_rate": 9.95401487918833e-06, "loss": 0.7262, "step": 3101 }, { "epoch": 0.07, "learning_rate": 9.95396404672616e-06, "loss": 1.0818, "step": 3102 }, { "epoch": 0.07, "learning_rate": 9.953913186314064e-06, "loss": 1.2074, "step": 3103 }, { "epoch": 0.07, "learning_rate": 9.953862297952326e-06, "loss": 1.0232, "step": 3104 }, { "epoch": 0.07, "learning_rate": 9.953811381641233e-06, "loss": 1.0447, "step": 3105 }, { "epoch": 0.07, "learning_rate": 9.953760437381073e-06, "loss": 1.1838, "step": 3106 }, { "epoch": 0.07, "learning_rate": 9.953709465172135e-06, "loss": 1.1926, "step": 3107 }, { "epoch": 0.07, "learning_rate": 9.953658465014704e-06, "loss": 1.0492, "step": 3108 }, { "epoch": 0.07, "learning_rate": 9.953607436909069e-06, "loss": 0.9957, "step": 3109 }, { "epoch": 0.07, "learning_rate": 9.953556380855517e-06, "loss": 1.2602, "step": 3110 }, { "epoch": 0.07, "learning_rate": 9.953505296854339e-06, "loss": 1.1434, "step": 3111 }, { "epoch": 0.07, "learning_rate": 9.95345418490582e-06, "loss": 1.1497, "step": 3112 }, { "epoch": 0.07, "learning_rate": 9.953403045010248e-06, "loss": 1.3589, "step": 3113 }, { "epoch": 0.07, "learning_rate": 9.953351877167916e-06, "loss": 0.9445, "step": 3114 }, { "epoch": 0.07, "learning_rate": 9.953300681379109e-06, "loss": 0.9655, "step": 3115 }, { "epoch": 0.07, "learning_rate": 9.953249457644114e-06, "loss": 1.1059, "step": 3116 }, { "epoch": 0.07, "learning_rate": 9.953198205963223e-06, "loss": 1.5318, "step": 3117 }, { "epoch": 0.07, "learning_rate": 9.953146926336726e-06, "loss": 0.7649, "step": 3118 }, { "epoch": 0.07, "learning_rate": 9.95309561876491e-06, "loss": 1.1105, "step": 3119 }, { "epoch": 0.07, "learning_rate": 9.953044283248066e-06, "loss": 1.1535, "step": 3120 }, { "epoch": 0.07, "learning_rate": 9.952992919786483e-06, "loss": 1.101, "step": 3121 }, { "epoch": 0.07, "learning_rate": 9.952941528380452e-06, "loss": 1.1778, "step": 3122 }, { "epoch": 0.07, "learning_rate": 9.952890109030259e-06, "loss": 1.0785, "step": 3123 }, { "epoch": 0.07, "learning_rate": 9.952838661736199e-06, "loss": 1.2054, "step": 3124 }, { "epoch": 0.07, "learning_rate": 9.952787186498559e-06, "loss": 0.8719, "step": 3125 }, { "epoch": 0.07, "learning_rate": 9.952735683317631e-06, "loss": 1.0718, "step": 3126 }, { "epoch": 0.07, "learning_rate": 9.952684152193706e-06, "loss": 0.7751, "step": 3127 }, { "epoch": 0.07, "learning_rate": 9.952632593127074e-06, "loss": 0.8657, "step": 3128 }, { "epoch": 0.07, "learning_rate": 9.952581006118026e-06, "loss": 0.9702, "step": 3129 }, { "epoch": 0.07, "learning_rate": 9.95252939116685e-06, "loss": 1.205, "step": 3130 }, { "epoch": 0.07, "learning_rate": 9.952477748273843e-06, "loss": 1.1393, "step": 3131 }, { "epoch": 0.07, "learning_rate": 9.952426077439292e-06, "loss": 1.1946, "step": 3132 }, { "epoch": 0.07, "learning_rate": 9.95237437866349e-06, "loss": 0.9893, "step": 3133 }, { "epoch": 0.07, "learning_rate": 9.95232265194673e-06, "loss": 1.0995, "step": 3134 }, { "epoch": 0.07, "learning_rate": 9.9522708972893e-06, "loss": 0.9589, "step": 3135 }, { "epoch": 0.07, "learning_rate": 9.952219114691496e-06, "loss": 1.0171, "step": 3136 }, { "epoch": 0.07, "learning_rate": 9.952167304153608e-06, "loss": 1.2001, "step": 3137 }, { "epoch": 0.07, "learning_rate": 9.95211546567593e-06, "loss": 0.9851, "step": 3138 }, { "epoch": 0.07, "learning_rate": 9.952063599258752e-06, "loss": 1.0908, "step": 3139 }, { "epoch": 0.07, "learning_rate": 9.95201170490237e-06, "loss": 1.1795, "step": 3140 }, { "epoch": 0.07, "learning_rate": 9.951959782607073e-06, "loss": 1.0865, "step": 3141 }, { "epoch": 0.07, "learning_rate": 9.951907832373156e-06, "loss": 0.9644, "step": 3142 }, { "epoch": 0.07, "learning_rate": 9.951855854200912e-06, "loss": 1.0973, "step": 3143 }, { "epoch": 0.07, "learning_rate": 9.951803848090634e-06, "loss": 1.0903, "step": 3144 }, { "epoch": 0.07, "learning_rate": 9.951751814042616e-06, "loss": 0.8675, "step": 3145 }, { "epoch": 0.07, "learning_rate": 9.951699752057151e-06, "loss": 1.2123, "step": 3146 }, { "epoch": 0.07, "learning_rate": 9.951647662134533e-06, "loss": 1.2381, "step": 3147 }, { "epoch": 0.07, "learning_rate": 9.951595544275055e-06, "loss": 1.3765, "step": 3148 }, { "epoch": 0.07, "learning_rate": 9.95154339847901e-06, "loss": 0.9989, "step": 3149 }, { "epoch": 0.07, "learning_rate": 9.951491224746698e-06, "loss": 1.0455, "step": 3150 }, { "epoch": 0.07, "learning_rate": 9.951439023078406e-06, "loss": 1.2841, "step": 3151 }, { "epoch": 0.07, "learning_rate": 9.951386793474435e-06, "loss": 1.2184, "step": 3152 }, { "epoch": 0.07, "learning_rate": 9.951334535935073e-06, "loss": 1.1417, "step": 3153 }, { "epoch": 0.07, "learning_rate": 9.95128225046062e-06, "loss": 1.0556, "step": 3154 }, { "epoch": 0.07, "learning_rate": 9.95122993705137e-06, "loss": 1.2473, "step": 3155 }, { "epoch": 0.07, "learning_rate": 9.951177595707617e-06, "loss": 0.9828, "step": 3156 }, { "epoch": 0.07, "learning_rate": 9.951125226429656e-06, "loss": 1.2116, "step": 3157 }, { "epoch": 0.07, "learning_rate": 9.951072829217785e-06, "loss": 1.0636, "step": 3158 }, { "epoch": 0.07, "learning_rate": 9.951020404072295e-06, "loss": 1.0798, "step": 3159 }, { "epoch": 0.07, "learning_rate": 9.950967950993487e-06, "loss": 1.34, "step": 3160 }, { "epoch": 0.07, "learning_rate": 9.950915469981654e-06, "loss": 1.1834, "step": 3161 }, { "epoch": 0.07, "learning_rate": 9.950862961037093e-06, "loss": 1.0267, "step": 3162 }, { "epoch": 0.07, "learning_rate": 9.9508104241601e-06, "loss": 1.3351, "step": 3163 }, { "epoch": 0.07, "learning_rate": 9.95075785935097e-06, "loss": 1.289, "step": 3164 }, { "epoch": 0.07, "learning_rate": 9.950705266610003e-06, "loss": 1.1461, "step": 3165 }, { "epoch": 0.07, "learning_rate": 9.950652645937491e-06, "loss": 1.0904, "step": 3166 }, { "epoch": 0.07, "learning_rate": 9.950599997333736e-06, "loss": 1.0008, "step": 3167 }, { "epoch": 0.07, "learning_rate": 9.95054732079903e-06, "loss": 1.1375, "step": 3168 }, { "epoch": 0.07, "learning_rate": 9.950494616333676e-06, "loss": 1.0952, "step": 3169 }, { "epoch": 0.07, "learning_rate": 9.950441883937967e-06, "loss": 0.9052, "step": 3170 }, { "epoch": 0.07, "learning_rate": 9.9503891236122e-06, "loss": 0.8373, "step": 3171 }, { "epoch": 0.07, "learning_rate": 9.950336335356677e-06, "loss": 1.1671, "step": 3172 }, { "epoch": 0.07, "learning_rate": 9.950283519171691e-06, "loss": 1.0714, "step": 3173 }, { "epoch": 0.07, "learning_rate": 9.950230675057541e-06, "loss": 0.9729, "step": 3174 }, { "epoch": 0.07, "learning_rate": 9.95017780301453e-06, "loss": 1.2524, "step": 3175 }, { "epoch": 0.07, "learning_rate": 9.950124903042949e-06, "loss": 0.9349, "step": 3176 }, { "epoch": 0.07, "learning_rate": 9.950071975143101e-06, "loss": 0.9605, "step": 3177 }, { "epoch": 0.07, "learning_rate": 9.950019019315285e-06, "loss": 1.0444, "step": 3178 }, { "epoch": 0.07, "learning_rate": 9.949966035559797e-06, "loss": 0.7965, "step": 3179 }, { "epoch": 0.07, "learning_rate": 9.949913023876937e-06, "loss": 1.4376, "step": 3180 }, { "epoch": 0.07, "learning_rate": 9.949859984267005e-06, "loss": 0.8779, "step": 3181 }, { "epoch": 0.07, "learning_rate": 9.9498069167303e-06, "loss": 1.0272, "step": 3182 }, { "epoch": 0.07, "learning_rate": 9.94975382126712e-06, "loss": 1.2024, "step": 3183 }, { "epoch": 0.07, "learning_rate": 9.949700697877766e-06, "loss": 1.2349, "step": 3184 }, { "epoch": 0.07, "learning_rate": 9.949647546562538e-06, "loss": 1.0581, "step": 3185 }, { "epoch": 0.07, "learning_rate": 9.949594367321735e-06, "loss": 1.0421, "step": 3186 }, { "epoch": 0.07, "learning_rate": 9.949541160155657e-06, "loss": 1.0186, "step": 3187 }, { "epoch": 0.07, "learning_rate": 9.949487925064605e-06, "loss": 0.9158, "step": 3188 }, { "epoch": 0.07, "learning_rate": 9.94943466204888e-06, "loss": 1.2234, "step": 3189 }, { "epoch": 0.07, "learning_rate": 9.94938137110878e-06, "loss": 1.0229, "step": 3190 }, { "epoch": 0.07, "learning_rate": 9.949328052244606e-06, "loss": 1.0371, "step": 3191 }, { "epoch": 0.07, "learning_rate": 9.949274705456659e-06, "loss": 0.9318, "step": 3192 }, { "epoch": 0.07, "learning_rate": 9.949221330745243e-06, "loss": 0.9845, "step": 3193 }, { "epoch": 0.07, "learning_rate": 9.949167928110657e-06, "loss": 1.0665, "step": 3194 }, { "epoch": 0.07, "learning_rate": 9.9491144975532e-06, "loss": 1.1518, "step": 3195 }, { "epoch": 0.07, "learning_rate": 9.949061039073179e-06, "loss": 1.2711, "step": 3196 }, { "epoch": 0.07, "learning_rate": 9.949007552670888e-06, "loss": 1.0527, "step": 3197 }, { "epoch": 0.07, "learning_rate": 9.948954038346637e-06, "loss": 0.8507, "step": 3198 }, { "epoch": 0.07, "learning_rate": 9.948900496100721e-06, "loss": 0.9864, "step": 3199 }, { "epoch": 0.07, "learning_rate": 9.948846925933446e-06, "loss": 0.9326, "step": 3200 }, { "epoch": 0.07, "learning_rate": 9.948793327845115e-06, "loss": 0.9482, "step": 3201 }, { "epoch": 0.07, "learning_rate": 9.948739701836027e-06, "loss": 0.9937, "step": 3202 }, { "epoch": 0.07, "learning_rate": 9.948686047906486e-06, "loss": 1.2012, "step": 3203 }, { "epoch": 0.07, "learning_rate": 9.948632366056795e-06, "loss": 1.3955, "step": 3204 }, { "epoch": 0.07, "learning_rate": 9.948578656287258e-06, "loss": 1.1647, "step": 3205 }, { "epoch": 0.07, "learning_rate": 9.948524918598175e-06, "loss": 1.0628, "step": 3206 }, { "epoch": 0.07, "learning_rate": 9.948471152989853e-06, "loss": 1.1181, "step": 3207 }, { "epoch": 0.07, "learning_rate": 9.948417359462593e-06, "loss": 1.2935, "step": 3208 }, { "epoch": 0.07, "learning_rate": 9.948363538016697e-06, "loss": 1.1618, "step": 3209 }, { "epoch": 0.07, "learning_rate": 9.948309688652471e-06, "loss": 1.1198, "step": 3210 }, { "epoch": 0.07, "learning_rate": 9.94825581137022e-06, "loss": 1.1931, "step": 3211 }, { "epoch": 0.07, "learning_rate": 9.948201906170245e-06, "loss": 1.1962, "step": 3212 }, { "epoch": 0.07, "learning_rate": 9.948147973052851e-06, "loss": 0.6956, "step": 3213 }, { "epoch": 0.07, "learning_rate": 9.948094012018343e-06, "loss": 1.0628, "step": 3214 }, { "epoch": 0.07, "learning_rate": 9.948040023067028e-06, "loss": 1.5485, "step": 3215 }, { "epoch": 0.07, "learning_rate": 9.947986006199204e-06, "loss": 0.9482, "step": 3216 }, { "epoch": 0.07, "learning_rate": 9.94793196141518e-06, "loss": 0.9616, "step": 3217 }, { "epoch": 0.07, "learning_rate": 9.947877888715263e-06, "loss": 1.2476, "step": 3218 }, { "epoch": 0.07, "learning_rate": 9.947823788099754e-06, "loss": 1.231, "step": 3219 }, { "epoch": 0.07, "learning_rate": 9.947769659568957e-06, "loss": 1.2278, "step": 3220 }, { "epoch": 0.07, "learning_rate": 9.947715503123184e-06, "loss": 0.9651, "step": 3221 }, { "epoch": 0.07, "learning_rate": 9.947661318762736e-06, "loss": 0.9423, "step": 3222 }, { "epoch": 0.07, "learning_rate": 9.947607106487917e-06, "loss": 1.1185, "step": 3223 }, { "epoch": 0.07, "learning_rate": 9.947552866299037e-06, "loss": 1.4184, "step": 3224 }, { "epoch": 0.07, "learning_rate": 9.947498598196401e-06, "loss": 1.1149, "step": 3225 }, { "epoch": 0.07, "learning_rate": 9.947444302180313e-06, "loss": 0.8779, "step": 3226 }, { "epoch": 0.07, "learning_rate": 9.947389978251082e-06, "loss": 0.9894, "step": 3227 }, { "epoch": 0.07, "learning_rate": 9.947335626409013e-06, "loss": 1.1963, "step": 3228 }, { "epoch": 0.07, "learning_rate": 9.947281246654412e-06, "loss": 0.9983, "step": 3229 }, { "epoch": 0.07, "learning_rate": 9.947226838987587e-06, "loss": 1.1016, "step": 3230 }, { "epoch": 0.07, "learning_rate": 9.947172403408845e-06, "loss": 0.972, "step": 3231 }, { "epoch": 0.07, "learning_rate": 9.947117939918494e-06, "loss": 1.1408, "step": 3232 }, { "epoch": 0.07, "learning_rate": 9.947063448516838e-06, "loss": 0.9698, "step": 3233 }, { "epoch": 0.08, "learning_rate": 9.947008929204188e-06, "loss": 1.1165, "step": 3234 }, { "epoch": 0.08, "learning_rate": 9.946954381980848e-06, "loss": 1.2046, "step": 3235 }, { "epoch": 0.08, "learning_rate": 9.946899806847131e-06, "loss": 0.9855, "step": 3236 }, { "epoch": 0.08, "learning_rate": 9.94684520380334e-06, "loss": 1.0558, "step": 3237 }, { "epoch": 0.08, "learning_rate": 9.946790572849785e-06, "loss": 1.04, "step": 3238 }, { "epoch": 0.08, "learning_rate": 9.946735913986773e-06, "loss": 1.0685, "step": 3239 }, { "epoch": 0.08, "learning_rate": 9.946681227214617e-06, "loss": 1.1299, "step": 3240 }, { "epoch": 0.08, "learning_rate": 9.946626512533619e-06, "loss": 1.0942, "step": 3241 }, { "epoch": 0.08, "learning_rate": 9.94657176994409e-06, "loss": 1.0146, "step": 3242 }, { "epoch": 0.08, "learning_rate": 9.94651699944634e-06, "loss": 1.0246, "step": 3243 }, { "epoch": 0.08, "learning_rate": 9.94646220104068e-06, "loss": 1.077, "step": 3244 }, { "epoch": 0.08, "learning_rate": 9.946407374727414e-06, "loss": 0.818, "step": 3245 }, { "epoch": 0.08, "learning_rate": 9.946352520506856e-06, "loss": 1.0033, "step": 3246 }, { "epoch": 0.08, "learning_rate": 9.946297638379312e-06, "loss": 0.9499, "step": 3247 }, { "epoch": 0.08, "learning_rate": 9.946242728345095e-06, "loss": 1.2071, "step": 3248 }, { "epoch": 0.08, "learning_rate": 9.946187790404511e-06, "loss": 1.0882, "step": 3249 }, { "epoch": 0.08, "learning_rate": 9.946132824557872e-06, "loss": 0.9964, "step": 3250 }, { "epoch": 0.08, "learning_rate": 9.94607783080549e-06, "loss": 0.9981, "step": 3251 }, { "epoch": 0.08, "learning_rate": 9.946022809147672e-06, "loss": 0.9843, "step": 3252 }, { "epoch": 0.08, "learning_rate": 9.94596775958473e-06, "loss": 1.2213, "step": 3253 }, { "epoch": 0.08, "learning_rate": 9.945912682116974e-06, "loss": 1.3306, "step": 3254 }, { "epoch": 0.08, "learning_rate": 9.945857576744715e-06, "loss": 1.0813, "step": 3255 }, { "epoch": 0.08, "learning_rate": 9.945802443468265e-06, "loss": 1.2466, "step": 3256 }, { "epoch": 0.08, "learning_rate": 9.945747282287932e-06, "loss": 0.8879, "step": 3257 }, { "epoch": 0.08, "learning_rate": 9.945692093204031e-06, "loss": 1.1943, "step": 3258 }, { "epoch": 0.08, "learning_rate": 9.945636876216871e-06, "loss": 0.9744, "step": 3259 }, { "epoch": 0.08, "learning_rate": 9.945581631326764e-06, "loss": 1.1881, "step": 3260 }, { "epoch": 0.08, "learning_rate": 9.945526358534021e-06, "loss": 1.1397, "step": 3261 }, { "epoch": 0.08, "learning_rate": 9.945471057838956e-06, "loss": 1.2685, "step": 3262 }, { "epoch": 0.08, "learning_rate": 9.94541572924188e-06, "loss": 0.9816, "step": 3263 }, { "epoch": 0.08, "learning_rate": 9.945360372743105e-06, "loss": 1.0709, "step": 3264 }, { "epoch": 0.08, "learning_rate": 9.945304988342941e-06, "loss": 1.1994, "step": 3265 }, { "epoch": 0.08, "learning_rate": 9.945249576041705e-06, "loss": 1.2824, "step": 3266 }, { "epoch": 0.08, "learning_rate": 9.945194135839707e-06, "loss": 1.277, "step": 3267 }, { "epoch": 0.08, "learning_rate": 9.945138667737258e-06, "loss": 1.0344, "step": 3268 }, { "epoch": 0.08, "learning_rate": 9.945083171734676e-06, "loss": 0.8338, "step": 3269 }, { "epoch": 0.08, "learning_rate": 9.945027647832268e-06, "loss": 0.9934, "step": 3270 }, { "epoch": 0.08, "learning_rate": 9.944972096030352e-06, "loss": 1.2775, "step": 3271 }, { "epoch": 0.08, "learning_rate": 9.944916516329239e-06, "loss": 1.196, "step": 3272 }, { "epoch": 0.08, "learning_rate": 9.944860908729244e-06, "loss": 1.0279, "step": 3273 }, { "epoch": 0.08, "learning_rate": 9.94480527323068e-06, "loss": 1.1512, "step": 3274 }, { "epoch": 0.08, "learning_rate": 9.944749609833861e-06, "loss": 0.894, "step": 3275 }, { "epoch": 0.08, "learning_rate": 9.944693918539102e-06, "loss": 1.1582, "step": 3276 }, { "epoch": 0.08, "learning_rate": 9.944638199346716e-06, "loss": 0.9672, "step": 3277 }, { "epoch": 0.08, "learning_rate": 9.944582452257017e-06, "loss": 0.9857, "step": 3278 }, { "epoch": 0.08, "learning_rate": 9.94452667727032e-06, "loss": 0.8898, "step": 3279 }, { "epoch": 0.08, "learning_rate": 9.94447087438694e-06, "loss": 1.282, "step": 3280 }, { "epoch": 0.08, "learning_rate": 9.944415043607191e-06, "loss": 1.0268, "step": 3281 }, { "epoch": 0.08, "learning_rate": 9.94435918493139e-06, "loss": 1.0617, "step": 3282 }, { "epoch": 0.08, "learning_rate": 9.94430329835985e-06, "loss": 1.1912, "step": 3283 }, { "epoch": 0.08, "learning_rate": 9.944247383892886e-06, "loss": 1.3318, "step": 3284 }, { "epoch": 0.08, "learning_rate": 9.944191441530817e-06, "loss": 0.9496, "step": 3285 }, { "epoch": 0.08, "learning_rate": 9.944135471273954e-06, "loss": 0.9758, "step": 3286 }, { "epoch": 0.08, "learning_rate": 9.944079473122617e-06, "loss": 1.0238, "step": 3287 }, { "epoch": 0.08, "learning_rate": 9.944023447077118e-06, "loss": 1.1904, "step": 3288 }, { "epoch": 0.08, "learning_rate": 9.943967393137777e-06, "loss": 0.8425, "step": 3289 }, { "epoch": 0.08, "learning_rate": 9.943911311304906e-06, "loss": 1.0801, "step": 3290 }, { "epoch": 0.08, "learning_rate": 9.943855201578825e-06, "loss": 1.1111, "step": 3291 }, { "epoch": 0.08, "learning_rate": 9.94379906395985e-06, "loss": 1.1637, "step": 3292 }, { "epoch": 0.08, "learning_rate": 9.943742898448294e-06, "loss": 1.019, "step": 3293 }, { "epoch": 0.08, "learning_rate": 9.94368670504448e-06, "loss": 1.0503, "step": 3294 }, { "epoch": 0.08, "learning_rate": 9.94363048374872e-06, "loss": 0.8883, "step": 3295 }, { "epoch": 0.08, "learning_rate": 9.943574234561334e-06, "loss": 1.0353, "step": 3296 }, { "epoch": 0.08, "learning_rate": 9.943517957482637e-06, "loss": 1.131, "step": 3297 }, { "epoch": 0.08, "learning_rate": 9.94346165251295e-06, "loss": 0.8124, "step": 3298 }, { "epoch": 0.08, "learning_rate": 9.943405319652588e-06, "loss": 1.3286, "step": 3299 }, { "epoch": 0.08, "learning_rate": 9.943348958901869e-06, "loss": 0.9836, "step": 3300 }, { "epoch": 0.08, "learning_rate": 9.943292570261112e-06, "loss": 1.0706, "step": 3301 }, { "epoch": 0.08, "learning_rate": 9.943236153730634e-06, "loss": 1.0199, "step": 3302 }, { "epoch": 0.08, "learning_rate": 9.943179709310753e-06, "loss": 1.1586, "step": 3303 }, { "epoch": 0.08, "learning_rate": 9.94312323700179e-06, "loss": 0.9595, "step": 3304 }, { "epoch": 0.08, "learning_rate": 9.94306673680406e-06, "loss": 1.0343, "step": 3305 }, { "epoch": 0.08, "learning_rate": 9.943010208717885e-06, "loss": 1.0462, "step": 3306 }, { "epoch": 0.08, "learning_rate": 9.942953652743583e-06, "loss": 1.1161, "step": 3307 }, { "epoch": 0.08, "learning_rate": 9.942897068881473e-06, "loss": 1.2417, "step": 3308 }, { "epoch": 0.08, "learning_rate": 9.942840457131872e-06, "loss": 0.9299, "step": 3309 }, { "epoch": 0.08, "learning_rate": 9.942783817495103e-06, "loss": 1.1634, "step": 3310 }, { "epoch": 0.08, "learning_rate": 9.942727149971486e-06, "loss": 1.3151, "step": 3311 }, { "epoch": 0.08, "learning_rate": 9.942670454561334e-06, "loss": 1.2501, "step": 3312 }, { "epoch": 0.08, "learning_rate": 9.942613731264974e-06, "loss": 0.8475, "step": 3313 }, { "epoch": 0.08, "learning_rate": 9.942556980082723e-06, "loss": 1.2386, "step": 3314 }, { "epoch": 0.08, "learning_rate": 9.942500201014901e-06, "loss": 1.034, "step": 3315 }, { "epoch": 0.08, "learning_rate": 9.942443394061832e-06, "loss": 1.0044, "step": 3316 }, { "epoch": 0.08, "learning_rate": 9.942386559223832e-06, "loss": 1.0181, "step": 3317 }, { "epoch": 0.08, "learning_rate": 9.94232969650122e-06, "loss": 1.0074, "step": 3318 }, { "epoch": 0.08, "learning_rate": 9.942272805894324e-06, "loss": 0.8662, "step": 3319 }, { "epoch": 0.08, "learning_rate": 9.94221588740346e-06, "loss": 1.1284, "step": 3320 }, { "epoch": 0.08, "learning_rate": 9.94215894102895e-06, "loss": 1.0816, "step": 3321 }, { "epoch": 0.08, "learning_rate": 9.942101966771116e-06, "loss": 1.3612, "step": 3322 }, { "epoch": 0.08, "learning_rate": 9.942044964630278e-06, "loss": 0.9531, "step": 3323 }, { "epoch": 0.08, "learning_rate": 9.941987934606759e-06, "loss": 0.7981, "step": 3324 }, { "epoch": 0.08, "learning_rate": 9.941930876700879e-06, "loss": 1.1169, "step": 3325 }, { "epoch": 0.08, "learning_rate": 9.941873790912962e-06, "loss": 0.8858, "step": 3326 }, { "epoch": 0.08, "learning_rate": 9.941816677243329e-06, "loss": 0.9091, "step": 3327 }, { "epoch": 0.08, "learning_rate": 9.941759535692303e-06, "loss": 0.8718, "step": 3328 }, { "epoch": 0.08, "learning_rate": 9.941702366260205e-06, "loss": 1.2085, "step": 3329 }, { "epoch": 0.08, "learning_rate": 9.941645168947358e-06, "loss": 1.189, "step": 3330 }, { "epoch": 0.08, "learning_rate": 9.941587943754087e-06, "loss": 1.2745, "step": 3331 }, { "epoch": 0.08, "learning_rate": 9.941530690680713e-06, "loss": 1.0267, "step": 3332 }, { "epoch": 0.08, "learning_rate": 9.941473409727556e-06, "loss": 1.0011, "step": 3333 }, { "epoch": 0.08, "learning_rate": 9.941416100894944e-06, "loss": 1.0849, "step": 3334 }, { "epoch": 0.08, "learning_rate": 9.941358764183199e-06, "loss": 0.8816, "step": 3335 }, { "epoch": 0.08, "learning_rate": 9.941301399592643e-06, "loss": 1.5141, "step": 3336 }, { "epoch": 0.08, "learning_rate": 9.941244007123602e-06, "loss": 0.9522, "step": 3337 }, { "epoch": 0.08, "learning_rate": 9.941186586776396e-06, "loss": 1.2908, "step": 3338 }, { "epoch": 0.08, "learning_rate": 9.941129138551352e-06, "loss": 1.092, "step": 3339 }, { "epoch": 0.08, "learning_rate": 9.941071662448796e-06, "loss": 1.2196, "step": 3340 }, { "epoch": 0.08, "learning_rate": 9.94101415846905e-06, "loss": 1.2939, "step": 3341 }, { "epoch": 0.08, "learning_rate": 9.940956626612435e-06, "loss": 0.9382, "step": 3342 }, { "epoch": 0.08, "learning_rate": 9.94089906687928e-06, "loss": 1.3412, "step": 3343 }, { "epoch": 0.08, "learning_rate": 9.940841479269909e-06, "loss": 0.9283, "step": 3344 }, { "epoch": 0.08, "learning_rate": 9.940783863784645e-06, "loss": 1.2799, "step": 3345 }, { "epoch": 0.08, "learning_rate": 9.940726220423817e-06, "loss": 1.1846, "step": 3346 }, { "epoch": 0.08, "learning_rate": 9.940668549187747e-06, "loss": 1.2462, "step": 3347 }, { "epoch": 0.08, "learning_rate": 9.94061085007676e-06, "loss": 1.2301, "step": 3348 }, { "epoch": 0.08, "learning_rate": 9.940553123091183e-06, "loss": 1.1129, "step": 3349 }, { "epoch": 0.08, "learning_rate": 9.940495368231342e-06, "loss": 1.2597, "step": 3350 }, { "epoch": 0.08, "learning_rate": 9.94043758549756e-06, "loss": 1.1161, "step": 3351 }, { "epoch": 0.08, "learning_rate": 9.940379774890168e-06, "loss": 1.2252, "step": 3352 }, { "epoch": 0.08, "learning_rate": 9.940321936409487e-06, "loss": 0.9796, "step": 3353 }, { "epoch": 0.08, "learning_rate": 9.940264070055847e-06, "loss": 0.8998, "step": 3354 }, { "epoch": 0.08, "learning_rate": 9.940206175829574e-06, "loss": 1.049, "step": 3355 }, { "epoch": 0.08, "learning_rate": 9.940148253730992e-06, "loss": 1.0839, "step": 3356 }, { "epoch": 0.08, "learning_rate": 9.94009030376043e-06, "loss": 1.0379, "step": 3357 }, { "epoch": 0.08, "learning_rate": 9.940032325918216e-06, "loss": 1.4355, "step": 3358 }, { "epoch": 0.08, "learning_rate": 9.939974320204675e-06, "loss": 1.128, "step": 3359 }, { "epoch": 0.08, "learning_rate": 9.939916286620133e-06, "loss": 1.2653, "step": 3360 }, { "epoch": 0.08, "learning_rate": 9.939858225164921e-06, "loss": 1.1569, "step": 3361 }, { "epoch": 0.08, "learning_rate": 9.939800135839366e-06, "loss": 1.1754, "step": 3362 }, { "epoch": 0.08, "learning_rate": 9.939742018643792e-06, "loss": 1.1356, "step": 3363 }, { "epoch": 0.08, "learning_rate": 9.939683873578532e-06, "loss": 0.897, "step": 3364 }, { "epoch": 0.08, "learning_rate": 9.93962570064391e-06, "loss": 1.3063, "step": 3365 }, { "epoch": 0.08, "learning_rate": 9.939567499840256e-06, "loss": 0.6565, "step": 3366 }, { "epoch": 0.08, "learning_rate": 9.9395092711679e-06, "loss": 0.8813, "step": 3367 }, { "epoch": 0.08, "learning_rate": 9.939451014627166e-06, "loss": 1.0642, "step": 3368 }, { "epoch": 0.08, "learning_rate": 9.939392730218386e-06, "loss": 0.9408, "step": 3369 }, { "epoch": 0.08, "learning_rate": 9.939334417941888e-06, "loss": 1.1094, "step": 3370 }, { "epoch": 0.08, "learning_rate": 9.939276077798004e-06, "loss": 1.0376, "step": 3371 }, { "epoch": 0.08, "learning_rate": 9.939217709787056e-06, "loss": 0.8529, "step": 3372 }, { "epoch": 0.08, "learning_rate": 9.939159313909381e-06, "loss": 1.0318, "step": 3373 }, { "epoch": 0.08, "learning_rate": 9.939100890165303e-06, "loss": 1.1166, "step": 3374 }, { "epoch": 0.08, "learning_rate": 9.939042438555155e-06, "loss": 1.0376, "step": 3375 }, { "epoch": 0.08, "learning_rate": 9.938983959079266e-06, "loss": 0.9041, "step": 3376 }, { "epoch": 0.08, "learning_rate": 9.938925451737964e-06, "loss": 1.1584, "step": 3377 }, { "epoch": 0.08, "learning_rate": 9.938866916531581e-06, "loss": 0.9668, "step": 3378 }, { "epoch": 0.08, "learning_rate": 9.938808353460448e-06, "loss": 0.8069, "step": 3379 }, { "epoch": 0.08, "learning_rate": 9.938749762524893e-06, "loss": 0.991, "step": 3380 }, { "epoch": 0.08, "learning_rate": 9.938691143725247e-06, "loss": 1.05, "step": 3381 }, { "epoch": 0.08, "learning_rate": 9.938632497061843e-06, "loss": 1.071, "step": 3382 }, { "epoch": 0.08, "learning_rate": 9.938573822535009e-06, "loss": 1.2291, "step": 3383 }, { "epoch": 0.08, "learning_rate": 9.938515120145079e-06, "loss": 0.9586, "step": 3384 }, { "epoch": 0.08, "learning_rate": 9.938456389892382e-06, "loss": 0.6428, "step": 3385 }, { "epoch": 0.08, "learning_rate": 9.93839763177725e-06, "loss": 0.9632, "step": 3386 }, { "epoch": 0.08, "learning_rate": 9.938338845800015e-06, "loss": 0.8386, "step": 3387 }, { "epoch": 0.08, "learning_rate": 9.938280031961007e-06, "loss": 1.2752, "step": 3388 }, { "epoch": 0.08, "learning_rate": 9.93822119026056e-06, "loss": 1.0703, "step": 3389 }, { "epoch": 0.08, "learning_rate": 9.938162320699003e-06, "loss": 1.2041, "step": 3390 }, { "epoch": 0.08, "learning_rate": 9.938103423276672e-06, "loss": 1.3056, "step": 3391 }, { "epoch": 0.08, "learning_rate": 9.938044497993898e-06, "loss": 1.2145, "step": 3392 }, { "epoch": 0.08, "learning_rate": 9.93798554485101e-06, "loss": 1.0469, "step": 3393 }, { "epoch": 0.08, "learning_rate": 9.937926563848345e-06, "loss": 1.2007, "step": 3394 }, { "epoch": 0.08, "learning_rate": 9.937867554986234e-06, "loss": 1.1714, "step": 3395 }, { "epoch": 0.08, "learning_rate": 9.93780851826501e-06, "loss": 1.0286, "step": 3396 }, { "epoch": 0.08, "learning_rate": 9.937749453685008e-06, "loss": 1.0205, "step": 3397 }, { "epoch": 0.08, "learning_rate": 9.937690361246558e-06, "loss": 1.132, "step": 3398 }, { "epoch": 0.08, "learning_rate": 9.937631240949993e-06, "loss": 0.9531, "step": 3399 }, { "epoch": 0.08, "learning_rate": 9.937572092795652e-06, "loss": 0.9912, "step": 3400 }, { "epoch": 0.08, "learning_rate": 9.937512916783863e-06, "loss": 1.1033, "step": 3401 }, { "epoch": 0.08, "learning_rate": 9.937453712914962e-06, "loss": 0.9258, "step": 3402 }, { "epoch": 0.08, "learning_rate": 9.937394481189284e-06, "loss": 1.0637, "step": 3403 }, { "epoch": 0.08, "learning_rate": 9.937335221607163e-06, "loss": 1.1259, "step": 3404 }, { "epoch": 0.08, "learning_rate": 9.937275934168931e-06, "loss": 1.1339, "step": 3405 }, { "epoch": 0.08, "learning_rate": 9.937216618874923e-06, "loss": 1.0987, "step": 3406 }, { "epoch": 0.08, "learning_rate": 9.937157275725475e-06, "loss": 0.9934, "step": 3407 }, { "epoch": 0.08, "learning_rate": 9.937097904720923e-06, "loss": 1.0804, "step": 3408 }, { "epoch": 0.08, "learning_rate": 9.9370385058616e-06, "loss": 1.1327, "step": 3409 }, { "epoch": 0.08, "learning_rate": 9.936979079147842e-06, "loss": 0.991, "step": 3410 }, { "epoch": 0.08, "learning_rate": 9.936919624579983e-06, "loss": 1.1686, "step": 3411 }, { "epoch": 0.08, "learning_rate": 9.936860142158358e-06, "loss": 1.28, "step": 3412 }, { "epoch": 0.08, "learning_rate": 9.936800631883305e-06, "loss": 0.8633, "step": 3413 }, { "epoch": 0.08, "learning_rate": 9.93674109375516e-06, "loss": 1.1928, "step": 3414 }, { "epoch": 0.08, "learning_rate": 9.936681527774256e-06, "loss": 0.9463, "step": 3415 }, { "epoch": 0.08, "learning_rate": 9.936621933940931e-06, "loss": 1.1008, "step": 3416 }, { "epoch": 0.08, "learning_rate": 9.936562312255521e-06, "loss": 1.2171, "step": 3417 }, { "epoch": 0.08, "learning_rate": 9.936502662718362e-06, "loss": 1.2266, "step": 3418 }, { "epoch": 0.08, "learning_rate": 9.936442985329792e-06, "loss": 1.1695, "step": 3419 }, { "epoch": 0.08, "learning_rate": 9.936383280090145e-06, "loss": 0.923, "step": 3420 }, { "epoch": 0.08, "learning_rate": 9.93632354699976e-06, "loss": 1.2333, "step": 3421 }, { "epoch": 0.08, "learning_rate": 9.936263786058973e-06, "loss": 1.0974, "step": 3422 }, { "epoch": 0.08, "learning_rate": 9.936203997268121e-06, "loss": 0.9109, "step": 3423 }, { "epoch": 0.08, "learning_rate": 9.936144180627543e-06, "loss": 0.8388, "step": 3424 }, { "epoch": 0.08, "learning_rate": 9.936084336137575e-06, "loss": 0.9183, "step": 3425 }, { "epoch": 0.08, "learning_rate": 9.936024463798554e-06, "loss": 1.0768, "step": 3426 }, { "epoch": 0.08, "learning_rate": 9.935964563610818e-06, "loss": 0.7959, "step": 3427 }, { "epoch": 0.08, "learning_rate": 9.935904635574708e-06, "loss": 0.9487, "step": 3428 }, { "epoch": 0.08, "learning_rate": 9.935844679690558e-06, "loss": 1.0302, "step": 3429 }, { "epoch": 0.08, "learning_rate": 9.935784695958709e-06, "loss": 0.9026, "step": 3430 }, { "epoch": 0.08, "learning_rate": 9.935724684379498e-06, "loss": 0.7601, "step": 3431 }, { "epoch": 0.08, "learning_rate": 9.935664644953265e-06, "loss": 0.8892, "step": 3432 }, { "epoch": 0.08, "learning_rate": 9.935604577680347e-06, "loss": 1.1024, "step": 3433 }, { "epoch": 0.08, "learning_rate": 9.935544482561084e-06, "loss": 1.1598, "step": 3434 }, { "epoch": 0.08, "learning_rate": 9.935484359595815e-06, "loss": 1.2079, "step": 3435 }, { "epoch": 0.08, "learning_rate": 9.935424208784877e-06, "loss": 0.9963, "step": 3436 }, { "epoch": 0.08, "learning_rate": 9.935364030128614e-06, "loss": 1.2471, "step": 3437 }, { "epoch": 0.08, "learning_rate": 9.93530382362736e-06, "loss": 1.0574, "step": 3438 }, { "epoch": 0.08, "learning_rate": 9.93524358928146e-06, "loss": 0.9679, "step": 3439 }, { "epoch": 0.08, "learning_rate": 9.93518332709125e-06, "loss": 1.1091, "step": 3440 }, { "epoch": 0.08, "learning_rate": 9.935123037057073e-06, "loss": 1.0634, "step": 3441 }, { "epoch": 0.08, "learning_rate": 9.935062719179265e-06, "loss": 0.7606, "step": 3442 }, { "epoch": 0.08, "learning_rate": 9.935002373458171e-06, "loss": 1.1273, "step": 3443 }, { "epoch": 0.08, "learning_rate": 9.93494199989413e-06, "loss": 1.2064, "step": 3444 }, { "epoch": 0.08, "learning_rate": 9.934881598487478e-06, "loss": 1.0409, "step": 3445 }, { "epoch": 0.08, "learning_rate": 9.934821169238563e-06, "loss": 0.9958, "step": 3446 }, { "epoch": 0.08, "learning_rate": 9.934760712147722e-06, "loss": 1.1978, "step": 3447 }, { "epoch": 0.08, "learning_rate": 9.934700227215297e-06, "loss": 1.1387, "step": 3448 }, { "epoch": 0.08, "learning_rate": 9.934639714441628e-06, "loss": 0.8343, "step": 3449 }, { "epoch": 0.08, "learning_rate": 9.934579173827059e-06, "loss": 1.0388, "step": 3450 }, { "epoch": 0.08, "learning_rate": 9.934518605371927e-06, "loss": 1.1533, "step": 3451 }, { "epoch": 0.08, "learning_rate": 9.93445800907658e-06, "loss": 1.1238, "step": 3452 }, { "epoch": 0.08, "learning_rate": 9.934397384941354e-06, "loss": 0.9852, "step": 3453 }, { "epoch": 0.08, "learning_rate": 9.934336732966594e-06, "loss": 1.198, "step": 3454 }, { "epoch": 0.08, "learning_rate": 9.934276053152642e-06, "loss": 1.1134, "step": 3455 }, { "epoch": 0.08, "learning_rate": 9.934215345499843e-06, "loss": 1.0142, "step": 3456 }, { "epoch": 0.08, "learning_rate": 9.934154610008532e-06, "loss": 1.1281, "step": 3457 }, { "epoch": 0.08, "learning_rate": 9.93409384667906e-06, "loss": 0.9623, "step": 3458 }, { "epoch": 0.08, "learning_rate": 9.934033055511765e-06, "loss": 1.1008, "step": 3459 }, { "epoch": 0.08, "learning_rate": 9.93397223650699e-06, "loss": 1.1704, "step": 3460 }, { "epoch": 0.08, "learning_rate": 9.93391138966508e-06, "loss": 1.2238, "step": 3461 }, { "epoch": 0.08, "learning_rate": 9.933850514986377e-06, "loss": 1.0134, "step": 3462 }, { "epoch": 0.08, "learning_rate": 9.933789612471224e-06, "loss": 1.1617, "step": 3463 }, { "epoch": 0.08, "learning_rate": 9.93372868211997e-06, "loss": 1.2356, "step": 3464 }, { "epoch": 0.08, "learning_rate": 9.93366772393295e-06, "loss": 1.1264, "step": 3465 }, { "epoch": 0.08, "learning_rate": 9.933606737910515e-06, "loss": 1.1715, "step": 3466 }, { "epoch": 0.08, "learning_rate": 9.933545724053005e-06, "loss": 1.0355, "step": 3467 }, { "epoch": 0.08, "learning_rate": 9.933484682360766e-06, "loss": 0.8954, "step": 3468 }, { "epoch": 0.08, "learning_rate": 9.933423612834141e-06, "loss": 0.8911, "step": 3469 }, { "epoch": 0.08, "learning_rate": 9.933362515473477e-06, "loss": 1.0375, "step": 3470 }, { "epoch": 0.08, "learning_rate": 9.933301390279116e-06, "loss": 1.1161, "step": 3471 }, { "epoch": 0.08, "learning_rate": 9.933240237251406e-06, "loss": 1.1023, "step": 3472 }, { "epoch": 0.08, "learning_rate": 9.933179056390687e-06, "loss": 1.1975, "step": 3473 }, { "epoch": 0.08, "learning_rate": 9.93311784769731e-06, "loss": 0.948, "step": 3474 }, { "epoch": 0.08, "learning_rate": 9.933056611171617e-06, "loss": 1.1386, "step": 3475 }, { "epoch": 0.08, "learning_rate": 9.932995346813953e-06, "loss": 1.15, "step": 3476 }, { "epoch": 0.08, "learning_rate": 9.932934054624666e-06, "loss": 0.9728, "step": 3477 }, { "epoch": 0.08, "learning_rate": 9.9328727346041e-06, "loss": 1.3742, "step": 3478 }, { "epoch": 0.08, "learning_rate": 9.932811386752604e-06, "loss": 1.2573, "step": 3479 }, { "epoch": 0.08, "learning_rate": 9.932750011070518e-06, "loss": 1.0324, "step": 3480 }, { "epoch": 0.08, "learning_rate": 9.932688607558194e-06, "loss": 1.2202, "step": 3481 }, { "epoch": 0.08, "learning_rate": 9.932627176215976e-06, "loss": 1.0489, "step": 3482 }, { "epoch": 0.08, "learning_rate": 9.932565717044211e-06, "loss": 1.0129, "step": 3483 }, { "epoch": 0.08, "learning_rate": 9.932504230043245e-06, "loss": 0.8652, "step": 3484 }, { "epoch": 0.08, "learning_rate": 9.932442715213428e-06, "loss": 1.1004, "step": 3485 }, { "epoch": 0.08, "learning_rate": 9.932381172555102e-06, "loss": 1.1711, "step": 3486 }, { "epoch": 0.08, "learning_rate": 9.932319602068618e-06, "loss": 1.0989, "step": 3487 }, { "epoch": 0.08, "learning_rate": 9.932258003754323e-06, "loss": 1.0953, "step": 3488 }, { "epoch": 0.08, "learning_rate": 9.932196377612562e-06, "loss": 1.1297, "step": 3489 }, { "epoch": 0.08, "learning_rate": 9.932134723643687e-06, "loss": 1.2927, "step": 3490 }, { "epoch": 0.08, "learning_rate": 9.932073041848041e-06, "loss": 1.0929, "step": 3491 }, { "epoch": 0.08, "learning_rate": 9.932011332225976e-06, "loss": 1.2188, "step": 3492 }, { "epoch": 0.08, "learning_rate": 9.931949594777838e-06, "loss": 1.1779, "step": 3493 }, { "epoch": 0.08, "learning_rate": 9.931887829503975e-06, "loss": 1.1716, "step": 3494 }, { "epoch": 0.08, "learning_rate": 9.931826036404737e-06, "loss": 1.037, "step": 3495 }, { "epoch": 0.08, "learning_rate": 9.931764215480472e-06, "loss": 1.0101, "step": 3496 }, { "epoch": 0.08, "learning_rate": 9.931702366731531e-06, "loss": 1.0497, "step": 3497 }, { "epoch": 0.08, "learning_rate": 9.931640490158257e-06, "loss": 1.1495, "step": 3498 }, { "epoch": 0.08, "learning_rate": 9.931578585761005e-06, "loss": 0.9609, "step": 3499 }, { "epoch": 0.08, "learning_rate": 9.93151665354012e-06, "loss": 1.2603, "step": 3500 }, { "epoch": 0.08, "learning_rate": 9.931454693495956e-06, "loss": 1.394, "step": 3501 }, { "epoch": 0.08, "learning_rate": 9.93139270562886e-06, "loss": 0.7966, "step": 3502 }, { "epoch": 0.08, "learning_rate": 9.93133068993918e-06, "loss": 1.2947, "step": 3503 }, { "epoch": 0.08, "learning_rate": 9.931268646427268e-06, "loss": 1.0222, "step": 3504 }, { "epoch": 0.08, "learning_rate": 9.931206575093476e-06, "loss": 1.3151, "step": 3505 }, { "epoch": 0.08, "learning_rate": 9.931144475938148e-06, "loss": 1.1283, "step": 3506 }, { "epoch": 0.08, "learning_rate": 9.931082348961641e-06, "loss": 1.1426, "step": 3507 }, { "epoch": 0.08, "learning_rate": 9.931020194164302e-06, "loss": 0.9333, "step": 3508 }, { "epoch": 0.08, "learning_rate": 9.930958011546482e-06, "loss": 1.2454, "step": 3509 }, { "epoch": 0.08, "learning_rate": 9.930895801108533e-06, "loss": 1.0354, "step": 3510 }, { "epoch": 0.08, "learning_rate": 9.930833562850805e-06, "loss": 1.0678, "step": 3511 }, { "epoch": 0.08, "learning_rate": 9.93077129677365e-06, "loss": 1.1421, "step": 3512 }, { "epoch": 0.08, "learning_rate": 9.93070900287742e-06, "loss": 1.1417, "step": 3513 }, { "epoch": 0.08, "learning_rate": 9.930646681162463e-06, "loss": 1.0791, "step": 3514 }, { "epoch": 0.08, "learning_rate": 9.930584331629132e-06, "loss": 0.9283, "step": 3515 }, { "epoch": 0.08, "learning_rate": 9.930521954277783e-06, "loss": 1.1359, "step": 3516 }, { "epoch": 0.08, "learning_rate": 9.930459549108761e-06, "loss": 1.131, "step": 3517 }, { "epoch": 0.08, "learning_rate": 9.930397116122422e-06, "loss": 1.1293, "step": 3518 }, { "epoch": 0.08, "learning_rate": 9.93033465531912e-06, "loss": 1.0007, "step": 3519 }, { "epoch": 0.08, "learning_rate": 9.930272166699203e-06, "loss": 1.2709, "step": 3520 }, { "epoch": 0.08, "learning_rate": 9.930209650263028e-06, "loss": 1.2406, "step": 3521 }, { "epoch": 0.08, "learning_rate": 9.930147106010946e-06, "loss": 1.2366, "step": 3522 }, { "epoch": 0.08, "learning_rate": 9.930084533943306e-06, "loss": 1.1995, "step": 3523 }, { "epoch": 0.08, "learning_rate": 9.930021934060467e-06, "loss": 1.3349, "step": 3524 }, { "epoch": 0.08, "learning_rate": 9.92995930636278e-06, "loss": 1.0253, "step": 3525 }, { "epoch": 0.08, "learning_rate": 9.929896650850596e-06, "loss": 0.836, "step": 3526 }, { "epoch": 0.08, "learning_rate": 9.929833967524271e-06, "loss": 0.9341, "step": 3527 }, { "epoch": 0.08, "learning_rate": 9.92977125638416e-06, "loss": 1.0695, "step": 3528 }, { "epoch": 0.08, "learning_rate": 9.929708517430612e-06, "loss": 0.906, "step": 3529 }, { "epoch": 0.08, "learning_rate": 9.929645750663985e-06, "loss": 1.2137, "step": 3530 }, { "epoch": 0.08, "learning_rate": 9.92958295608463e-06, "loss": 0.9053, "step": 3531 }, { "epoch": 0.08, "learning_rate": 9.929520133692907e-06, "loss": 0.8109, "step": 3532 }, { "epoch": 0.08, "learning_rate": 9.929457283489165e-06, "loss": 1.2838, "step": 3533 }, { "epoch": 0.08, "learning_rate": 9.929394405473761e-06, "loss": 1.191, "step": 3534 }, { "epoch": 0.08, "learning_rate": 9.929331499647048e-06, "loss": 1.0449, "step": 3535 }, { "epoch": 0.08, "learning_rate": 9.929268566009383e-06, "loss": 1.142, "step": 3536 }, { "epoch": 0.08, "learning_rate": 9.929205604561118e-06, "loss": 1.3716, "step": 3537 }, { "epoch": 0.08, "learning_rate": 9.929142615302611e-06, "loss": 1.1836, "step": 3538 }, { "epoch": 0.08, "learning_rate": 9.92907959823422e-06, "loss": 1.0733, "step": 3539 }, { "epoch": 0.08, "learning_rate": 9.929016553356294e-06, "loss": 1.0938, "step": 3540 }, { "epoch": 0.08, "learning_rate": 9.928953480669192e-06, "loss": 0.9974, "step": 3541 }, { "epoch": 0.08, "learning_rate": 9.92889038017327e-06, "loss": 1.0723, "step": 3542 }, { "epoch": 0.08, "learning_rate": 9.928827251868883e-06, "loss": 1.2356, "step": 3543 }, { "epoch": 0.08, "learning_rate": 9.928764095756389e-06, "loss": 1.0127, "step": 3544 }, { "epoch": 0.08, "learning_rate": 9.928700911836143e-06, "loss": 1.1624, "step": 3545 }, { "epoch": 0.08, "learning_rate": 9.928637700108502e-06, "loss": 1.0323, "step": 3546 }, { "epoch": 0.08, "learning_rate": 9.928574460573822e-06, "loss": 1.1246, "step": 3547 }, { "epoch": 0.08, "learning_rate": 9.928511193232459e-06, "loss": 1.1685, "step": 3548 }, { "epoch": 0.08, "learning_rate": 9.928447898084773e-06, "loss": 1.0897, "step": 3549 }, { "epoch": 0.08, "learning_rate": 9.928384575131118e-06, "loss": 0.7482, "step": 3550 }, { "epoch": 0.08, "learning_rate": 9.928321224371854e-06, "loss": 1.3798, "step": 3551 }, { "epoch": 0.08, "learning_rate": 9.928257845807335e-06, "loss": 1.1854, "step": 3552 }, { "epoch": 0.08, "learning_rate": 9.928194439437921e-06, "loss": 1.0511, "step": 3553 }, { "epoch": 0.08, "learning_rate": 9.92813100526397e-06, "loss": 1.0621, "step": 3554 }, { "epoch": 0.08, "learning_rate": 9.928067543285838e-06, "loss": 1.1448, "step": 3555 }, { "epoch": 0.08, "learning_rate": 9.928004053503886e-06, "loss": 0.9073, "step": 3556 }, { "epoch": 0.08, "learning_rate": 9.927940535918467e-06, "loss": 0.9616, "step": 3557 }, { "epoch": 0.08, "learning_rate": 9.927876990529945e-06, "loss": 0.9045, "step": 3558 }, { "epoch": 0.08, "learning_rate": 9.927813417338677e-06, "loss": 0.9117, "step": 3559 }, { "epoch": 0.08, "learning_rate": 9.92774981634502e-06, "loss": 0.7893, "step": 3560 }, { "epoch": 0.08, "learning_rate": 9.927686187549332e-06, "loss": 1.0721, "step": 3561 }, { "epoch": 0.08, "learning_rate": 9.927622530951978e-06, "loss": 0.9731, "step": 3562 }, { "epoch": 0.08, "learning_rate": 9.92755884655331e-06, "loss": 1.1161, "step": 3563 }, { "epoch": 0.08, "learning_rate": 9.927495134353689e-06, "loss": 1.2064, "step": 3564 }, { "epoch": 0.08, "learning_rate": 9.927431394353477e-06, "loss": 0.9905, "step": 3565 }, { "epoch": 0.08, "learning_rate": 9.927367626553031e-06, "loss": 0.9025, "step": 3566 }, { "epoch": 0.08, "learning_rate": 9.927303830952713e-06, "loss": 1.0226, "step": 3567 }, { "epoch": 0.08, "learning_rate": 9.927240007552883e-06, "loss": 1.0459, "step": 3568 }, { "epoch": 0.08, "learning_rate": 9.9271761563539e-06, "loss": 1.2041, "step": 3569 }, { "epoch": 0.08, "learning_rate": 9.927112277356122e-06, "loss": 0.9871, "step": 3570 }, { "epoch": 0.08, "learning_rate": 9.927048370559912e-06, "loss": 1.087, "step": 3571 }, { "epoch": 0.08, "learning_rate": 9.926984435965631e-06, "loss": 0.8951, "step": 3572 }, { "epoch": 0.08, "learning_rate": 9.92692047357364e-06, "loss": 0.8949, "step": 3573 }, { "epoch": 0.08, "learning_rate": 9.9268564833843e-06, "loss": 1.0545, "step": 3574 }, { "epoch": 0.08, "learning_rate": 9.926792465397968e-06, "loss": 1.1797, "step": 3575 }, { "epoch": 0.08, "learning_rate": 9.926728419615009e-06, "loss": 1.0544, "step": 3576 }, { "epoch": 0.08, "learning_rate": 9.926664346035782e-06, "loss": 1.2566, "step": 3577 }, { "epoch": 0.08, "learning_rate": 9.926600244660651e-06, "loss": 1.1934, "step": 3578 }, { "epoch": 0.08, "learning_rate": 9.926536115489977e-06, "loss": 1.2225, "step": 3579 }, { "epoch": 0.08, "learning_rate": 9.926471958524123e-06, "loss": 1.1859, "step": 3580 }, { "epoch": 0.08, "learning_rate": 9.926407773763445e-06, "loss": 1.3894, "step": 3581 }, { "epoch": 0.08, "learning_rate": 9.926343561208313e-06, "loss": 1.0488, "step": 3582 }, { "epoch": 0.08, "learning_rate": 9.926279320859085e-06, "loss": 1.0484, "step": 3583 }, { "epoch": 0.08, "learning_rate": 9.926215052716123e-06, "loss": 1.1877, "step": 3584 }, { "epoch": 0.08, "learning_rate": 9.92615075677979e-06, "loss": 1.1649, "step": 3585 }, { "epoch": 0.08, "learning_rate": 9.926086433050453e-06, "loss": 1.1806, "step": 3586 }, { "epoch": 0.08, "learning_rate": 9.926022081528468e-06, "loss": 1.1432, "step": 3587 }, { "epoch": 0.08, "learning_rate": 9.925957702214203e-06, "loss": 0.9977, "step": 3588 }, { "epoch": 0.08, "learning_rate": 9.92589329510802e-06, "loss": 1.218, "step": 3589 }, { "epoch": 0.08, "learning_rate": 9.925828860210282e-06, "loss": 1.1757, "step": 3590 }, { "epoch": 0.08, "learning_rate": 9.925764397521352e-06, "loss": 0.9809, "step": 3591 }, { "epoch": 0.08, "learning_rate": 9.925699907041594e-06, "loss": 1.319, "step": 3592 }, { "epoch": 0.08, "learning_rate": 9.925635388771373e-06, "loss": 1.1844, "step": 3593 }, { "epoch": 0.08, "learning_rate": 9.925570842711051e-06, "loss": 1.1141, "step": 3594 }, { "epoch": 0.08, "learning_rate": 9.925506268860995e-06, "loss": 0.9184, "step": 3595 }, { "epoch": 0.08, "learning_rate": 9.925441667221566e-06, "loss": 1.1112, "step": 3596 }, { "epoch": 0.08, "learning_rate": 9.925377037793131e-06, "loss": 1.0517, "step": 3597 }, { "epoch": 0.08, "learning_rate": 9.925312380576056e-06, "loss": 1.1002, "step": 3598 }, { "epoch": 0.08, "learning_rate": 9.9252476955707e-06, "loss": 1.4679, "step": 3599 }, { "epoch": 0.08, "learning_rate": 9.925182982777433e-06, "loss": 1.3348, "step": 3600 }, { "epoch": 0.08, "learning_rate": 9.925118242196618e-06, "loss": 1.3152, "step": 3601 }, { "epoch": 0.08, "learning_rate": 9.925053473828622e-06, "loss": 0.8892, "step": 3602 }, { "epoch": 0.08, "learning_rate": 9.924988677673808e-06, "loss": 1.0765, "step": 3603 }, { "epoch": 0.08, "learning_rate": 9.924923853732544e-06, "loss": 0.966, "step": 3604 }, { "epoch": 0.08, "learning_rate": 9.924859002005195e-06, "loss": 1.1189, "step": 3605 }, { "epoch": 0.08, "learning_rate": 9.924794122492125e-06, "loss": 0.9898, "step": 3606 }, { "epoch": 0.08, "learning_rate": 9.924729215193702e-06, "loss": 0.8175, "step": 3607 }, { "epoch": 0.08, "learning_rate": 9.924664280110292e-06, "loss": 1.0341, "step": 3608 }, { "epoch": 0.08, "learning_rate": 9.924599317242262e-06, "loss": 1.4236, "step": 3609 }, { "epoch": 0.08, "learning_rate": 9.924534326589976e-06, "loss": 0.8853, "step": 3610 }, { "epoch": 0.08, "learning_rate": 9.924469308153803e-06, "loss": 1.0173, "step": 3611 }, { "epoch": 0.08, "learning_rate": 9.924404261934109e-06, "loss": 1.2083, "step": 3612 }, { "epoch": 0.08, "learning_rate": 9.924339187931262e-06, "loss": 1.087, "step": 3613 }, { "epoch": 0.08, "learning_rate": 9.924274086145627e-06, "loss": 1.1529, "step": 3614 }, { "epoch": 0.08, "learning_rate": 9.924208956577573e-06, "loss": 0.9577, "step": 3615 }, { "epoch": 0.08, "learning_rate": 9.924143799227468e-06, "loss": 1.1519, "step": 3616 }, { "epoch": 0.08, "learning_rate": 9.924078614095678e-06, "loss": 1.0873, "step": 3617 }, { "epoch": 0.08, "learning_rate": 9.92401340118257e-06, "loss": 1.3415, "step": 3618 }, { "epoch": 0.08, "learning_rate": 9.923948160488515e-06, "loss": 1.008, "step": 3619 }, { "epoch": 0.08, "learning_rate": 9.923882892013879e-06, "loss": 1.0259, "step": 3620 }, { "epoch": 0.08, "learning_rate": 9.92381759575903e-06, "loss": 1.1625, "step": 3621 }, { "epoch": 0.08, "learning_rate": 9.923752271724338e-06, "loss": 1.0245, "step": 3622 }, { "epoch": 0.08, "learning_rate": 9.923686919910169e-06, "loss": 1.1024, "step": 3623 }, { "epoch": 0.08, "learning_rate": 9.923621540316894e-06, "loss": 1.0017, "step": 3624 }, { "epoch": 0.08, "learning_rate": 9.923556132944883e-06, "loss": 1.222, "step": 3625 }, { "epoch": 0.08, "learning_rate": 9.923490697794502e-06, "loss": 1.1062, "step": 3626 }, { "epoch": 0.08, "learning_rate": 9.923425234866121e-06, "loss": 0.9865, "step": 3627 }, { "epoch": 0.08, "learning_rate": 9.92335974416011e-06, "loss": 0.97, "step": 3628 }, { "epoch": 0.08, "learning_rate": 9.923294225676839e-06, "loss": 1.2894, "step": 3629 }, { "epoch": 0.08, "learning_rate": 9.923228679416674e-06, "loss": 1.0392, "step": 3630 }, { "epoch": 0.08, "learning_rate": 9.92316310537999e-06, "loss": 0.9698, "step": 3631 }, { "epoch": 0.08, "learning_rate": 9.923097503567155e-06, "loss": 1.0764, "step": 3632 }, { "epoch": 0.08, "learning_rate": 9.923031873978539e-06, "loss": 1.0201, "step": 3633 }, { "epoch": 0.08, "learning_rate": 9.92296621661451e-06, "loss": 0.8702, "step": 3634 }, { "epoch": 0.08, "learning_rate": 9.922900531475442e-06, "loss": 1.3205, "step": 3635 }, { "epoch": 0.08, "learning_rate": 9.922834818561702e-06, "loss": 0.9985, "step": 3636 }, { "epoch": 0.08, "learning_rate": 9.922769077873666e-06, "loss": 0.953, "step": 3637 }, { "epoch": 0.08, "learning_rate": 9.9227033094117e-06, "loss": 1.1149, "step": 3638 }, { "epoch": 0.08, "learning_rate": 9.922637513176177e-06, "loss": 1.2395, "step": 3639 }, { "epoch": 0.08, "learning_rate": 9.922571689167468e-06, "loss": 1.1465, "step": 3640 }, { "epoch": 0.08, "learning_rate": 9.922505837385944e-06, "loss": 0.901, "step": 3641 }, { "epoch": 0.08, "learning_rate": 9.922439957831977e-06, "loss": 1.1392, "step": 3642 }, { "epoch": 0.08, "learning_rate": 9.92237405050594e-06, "loss": 1.051, "step": 3643 }, { "epoch": 0.08, "learning_rate": 9.922308115408202e-06, "loss": 0.8467, "step": 3644 }, { "epoch": 0.08, "learning_rate": 9.922242152539136e-06, "loss": 0.8413, "step": 3645 }, { "epoch": 0.08, "learning_rate": 9.922176161899115e-06, "loss": 1.174, "step": 3646 }, { "epoch": 0.08, "learning_rate": 9.92211014348851e-06, "loss": 1.0193, "step": 3647 }, { "epoch": 0.08, "learning_rate": 9.922044097307695e-06, "loss": 1.1978, "step": 3648 }, { "epoch": 0.08, "learning_rate": 9.921978023357044e-06, "loss": 1.5048, "step": 3649 }, { "epoch": 0.08, "learning_rate": 9.921911921636927e-06, "loss": 0.9285, "step": 3650 }, { "epoch": 0.08, "learning_rate": 9.921845792147715e-06, "loss": 1.044, "step": 3651 }, { "epoch": 0.08, "learning_rate": 9.921779634889786e-06, "loss": 0.9277, "step": 3652 }, { "epoch": 0.08, "learning_rate": 9.921713449863512e-06, "loss": 0.9583, "step": 3653 }, { "epoch": 0.08, "learning_rate": 9.921647237069264e-06, "loss": 1.1493, "step": 3654 }, { "epoch": 0.08, "learning_rate": 9.921580996507417e-06, "loss": 1.035, "step": 3655 }, { "epoch": 0.08, "learning_rate": 9.921514728178346e-06, "loss": 1.0823, "step": 3656 }, { "epoch": 0.08, "learning_rate": 9.921448432082422e-06, "loss": 0.8856, "step": 3657 }, { "epoch": 0.08, "learning_rate": 9.921382108220021e-06, "loss": 1.1305, "step": 3658 }, { "epoch": 0.08, "learning_rate": 9.921315756591518e-06, "loss": 1.0947, "step": 3659 }, { "epoch": 0.08, "learning_rate": 9.921249377197287e-06, "loss": 1.2638, "step": 3660 }, { "epoch": 0.08, "learning_rate": 9.9211829700377e-06, "loss": 1.2225, "step": 3661 }, { "epoch": 0.08, "learning_rate": 9.921116535113133e-06, "loss": 1.0698, "step": 3662 }, { "epoch": 0.08, "learning_rate": 9.921050072423964e-06, "loss": 1.0206, "step": 3663 }, { "epoch": 0.08, "learning_rate": 9.920983581970562e-06, "loss": 1.107, "step": 3664 }, { "epoch": 0.08, "learning_rate": 9.920917063753305e-06, "loss": 1.2569, "step": 3665 }, { "epoch": 0.09, "learning_rate": 9.920850517772572e-06, "loss": 1.1678, "step": 3666 }, { "epoch": 0.09, "learning_rate": 9.920783944028733e-06, "loss": 1.1453, "step": 3667 }, { "epoch": 0.09, "learning_rate": 9.920717342522166e-06, "loss": 1.0678, "step": 3668 }, { "epoch": 0.09, "learning_rate": 9.920650713253248e-06, "loss": 1.0795, "step": 3669 }, { "epoch": 0.09, "learning_rate": 9.920584056222351e-06, "loss": 1.1097, "step": 3670 }, { "epoch": 0.09, "learning_rate": 9.920517371429854e-06, "loss": 1.0719, "step": 3671 }, { "epoch": 0.09, "learning_rate": 9.920450658876134e-06, "loss": 1.0431, "step": 3672 }, { "epoch": 0.09, "learning_rate": 9.920383918561565e-06, "loss": 1.1001, "step": 3673 }, { "epoch": 0.09, "learning_rate": 9.920317150486525e-06, "loss": 1.0639, "step": 3674 }, { "epoch": 0.09, "learning_rate": 9.920250354651391e-06, "loss": 1.1795, "step": 3675 }, { "epoch": 0.09, "learning_rate": 9.920183531056538e-06, "loss": 0.9792, "step": 3676 }, { "epoch": 0.09, "learning_rate": 9.920116679702345e-06, "loss": 1.0147, "step": 3677 }, { "epoch": 0.09, "learning_rate": 9.920049800589186e-06, "loss": 1.2173, "step": 3678 }, { "epoch": 0.09, "learning_rate": 9.919982893717443e-06, "loss": 1.2846, "step": 3679 }, { "epoch": 0.09, "learning_rate": 9.919915959087492e-06, "loss": 0.9355, "step": 3680 }, { "epoch": 0.09, "learning_rate": 9.919848996699707e-06, "loss": 1.0979, "step": 3681 }, { "epoch": 0.09, "learning_rate": 9.91978200655447e-06, "loss": 1.312, "step": 3682 }, { "epoch": 0.09, "learning_rate": 9.919714988652158e-06, "loss": 1.2684, "step": 3683 }, { "epoch": 0.09, "learning_rate": 9.91964794299315e-06, "loss": 1.0335, "step": 3684 }, { "epoch": 0.09, "learning_rate": 9.919580869577821e-06, "loss": 1.0825, "step": 3685 }, { "epoch": 0.09, "learning_rate": 9.919513768406551e-06, "loss": 0.9661, "step": 3686 }, { "epoch": 0.09, "learning_rate": 9.91944663947972e-06, "loss": 1.1527, "step": 3687 }, { "epoch": 0.09, "learning_rate": 9.919379482797705e-06, "loss": 0.9061, "step": 3688 }, { "epoch": 0.09, "learning_rate": 9.919312298360886e-06, "loss": 1.01, "step": 3689 }, { "epoch": 0.09, "learning_rate": 9.919245086169642e-06, "loss": 1.226, "step": 3690 }, { "epoch": 0.09, "learning_rate": 9.919177846224351e-06, "loss": 0.9577, "step": 3691 }, { "epoch": 0.09, "learning_rate": 9.919110578525392e-06, "loss": 1.1713, "step": 3692 }, { "epoch": 0.09, "learning_rate": 9.919043283073148e-06, "loss": 0.9858, "step": 3693 }, { "epoch": 0.09, "learning_rate": 9.918975959867996e-06, "loss": 1.1732, "step": 3694 }, { "epoch": 0.09, "learning_rate": 9.918908608910316e-06, "loss": 1.1784, "step": 3695 }, { "epoch": 0.09, "learning_rate": 9.918841230200488e-06, "loss": 1.0584, "step": 3696 }, { "epoch": 0.09, "learning_rate": 9.918773823738892e-06, "loss": 1.104, "step": 3697 }, { "epoch": 0.09, "learning_rate": 9.918706389525909e-06, "loss": 1.0251, "step": 3698 }, { "epoch": 0.09, "learning_rate": 9.91863892756192e-06, "loss": 0.8642, "step": 3699 }, { "epoch": 0.09, "learning_rate": 9.918571437847305e-06, "loss": 0.9352, "step": 3700 }, { "epoch": 0.09, "learning_rate": 9.918503920382443e-06, "loss": 0.9593, "step": 3701 }, { "epoch": 0.09, "learning_rate": 9.918436375167718e-06, "loss": 0.9345, "step": 3702 }, { "epoch": 0.09, "learning_rate": 9.918368802203507e-06, "loss": 0.8397, "step": 3703 }, { "epoch": 0.09, "learning_rate": 9.918301201490194e-06, "loss": 1.2361, "step": 3704 }, { "epoch": 0.09, "learning_rate": 9.918233573028161e-06, "loss": 0.97, "step": 3705 }, { "epoch": 0.09, "learning_rate": 9.91816591681779e-06, "loss": 1.0955, "step": 3706 }, { "epoch": 0.09, "learning_rate": 9.918098232859461e-06, "loss": 1.201, "step": 3707 }, { "epoch": 0.09, "learning_rate": 9.918030521153556e-06, "loss": 1.1851, "step": 3708 }, { "epoch": 0.09, "learning_rate": 9.917962781700457e-06, "loss": 1.1446, "step": 3709 }, { "epoch": 0.09, "learning_rate": 9.917895014500547e-06, "loss": 1.226, "step": 3710 }, { "epoch": 0.09, "learning_rate": 9.917827219554208e-06, "loss": 0.8733, "step": 3711 }, { "epoch": 0.09, "learning_rate": 9.917759396861822e-06, "loss": 1.1928, "step": 3712 }, { "epoch": 0.09, "learning_rate": 9.917691546423772e-06, "loss": 1.0884, "step": 3713 }, { "epoch": 0.09, "learning_rate": 9.917623668240441e-06, "loss": 0.9168, "step": 3714 }, { "epoch": 0.09, "learning_rate": 9.91755576231221e-06, "loss": 0.9904, "step": 3715 }, { "epoch": 0.09, "learning_rate": 9.917487828639466e-06, "loss": 1.1098, "step": 3716 }, { "epoch": 0.09, "learning_rate": 9.917419867222589e-06, "loss": 1.0434, "step": 3717 }, { "epoch": 0.09, "learning_rate": 9.917351878061965e-06, "loss": 0.9025, "step": 3718 }, { "epoch": 0.09, "learning_rate": 9.917283861157975e-06, "loss": 0.9091, "step": 3719 }, { "epoch": 0.09, "learning_rate": 9.917215816511003e-06, "loss": 1.0702, "step": 3720 }, { "epoch": 0.09, "learning_rate": 9.917147744121436e-06, "loss": 0.9507, "step": 3721 }, { "epoch": 0.09, "learning_rate": 9.917079643989654e-06, "loss": 0.9454, "step": 3722 }, { "epoch": 0.09, "learning_rate": 9.917011516116043e-06, "loss": 1.0536, "step": 3723 }, { "epoch": 0.09, "learning_rate": 9.91694336050099e-06, "loss": 1.012, "step": 3724 }, { "epoch": 0.09, "learning_rate": 9.916875177144876e-06, "loss": 1.1083, "step": 3725 }, { "epoch": 0.09, "learning_rate": 9.916806966048086e-06, "loss": 1.1436, "step": 3726 }, { "epoch": 0.09, "learning_rate": 9.916738727211006e-06, "loss": 1.0453, "step": 3727 }, { "epoch": 0.09, "learning_rate": 9.916670460634019e-06, "loss": 1.1277, "step": 3728 }, { "epoch": 0.09, "learning_rate": 9.916602166317514e-06, "loss": 1.0682, "step": 3729 }, { "epoch": 0.09, "learning_rate": 9.916533844261873e-06, "loss": 1.3004, "step": 3730 }, { "epoch": 0.09, "learning_rate": 9.916465494467482e-06, "loss": 0.9853, "step": 3731 }, { "epoch": 0.09, "learning_rate": 9.916397116934727e-06, "loss": 1.166, "step": 3732 }, { "epoch": 0.09, "learning_rate": 9.916328711663996e-06, "loss": 0.9057, "step": 3733 }, { "epoch": 0.09, "learning_rate": 9.91626027865567e-06, "loss": 0.9822, "step": 3734 }, { "epoch": 0.09, "learning_rate": 9.916191817910139e-06, "loss": 1.1517, "step": 3735 }, { "epoch": 0.09, "learning_rate": 9.916123329427789e-06, "loss": 1.1519, "step": 3736 }, { "epoch": 0.09, "learning_rate": 9.916054813209005e-06, "loss": 1.1857, "step": 3737 }, { "epoch": 0.09, "learning_rate": 9.915986269254174e-06, "loss": 0.8614, "step": 3738 }, { "epoch": 0.09, "learning_rate": 9.915917697563681e-06, "loss": 1.093, "step": 3739 }, { "epoch": 0.09, "learning_rate": 9.915849098137918e-06, "loss": 1.0327, "step": 3740 }, { "epoch": 0.09, "learning_rate": 9.915780470977267e-06, "loss": 1.0652, "step": 3741 }, { "epoch": 0.09, "learning_rate": 9.915711816082117e-06, "loss": 1.2055, "step": 3742 }, { "epoch": 0.09, "learning_rate": 9.915643133452856e-06, "loss": 1.1141, "step": 3743 }, { "epoch": 0.09, "learning_rate": 9.915574423089872e-06, "loss": 0.954, "step": 3744 }, { "epoch": 0.09, "learning_rate": 9.91550568499355e-06, "loss": 1.1744, "step": 3745 }, { "epoch": 0.09, "learning_rate": 9.91543691916428e-06, "loss": 1.3114, "step": 3746 }, { "epoch": 0.09, "learning_rate": 9.915368125602447e-06, "loss": 1.1126, "step": 3747 }, { "epoch": 0.09, "learning_rate": 9.915299304308442e-06, "loss": 1.1265, "step": 3748 }, { "epoch": 0.09, "learning_rate": 9.915230455282654e-06, "loss": 1.0395, "step": 3749 }, { "epoch": 0.09, "learning_rate": 9.91516157852547e-06, "loss": 1.0281, "step": 3750 }, { "epoch": 0.09, "learning_rate": 9.915092674037277e-06, "loss": 0.8867, "step": 3751 }, { "epoch": 0.09, "learning_rate": 9.915023741818467e-06, "loss": 1.1487, "step": 3752 }, { "epoch": 0.09, "learning_rate": 9.914954781869427e-06, "loss": 0.8587, "step": 3753 }, { "epoch": 0.09, "learning_rate": 9.914885794190547e-06, "loss": 0.8964, "step": 3754 }, { "epoch": 0.09, "learning_rate": 9.914816778782215e-06, "loss": 0.9998, "step": 3755 }, { "epoch": 0.09, "learning_rate": 9.91474773564482e-06, "loss": 0.9755, "step": 3756 }, { "epoch": 0.09, "learning_rate": 9.914678664778755e-06, "loss": 0.9775, "step": 3757 }, { "epoch": 0.09, "learning_rate": 9.914609566184406e-06, "loss": 1.117, "step": 3758 }, { "epoch": 0.09, "learning_rate": 9.914540439862164e-06, "loss": 1.1446, "step": 3759 }, { "epoch": 0.09, "learning_rate": 9.914471285812419e-06, "loss": 1.0915, "step": 3760 }, { "epoch": 0.09, "learning_rate": 9.914402104035561e-06, "loss": 0.9254, "step": 3761 }, { "epoch": 0.09, "learning_rate": 9.914332894531983e-06, "loss": 1.0542, "step": 3762 }, { "epoch": 0.09, "learning_rate": 9.91426365730207e-06, "loss": 0.9362, "step": 3763 }, { "epoch": 0.09, "learning_rate": 9.914194392346218e-06, "loss": 1.1406, "step": 3764 }, { "epoch": 0.09, "learning_rate": 9.914125099664814e-06, "loss": 0.9175, "step": 3765 }, { "epoch": 0.09, "learning_rate": 9.914055779258252e-06, "loss": 1.0153, "step": 3766 }, { "epoch": 0.09, "learning_rate": 9.913986431126921e-06, "loss": 0.8396, "step": 3767 }, { "epoch": 0.09, "learning_rate": 9.913917055271212e-06, "loss": 1.2799, "step": 3768 }, { "epoch": 0.09, "learning_rate": 9.913847651691517e-06, "loss": 1.0863, "step": 3769 }, { "epoch": 0.09, "learning_rate": 9.913778220388228e-06, "loss": 0.927, "step": 3770 }, { "epoch": 0.09, "learning_rate": 9.913708761361738e-06, "loss": 1.1795, "step": 3771 }, { "epoch": 0.09, "learning_rate": 9.913639274612435e-06, "loss": 0.9498, "step": 3772 }, { "epoch": 0.09, "learning_rate": 9.913569760140716e-06, "loss": 1.1725, "step": 3773 }, { "epoch": 0.09, "learning_rate": 9.913500217946967e-06, "loss": 1.3426, "step": 3774 }, { "epoch": 0.09, "learning_rate": 9.913430648031588e-06, "loss": 0.7791, "step": 3775 }, { "epoch": 0.09, "learning_rate": 9.913361050394964e-06, "loss": 0.971, "step": 3776 }, { "epoch": 0.09, "learning_rate": 9.913291425037495e-06, "loss": 0.8805, "step": 3777 }, { "epoch": 0.09, "learning_rate": 9.913221771959568e-06, "loss": 0.9995, "step": 3778 }, { "epoch": 0.09, "learning_rate": 9.913152091161578e-06, "loss": 0.9688, "step": 3779 }, { "epoch": 0.09, "learning_rate": 9.913082382643918e-06, "loss": 1.1575, "step": 3780 }, { "epoch": 0.09, "learning_rate": 9.91301264640698e-06, "loss": 0.8514, "step": 3781 }, { "epoch": 0.09, "learning_rate": 9.91294288245116e-06, "loss": 0.9803, "step": 3782 }, { "epoch": 0.09, "learning_rate": 9.91287309077685e-06, "loss": 1.0417, "step": 3783 }, { "epoch": 0.09, "learning_rate": 9.912803271384446e-06, "loss": 0.8738, "step": 3784 }, { "epoch": 0.09, "learning_rate": 9.912733424274339e-06, "loss": 1.2328, "step": 3785 }, { "epoch": 0.09, "learning_rate": 9.912663549446925e-06, "loss": 1.1324, "step": 3786 }, { "epoch": 0.09, "learning_rate": 9.912593646902596e-06, "loss": 0.9733, "step": 3787 }, { "epoch": 0.09, "learning_rate": 9.912523716641749e-06, "loss": 0.85, "step": 3788 }, { "epoch": 0.09, "learning_rate": 9.912453758664777e-06, "loss": 1.1061, "step": 3789 }, { "epoch": 0.09, "learning_rate": 9.912383772972075e-06, "loss": 1.027, "step": 3790 }, { "epoch": 0.09, "learning_rate": 9.912313759564036e-06, "loss": 0.8919, "step": 3791 }, { "epoch": 0.09, "learning_rate": 9.91224371844106e-06, "loss": 1.2297, "step": 3792 }, { "epoch": 0.09, "learning_rate": 9.912173649603537e-06, "loss": 1.0727, "step": 3793 }, { "epoch": 0.09, "learning_rate": 9.912103553051865e-06, "loss": 1.4545, "step": 3794 }, { "epoch": 0.09, "learning_rate": 9.912033428786438e-06, "loss": 1.2264, "step": 3795 }, { "epoch": 0.09, "learning_rate": 9.911963276807655e-06, "loss": 1.1732, "step": 3796 }, { "epoch": 0.09, "learning_rate": 9.911893097115909e-06, "loss": 1.0697, "step": 3797 }, { "epoch": 0.09, "learning_rate": 9.911822889711592e-06, "loss": 1.0343, "step": 3798 }, { "epoch": 0.09, "learning_rate": 9.911752654595108e-06, "loss": 1.0071, "step": 3799 }, { "epoch": 0.09, "learning_rate": 9.911682391766849e-06, "loss": 0.9824, "step": 3800 }, { "epoch": 0.09, "learning_rate": 9.911612101227213e-06, "loss": 1.464, "step": 3801 }, { "epoch": 0.09, "learning_rate": 9.911541782976594e-06, "loss": 1.0466, "step": 3802 }, { "epoch": 0.09, "learning_rate": 9.911471437015391e-06, "loss": 0.9161, "step": 3803 }, { "epoch": 0.09, "learning_rate": 9.911401063344e-06, "loss": 0.9835, "step": 3804 }, { "epoch": 0.09, "learning_rate": 9.91133066196282e-06, "loss": 1.2182, "step": 3805 }, { "epoch": 0.09, "learning_rate": 9.911260232872244e-06, "loss": 1.0482, "step": 3806 }, { "epoch": 0.09, "learning_rate": 9.911189776072671e-06, "loss": 1.3007, "step": 3807 }, { "epoch": 0.09, "learning_rate": 9.911119291564503e-06, "loss": 1.1477, "step": 3808 }, { "epoch": 0.09, "learning_rate": 9.911048779348132e-06, "loss": 0.822, "step": 3809 }, { "epoch": 0.09, "learning_rate": 9.910978239423958e-06, "loss": 0.8567, "step": 3810 }, { "epoch": 0.09, "learning_rate": 9.910907671792379e-06, "loss": 1.0592, "step": 3811 }, { "epoch": 0.09, "learning_rate": 9.910837076453791e-06, "loss": 1.2224, "step": 3812 }, { "epoch": 0.09, "learning_rate": 9.910766453408597e-06, "loss": 1.1927, "step": 3813 }, { "epoch": 0.09, "learning_rate": 9.910695802657192e-06, "loss": 0.988, "step": 3814 }, { "epoch": 0.09, "learning_rate": 9.910625124199975e-06, "loss": 0.9794, "step": 3815 }, { "epoch": 0.09, "learning_rate": 9.910554418037345e-06, "loss": 1.1168, "step": 3816 }, { "epoch": 0.09, "learning_rate": 9.9104836841697e-06, "loss": 1.0701, "step": 3817 }, { "epoch": 0.09, "learning_rate": 9.910412922597443e-06, "loss": 1.115, "step": 3818 }, { "epoch": 0.09, "learning_rate": 9.910342133320967e-06, "loss": 0.895, "step": 3819 }, { "epoch": 0.09, "learning_rate": 9.910271316340676e-06, "loss": 0.8771, "step": 3820 }, { "epoch": 0.09, "learning_rate": 9.910200471656968e-06, "loss": 1.0409, "step": 3821 }, { "epoch": 0.09, "learning_rate": 9.910129599270245e-06, "loss": 0.9681, "step": 3822 }, { "epoch": 0.09, "learning_rate": 9.910058699180902e-06, "loss": 1.4135, "step": 3823 }, { "epoch": 0.09, "learning_rate": 9.909987771389344e-06, "loss": 0.8153, "step": 3824 }, { "epoch": 0.09, "learning_rate": 9.909916815895967e-06, "loss": 1.2163, "step": 3825 }, { "epoch": 0.09, "learning_rate": 9.909845832701175e-06, "loss": 1.1835, "step": 3826 }, { "epoch": 0.09, "learning_rate": 9.909774821805365e-06, "loss": 1.0871, "step": 3827 }, { "epoch": 0.09, "learning_rate": 9.909703783208941e-06, "loss": 1.1234, "step": 3828 }, { "epoch": 0.09, "learning_rate": 9.909632716912302e-06, "loss": 0.839, "step": 3829 }, { "epoch": 0.09, "learning_rate": 9.909561622915848e-06, "loss": 1.1987, "step": 3830 }, { "epoch": 0.09, "learning_rate": 9.909490501219981e-06, "loss": 0.8323, "step": 3831 }, { "epoch": 0.09, "learning_rate": 9.909419351825105e-06, "loss": 1.0882, "step": 3832 }, { "epoch": 0.09, "learning_rate": 9.909348174731616e-06, "loss": 0.8674, "step": 3833 }, { "epoch": 0.09, "learning_rate": 9.909276969939921e-06, "loss": 1.0741, "step": 3834 }, { "epoch": 0.09, "learning_rate": 9.909205737450418e-06, "loss": 0.9801, "step": 3835 }, { "epoch": 0.09, "learning_rate": 9.90913447726351e-06, "loss": 1.0415, "step": 3836 }, { "epoch": 0.09, "learning_rate": 9.9090631893796e-06, "loss": 0.8129, "step": 3837 }, { "epoch": 0.09, "learning_rate": 9.908991873799088e-06, "loss": 1.1192, "step": 3838 }, { "epoch": 0.09, "learning_rate": 9.908920530522379e-06, "loss": 1.0697, "step": 3839 }, { "epoch": 0.09, "learning_rate": 9.908849159549875e-06, "loss": 1.091, "step": 3840 }, { "epoch": 0.09, "learning_rate": 9.908777760881976e-06, "loss": 1.1562, "step": 3841 }, { "epoch": 0.09, "learning_rate": 9.90870633451909e-06, "loss": 0.9782, "step": 3842 }, { "epoch": 0.09, "learning_rate": 9.908634880461614e-06, "loss": 0.934, "step": 3843 }, { "epoch": 0.09, "learning_rate": 9.908563398709954e-06, "loss": 0.9052, "step": 3844 }, { "epoch": 0.09, "learning_rate": 9.908491889264513e-06, "loss": 1.1406, "step": 3845 }, { "epoch": 0.09, "learning_rate": 9.908420352125695e-06, "loss": 1.4209, "step": 3846 }, { "epoch": 0.09, "learning_rate": 9.908348787293905e-06, "loss": 1.2081, "step": 3847 }, { "epoch": 0.09, "learning_rate": 9.908277194769543e-06, "loss": 1.138, "step": 3848 }, { "epoch": 0.09, "learning_rate": 9.908205574553015e-06, "loss": 1.005, "step": 3849 }, { "epoch": 0.09, "learning_rate": 9.908133926644725e-06, "loss": 1.088, "step": 3850 }, { "epoch": 0.09, "learning_rate": 9.908062251045079e-06, "loss": 1.1588, "step": 3851 }, { "epoch": 0.09, "learning_rate": 9.907990547754477e-06, "loss": 0.9368, "step": 3852 }, { "epoch": 0.09, "learning_rate": 9.907918816773327e-06, "loss": 0.9271, "step": 3853 }, { "epoch": 0.09, "learning_rate": 9.907847058102034e-06, "loss": 0.8953, "step": 3854 }, { "epoch": 0.09, "learning_rate": 9.907775271741e-06, "loss": 1.0076, "step": 3855 }, { "epoch": 0.09, "learning_rate": 9.907703457690634e-06, "loss": 1.1342, "step": 3856 }, { "epoch": 0.09, "learning_rate": 9.907631615951337e-06, "loss": 1.0615, "step": 3857 }, { "epoch": 0.09, "learning_rate": 9.907559746523517e-06, "loss": 1.0921, "step": 3858 }, { "epoch": 0.09, "learning_rate": 9.90748784940758e-06, "loss": 1.2323, "step": 3859 }, { "epoch": 0.09, "learning_rate": 9.907415924603929e-06, "loss": 0.8347, "step": 3860 }, { "epoch": 0.09, "learning_rate": 9.907343972112971e-06, "loss": 1.1413, "step": 3861 }, { "epoch": 0.09, "learning_rate": 9.907271991935112e-06, "loss": 1.0621, "step": 3862 }, { "epoch": 0.09, "learning_rate": 9.907199984070758e-06, "loss": 0.9539, "step": 3863 }, { "epoch": 0.09, "learning_rate": 9.907127948520316e-06, "loss": 0.8033, "step": 3864 }, { "epoch": 0.09, "learning_rate": 9.907055885284192e-06, "loss": 0.804, "step": 3865 }, { "epoch": 0.09, "learning_rate": 9.906983794362792e-06, "loss": 0.8833, "step": 3866 }, { "epoch": 0.09, "learning_rate": 9.906911675756524e-06, "loss": 0.8445, "step": 3867 }, { "epoch": 0.09, "learning_rate": 9.906839529465794e-06, "loss": 1.195, "step": 3868 }, { "epoch": 0.09, "learning_rate": 9.90676735549101e-06, "loss": 0.8837, "step": 3869 }, { "epoch": 0.09, "learning_rate": 9.906695153832577e-06, "loss": 1.1319, "step": 3870 }, { "epoch": 0.09, "learning_rate": 9.906622924490903e-06, "loss": 1.015, "step": 3871 }, { "epoch": 0.09, "learning_rate": 9.906550667466397e-06, "loss": 0.9704, "step": 3872 }, { "epoch": 0.09, "learning_rate": 9.906478382759466e-06, "loss": 0.993, "step": 3873 }, { "epoch": 0.09, "learning_rate": 9.906406070370518e-06, "loss": 1.0891, "step": 3874 }, { "epoch": 0.09, "learning_rate": 9.90633373029996e-06, "loss": 1.0147, "step": 3875 }, { "epoch": 0.09, "learning_rate": 9.906261362548201e-06, "loss": 1.1388, "step": 3876 }, { "epoch": 0.09, "learning_rate": 9.906188967115648e-06, "loss": 1.1226, "step": 3877 }, { "epoch": 0.09, "learning_rate": 9.906116544002713e-06, "loss": 1.0843, "step": 3878 }, { "epoch": 0.09, "learning_rate": 9.906044093209801e-06, "loss": 1.045, "step": 3879 }, { "epoch": 0.09, "learning_rate": 9.905971614737321e-06, "loss": 1.1943, "step": 3880 }, { "epoch": 0.09, "learning_rate": 9.905899108585685e-06, "loss": 1.2143, "step": 3881 }, { "epoch": 0.09, "learning_rate": 9.9058265747553e-06, "loss": 1.2416, "step": 3882 }, { "epoch": 0.09, "learning_rate": 9.905754013246572e-06, "loss": 1.1736, "step": 3883 }, { "epoch": 0.09, "learning_rate": 9.905681424059917e-06, "loss": 1.1262, "step": 3884 }, { "epoch": 0.09, "learning_rate": 9.905608807195738e-06, "loss": 1.1579, "step": 3885 }, { "epoch": 0.09, "learning_rate": 9.90553616265445e-06, "loss": 0.9573, "step": 3886 }, { "epoch": 0.09, "learning_rate": 9.90546349043646e-06, "loss": 1.033, "step": 3887 }, { "epoch": 0.09, "learning_rate": 9.905390790542178e-06, "loss": 0.8163, "step": 3888 }, { "epoch": 0.09, "learning_rate": 9.905318062972016e-06, "loss": 1.0524, "step": 3889 }, { "epoch": 0.09, "learning_rate": 9.905245307726383e-06, "loss": 1.1024, "step": 3890 }, { "epoch": 0.09, "learning_rate": 9.905172524805688e-06, "loss": 0.8062, "step": 3891 }, { "epoch": 0.09, "learning_rate": 9.905099714210346e-06, "loss": 1.0252, "step": 3892 }, { "epoch": 0.09, "learning_rate": 9.905026875940762e-06, "loss": 0.9997, "step": 3893 }, { "epoch": 0.09, "learning_rate": 9.904954009997352e-06, "loss": 1.127, "step": 3894 }, { "epoch": 0.09, "learning_rate": 9.904881116380525e-06, "loss": 1.0575, "step": 3895 }, { "epoch": 0.09, "learning_rate": 9.90480819509069e-06, "loss": 1.1432, "step": 3896 }, { "epoch": 0.09, "learning_rate": 9.904735246128265e-06, "loss": 1.0682, "step": 3897 }, { "epoch": 0.09, "learning_rate": 9.904662269493654e-06, "loss": 0.9402, "step": 3898 }, { "epoch": 0.09, "learning_rate": 9.904589265187274e-06, "loss": 1.1624, "step": 3899 }, { "epoch": 0.09, "learning_rate": 9.904516233209534e-06, "loss": 1.199, "step": 3900 }, { "epoch": 0.09, "learning_rate": 9.904443173560848e-06, "loss": 1.0436, "step": 3901 }, { "epoch": 0.09, "learning_rate": 9.904370086241626e-06, "loss": 1.3067, "step": 3902 }, { "epoch": 0.09, "learning_rate": 9.904296971252282e-06, "loss": 0.8983, "step": 3903 }, { "epoch": 0.09, "learning_rate": 9.904223828593228e-06, "loss": 1.0739, "step": 3904 }, { "epoch": 0.09, "learning_rate": 9.904150658264878e-06, "loss": 1.1664, "step": 3905 }, { "epoch": 0.09, "learning_rate": 9.904077460267642e-06, "loss": 1.079, "step": 3906 }, { "epoch": 0.09, "learning_rate": 9.904004234601936e-06, "loss": 1.1623, "step": 3907 }, { "epoch": 0.09, "learning_rate": 9.903930981268171e-06, "loss": 1.1199, "step": 3908 }, { "epoch": 0.09, "learning_rate": 9.903857700266758e-06, "loss": 1.0802, "step": 3909 }, { "epoch": 0.09, "learning_rate": 9.903784391598117e-06, "loss": 1.1216, "step": 3910 }, { "epoch": 0.09, "learning_rate": 9.903711055262659e-06, "loss": 1.3383, "step": 3911 }, { "epoch": 0.09, "learning_rate": 9.903637691260794e-06, "loss": 0.9047, "step": 3912 }, { "epoch": 0.09, "learning_rate": 9.903564299592939e-06, "loss": 0.8312, "step": 3913 }, { "epoch": 0.09, "learning_rate": 9.903490880259509e-06, "loss": 1.2424, "step": 3914 }, { "epoch": 0.09, "learning_rate": 9.903417433260916e-06, "loss": 1.0542, "step": 3915 }, { "epoch": 0.09, "learning_rate": 9.903343958597576e-06, "loss": 1.0149, "step": 3916 }, { "epoch": 0.09, "learning_rate": 9.903270456269903e-06, "loss": 1.2125, "step": 3917 }, { "epoch": 0.09, "learning_rate": 9.903196926278312e-06, "loss": 1.3947, "step": 3918 }, { "epoch": 0.09, "learning_rate": 9.903123368623216e-06, "loss": 1.0963, "step": 3919 }, { "epoch": 0.09, "learning_rate": 9.903049783305032e-06, "loss": 1.1334, "step": 3920 }, { "epoch": 0.09, "learning_rate": 9.902976170324174e-06, "loss": 0.9853, "step": 3921 }, { "epoch": 0.09, "learning_rate": 9.90290252968106e-06, "loss": 0.9947, "step": 3922 }, { "epoch": 0.09, "learning_rate": 9.902828861376101e-06, "loss": 0.9132, "step": 3923 }, { "epoch": 0.09, "learning_rate": 9.902755165409717e-06, "loss": 1.1057, "step": 3924 }, { "epoch": 0.09, "learning_rate": 9.90268144178232e-06, "loss": 0.9783, "step": 3925 }, { "epoch": 0.09, "learning_rate": 9.90260769049433e-06, "loss": 0.9827, "step": 3926 }, { "epoch": 0.09, "learning_rate": 9.902533911546159e-06, "loss": 1.261, "step": 3927 }, { "epoch": 0.09, "learning_rate": 9.902460104938225e-06, "loss": 1.348, "step": 3928 }, { "epoch": 0.09, "learning_rate": 9.902386270670946e-06, "loss": 1.2434, "step": 3929 }, { "epoch": 0.09, "learning_rate": 9.902312408744737e-06, "loss": 1.2134, "step": 3930 }, { "epoch": 0.09, "learning_rate": 9.902238519160014e-06, "loss": 1.1871, "step": 3931 }, { "epoch": 0.09, "learning_rate": 9.902164601917194e-06, "loss": 1.1069, "step": 3932 }, { "epoch": 0.09, "learning_rate": 9.902090657016697e-06, "loss": 1.1246, "step": 3933 }, { "epoch": 0.09, "learning_rate": 9.902016684458937e-06, "loss": 0.9003, "step": 3934 }, { "epoch": 0.09, "learning_rate": 9.901942684244332e-06, "loss": 0.9582, "step": 3935 }, { "epoch": 0.09, "learning_rate": 9.901868656373298e-06, "loss": 1.1457, "step": 3936 }, { "epoch": 0.09, "learning_rate": 9.901794600846258e-06, "loss": 1.1183, "step": 3937 }, { "epoch": 0.09, "learning_rate": 9.901720517663625e-06, "loss": 1.1974, "step": 3938 }, { "epoch": 0.09, "learning_rate": 9.901646406825818e-06, "loss": 1.2333, "step": 3939 }, { "epoch": 0.09, "learning_rate": 9.901572268333255e-06, "loss": 1.0227, "step": 3940 }, { "epoch": 0.09, "learning_rate": 9.901498102186356e-06, "loss": 1.4561, "step": 3941 }, { "epoch": 0.09, "learning_rate": 9.901423908385537e-06, "loss": 1.3971, "step": 3942 }, { "epoch": 0.09, "learning_rate": 9.901349686931217e-06, "loss": 1.0665, "step": 3943 }, { "epoch": 0.09, "learning_rate": 9.901275437823817e-06, "loss": 1.005, "step": 3944 }, { "epoch": 0.09, "learning_rate": 9.901201161063752e-06, "loss": 1.3024, "step": 3945 }, { "epoch": 0.09, "learning_rate": 9.901126856651447e-06, "loss": 0.9328, "step": 3946 }, { "epoch": 0.09, "learning_rate": 9.901052524587314e-06, "loss": 1.0642, "step": 3947 }, { "epoch": 0.09, "learning_rate": 9.900978164871779e-06, "loss": 0.8068, "step": 3948 }, { "epoch": 0.09, "learning_rate": 9.900903777505256e-06, "loss": 1.1472, "step": 3949 }, { "epoch": 0.09, "learning_rate": 9.90082936248817e-06, "loss": 1.3025, "step": 3950 }, { "epoch": 0.09, "learning_rate": 9.900754919820936e-06, "loss": 0.9714, "step": 3951 }, { "epoch": 0.09, "learning_rate": 9.900680449503977e-06, "loss": 1.0657, "step": 3952 }, { "epoch": 0.09, "learning_rate": 9.900605951537712e-06, "loss": 0.9988, "step": 3953 }, { "epoch": 0.09, "learning_rate": 9.900531425922561e-06, "loss": 0.9869, "step": 3954 }, { "epoch": 0.09, "learning_rate": 9.900456872658946e-06, "loss": 0.8653, "step": 3955 }, { "epoch": 0.09, "learning_rate": 9.900382291747285e-06, "loss": 0.9972, "step": 3956 }, { "epoch": 0.09, "learning_rate": 9.900307683188001e-06, "loss": 1.1948, "step": 3957 }, { "epoch": 0.09, "learning_rate": 9.900233046981515e-06, "loss": 0.9685, "step": 3958 }, { "epoch": 0.09, "learning_rate": 9.90015838312825e-06, "loss": 0.9778, "step": 3959 }, { "epoch": 0.09, "learning_rate": 9.900083691628621e-06, "loss": 0.9732, "step": 3960 }, { "epoch": 0.09, "learning_rate": 9.900008972483055e-06, "loss": 0.8711, "step": 3961 }, { "epoch": 0.09, "learning_rate": 9.89993422569197e-06, "loss": 1.0117, "step": 3962 }, { "epoch": 0.09, "learning_rate": 9.89985945125579e-06, "loss": 1.1269, "step": 3963 }, { "epoch": 0.09, "learning_rate": 9.899784649174937e-06, "loss": 0.8546, "step": 3964 }, { "epoch": 0.09, "learning_rate": 9.899709819449832e-06, "loss": 0.9093, "step": 3965 }, { "epoch": 0.09, "learning_rate": 9.899634962080898e-06, "loss": 1.122, "step": 3966 }, { "epoch": 0.09, "learning_rate": 9.899560077068555e-06, "loss": 1.4575, "step": 3967 }, { "epoch": 0.09, "learning_rate": 9.89948516441323e-06, "loss": 1.1068, "step": 3968 }, { "epoch": 0.09, "learning_rate": 9.89941022411534e-06, "loss": 1.0805, "step": 3969 }, { "epoch": 0.09, "learning_rate": 9.899335256175312e-06, "loss": 1.3177, "step": 3970 }, { "epoch": 0.09, "learning_rate": 9.89926026059357e-06, "loss": 0.936, "step": 3971 }, { "epoch": 0.09, "learning_rate": 9.899185237370532e-06, "loss": 1.1199, "step": 3972 }, { "epoch": 0.09, "learning_rate": 9.899110186506625e-06, "loss": 1.1743, "step": 3973 }, { "epoch": 0.09, "learning_rate": 9.899035108002271e-06, "loss": 1.0786, "step": 3974 }, { "epoch": 0.09, "learning_rate": 9.898960001857896e-06, "loss": 1.2016, "step": 3975 }, { "epoch": 0.09, "learning_rate": 9.89888486807392e-06, "loss": 0.9032, "step": 3976 }, { "epoch": 0.09, "learning_rate": 9.898809706650769e-06, "loss": 1.1677, "step": 3977 }, { "epoch": 0.09, "learning_rate": 9.898734517588868e-06, "loss": 0.816, "step": 3978 }, { "epoch": 0.09, "learning_rate": 9.89865930088864e-06, "loss": 1.1382, "step": 3979 }, { "epoch": 0.09, "learning_rate": 9.898584056550508e-06, "loss": 1.285, "step": 3980 }, { "epoch": 0.09, "learning_rate": 9.898508784574898e-06, "loss": 1.0666, "step": 3981 }, { "epoch": 0.09, "learning_rate": 9.898433484962236e-06, "loss": 1.3083, "step": 3982 }, { "epoch": 0.09, "learning_rate": 9.898358157712946e-06, "loss": 1.1929, "step": 3983 }, { "epoch": 0.09, "learning_rate": 9.89828280282745e-06, "loss": 1.0175, "step": 3984 }, { "epoch": 0.09, "learning_rate": 9.898207420306177e-06, "loss": 1.1383, "step": 3985 }, { "epoch": 0.09, "learning_rate": 9.89813201014955e-06, "loss": 1.0782, "step": 3986 }, { "epoch": 0.09, "learning_rate": 9.898056572357997e-06, "loss": 1.3638, "step": 3987 }, { "epoch": 0.09, "learning_rate": 9.897981106931942e-06, "loss": 1.2599, "step": 3988 }, { "epoch": 0.09, "learning_rate": 9.89790561387181e-06, "loss": 1.2835, "step": 3989 }, { "epoch": 0.09, "learning_rate": 9.897830093178026e-06, "loss": 1.3358, "step": 3990 }, { "epoch": 0.09, "learning_rate": 9.89775454485102e-06, "loss": 0.9444, "step": 3991 }, { "epoch": 0.09, "learning_rate": 9.897678968891215e-06, "loss": 1.1731, "step": 3992 }, { "epoch": 0.09, "learning_rate": 9.89760336529904e-06, "loss": 0.976, "step": 3993 }, { "epoch": 0.09, "learning_rate": 9.897527734074919e-06, "loss": 1.3302, "step": 3994 }, { "epoch": 0.09, "learning_rate": 9.897452075219279e-06, "loss": 1.2463, "step": 3995 }, { "epoch": 0.09, "learning_rate": 9.897376388732548e-06, "loss": 1.3046, "step": 3996 }, { "epoch": 0.09, "learning_rate": 9.897300674615152e-06, "loss": 1.0133, "step": 3997 }, { "epoch": 0.09, "learning_rate": 9.89722493286752e-06, "loss": 0.9659, "step": 3998 }, { "epoch": 0.09, "learning_rate": 9.897149163490076e-06, "loss": 1.1738, "step": 3999 }, { "epoch": 0.09, "learning_rate": 9.897073366483252e-06, "loss": 0.846, "step": 4000 }, { "epoch": 0.09, "learning_rate": 9.896997541847471e-06, "loss": 1.1175, "step": 4001 }, { "epoch": 0.09, "learning_rate": 9.896921689583164e-06, "loss": 1.2718, "step": 4002 }, { "epoch": 0.09, "learning_rate": 9.896845809690759e-06, "loss": 1.2831, "step": 4003 }, { "epoch": 0.09, "learning_rate": 9.89676990217068e-06, "loss": 1.0038, "step": 4004 }, { "epoch": 0.09, "learning_rate": 9.89669396702336e-06, "loss": 1.0949, "step": 4005 }, { "epoch": 0.09, "learning_rate": 9.896618004249226e-06, "loss": 1.0228, "step": 4006 }, { "epoch": 0.09, "learning_rate": 9.896542013848707e-06, "loss": 1.1873, "step": 4007 }, { "epoch": 0.09, "learning_rate": 9.89646599582223e-06, "loss": 0.8941, "step": 4008 }, { "epoch": 0.09, "learning_rate": 9.896389950170224e-06, "loss": 1.0505, "step": 4009 }, { "epoch": 0.09, "learning_rate": 9.89631387689312e-06, "loss": 0.8457, "step": 4010 }, { "epoch": 0.09, "learning_rate": 9.896237775991347e-06, "loss": 1.1795, "step": 4011 }, { "epoch": 0.09, "learning_rate": 9.896161647465332e-06, "loss": 1.0484, "step": 4012 }, { "epoch": 0.09, "learning_rate": 9.896085491315509e-06, "loss": 0.7272, "step": 4013 }, { "epoch": 0.09, "learning_rate": 9.8960093075423e-06, "loss": 1.0814, "step": 4014 }, { "epoch": 0.09, "learning_rate": 9.895933096146142e-06, "loss": 1.137, "step": 4015 }, { "epoch": 0.09, "learning_rate": 9.895856857127463e-06, "loss": 0.9167, "step": 4016 }, { "epoch": 0.09, "learning_rate": 9.895780590486693e-06, "loss": 1.2267, "step": 4017 }, { "epoch": 0.09, "learning_rate": 9.89570429622426e-06, "loss": 0.9393, "step": 4018 }, { "epoch": 0.09, "learning_rate": 9.895627974340598e-06, "loss": 1.0112, "step": 4019 }, { "epoch": 0.09, "learning_rate": 9.895551624836135e-06, "loss": 0.8014, "step": 4020 }, { "epoch": 0.09, "learning_rate": 9.895475247711301e-06, "loss": 1.3464, "step": 4021 }, { "epoch": 0.09, "learning_rate": 9.895398842966531e-06, "loss": 0.8393, "step": 4022 }, { "epoch": 0.09, "learning_rate": 9.895322410602254e-06, "loss": 0.9805, "step": 4023 }, { "epoch": 0.09, "learning_rate": 9.8952459506189e-06, "loss": 1.0285, "step": 4024 }, { "epoch": 0.09, "learning_rate": 9.895169463016903e-06, "loss": 1.3918, "step": 4025 }, { "epoch": 0.09, "learning_rate": 9.89509294779669e-06, "loss": 0.9491, "step": 4026 }, { "epoch": 0.09, "learning_rate": 9.895016404958696e-06, "loss": 1.222, "step": 4027 }, { "epoch": 0.09, "learning_rate": 9.894939834503354e-06, "loss": 1.012, "step": 4028 }, { "epoch": 0.09, "learning_rate": 9.894863236431095e-06, "loss": 0.9429, "step": 4029 }, { "epoch": 0.09, "learning_rate": 9.894786610742348e-06, "loss": 1.191, "step": 4030 }, { "epoch": 0.09, "learning_rate": 9.894709957437551e-06, "loss": 1.0803, "step": 4031 }, { "epoch": 0.09, "learning_rate": 9.894633276517132e-06, "loss": 0.9627, "step": 4032 }, { "epoch": 0.09, "learning_rate": 9.894556567981524e-06, "loss": 1.1209, "step": 4033 }, { "epoch": 0.09, "learning_rate": 9.894479831831161e-06, "loss": 1.08, "step": 4034 }, { "epoch": 0.09, "learning_rate": 9.894403068066476e-06, "loss": 1.1857, "step": 4035 }, { "epoch": 0.09, "learning_rate": 9.894326276687902e-06, "loss": 1.089, "step": 4036 }, { "epoch": 0.09, "learning_rate": 9.894249457695873e-06, "loss": 0.9456, "step": 4037 }, { "epoch": 0.09, "learning_rate": 9.89417261109082e-06, "loss": 1.1756, "step": 4038 }, { "epoch": 0.09, "learning_rate": 9.894095736873177e-06, "loss": 1.2878, "step": 4039 }, { "epoch": 0.09, "learning_rate": 9.894018835043382e-06, "loss": 1.0444, "step": 4040 }, { "epoch": 0.09, "learning_rate": 9.893941905601863e-06, "loss": 0.9713, "step": 4041 }, { "epoch": 0.09, "learning_rate": 9.893864948549057e-06, "loss": 1.0437, "step": 4042 }, { "epoch": 0.09, "learning_rate": 9.893787963885399e-06, "loss": 0.8506, "step": 4043 }, { "epoch": 0.09, "learning_rate": 9.893710951611322e-06, "loss": 0.9661, "step": 4044 }, { "epoch": 0.09, "learning_rate": 9.89363391172726e-06, "loss": 1.2079, "step": 4045 }, { "epoch": 0.09, "learning_rate": 9.893556844233648e-06, "loss": 1.1124, "step": 4046 }, { "epoch": 0.09, "learning_rate": 9.893479749130923e-06, "loss": 1.1071, "step": 4047 }, { "epoch": 0.09, "learning_rate": 9.893402626419516e-06, "loss": 1.1215, "step": 4048 }, { "epoch": 0.09, "learning_rate": 9.893325476099865e-06, "loss": 1.1972, "step": 4049 }, { "epoch": 0.09, "learning_rate": 9.893248298172404e-06, "loss": 1.0521, "step": 4050 }, { "epoch": 0.09, "learning_rate": 9.89317109263757e-06, "loss": 1.0536, "step": 4051 }, { "epoch": 0.09, "learning_rate": 9.893093859495796e-06, "loss": 1.2263, "step": 4052 }, { "epoch": 0.09, "learning_rate": 9.893016598747521e-06, "loss": 1.1748, "step": 4053 }, { "epoch": 0.09, "learning_rate": 9.892939310393179e-06, "loss": 0.8719, "step": 4054 }, { "epoch": 0.09, "learning_rate": 9.892861994433205e-06, "loss": 1.0166, "step": 4055 }, { "epoch": 0.09, "learning_rate": 9.892784650868037e-06, "loss": 1.1528, "step": 4056 }, { "epoch": 0.09, "learning_rate": 9.892707279698111e-06, "loss": 1.1131, "step": 4057 }, { "epoch": 0.09, "learning_rate": 9.892629880923864e-06, "loss": 0.9028, "step": 4058 }, { "epoch": 0.09, "learning_rate": 9.892552454545731e-06, "loss": 1.3406, "step": 4059 }, { "epoch": 0.09, "learning_rate": 9.89247500056415e-06, "loss": 1.0462, "step": 4060 }, { "epoch": 0.09, "learning_rate": 9.892397518979557e-06, "loss": 1.0654, "step": 4061 }, { "epoch": 0.09, "learning_rate": 9.892320009792392e-06, "loss": 0.9912, "step": 4062 }, { "epoch": 0.09, "learning_rate": 9.89224247300309e-06, "loss": 1.0633, "step": 4063 }, { "epoch": 0.09, "learning_rate": 9.892164908612088e-06, "loss": 1.0278, "step": 4064 }, { "epoch": 0.09, "learning_rate": 9.892087316619822e-06, "loss": 1.0966, "step": 4065 }, { "epoch": 0.09, "learning_rate": 9.892009697026737e-06, "loss": 1.1762, "step": 4066 }, { "epoch": 0.09, "learning_rate": 9.89193204983326e-06, "loss": 1.1929, "step": 4067 }, { "epoch": 0.09, "learning_rate": 9.891854375039841e-06, "loss": 0.8423, "step": 4068 }, { "epoch": 0.09, "learning_rate": 9.89177667264691e-06, "loss": 1.1096, "step": 4069 }, { "epoch": 0.09, "learning_rate": 9.891698942654908e-06, "loss": 0.9561, "step": 4070 }, { "epoch": 0.09, "learning_rate": 9.891621185064272e-06, "loss": 0.9905, "step": 4071 }, { "epoch": 0.09, "learning_rate": 9.891543399875445e-06, "loss": 0.9333, "step": 4072 }, { "epoch": 0.09, "learning_rate": 9.89146558708886e-06, "loss": 1.0406, "step": 4073 }, { "epoch": 0.09, "learning_rate": 9.891387746704959e-06, "loss": 1.4235, "step": 4074 }, { "epoch": 0.09, "learning_rate": 9.891309878724183e-06, "loss": 0.963, "step": 4075 }, { "epoch": 0.09, "learning_rate": 9.891231983146967e-06, "loss": 0.8455, "step": 4076 }, { "epoch": 0.09, "learning_rate": 9.891154059973755e-06, "loss": 0.7672, "step": 4077 }, { "epoch": 0.09, "learning_rate": 9.891076109204982e-06, "loss": 0.9356, "step": 4078 }, { "epoch": 0.09, "learning_rate": 9.890998130841093e-06, "loss": 1.0641, "step": 4079 }, { "epoch": 0.09, "learning_rate": 9.890920124882523e-06, "loss": 0.9881, "step": 4080 }, { "epoch": 0.09, "learning_rate": 9.890842091329715e-06, "loss": 1.0599, "step": 4081 }, { "epoch": 0.09, "learning_rate": 9.89076403018311e-06, "loss": 1.4075, "step": 4082 }, { "epoch": 0.09, "learning_rate": 9.890685941443145e-06, "loss": 1.0903, "step": 4083 }, { "epoch": 0.09, "learning_rate": 9.890607825110265e-06, "loss": 0.9561, "step": 4084 }, { "epoch": 0.09, "learning_rate": 9.890529681184906e-06, "loss": 0.9181, "step": 4085 }, { "epoch": 0.09, "learning_rate": 9.890451509667513e-06, "loss": 1.3729, "step": 4086 }, { "epoch": 0.09, "learning_rate": 9.890373310558524e-06, "loss": 1.1368, "step": 4087 }, { "epoch": 0.09, "learning_rate": 9.890295083858382e-06, "loss": 0.8978, "step": 4088 }, { "epoch": 0.09, "learning_rate": 9.890216829567527e-06, "loss": 1.0552, "step": 4089 }, { "epoch": 0.09, "learning_rate": 9.890138547686402e-06, "loss": 0.9726, "step": 4090 }, { "epoch": 0.09, "learning_rate": 9.890060238215447e-06, "loss": 1.1074, "step": 4091 }, { "epoch": 0.09, "learning_rate": 9.889981901155105e-06, "loss": 1.1846, "step": 4092 }, { "epoch": 0.09, "learning_rate": 9.88990353650582e-06, "loss": 0.9965, "step": 4093 }, { "epoch": 0.09, "learning_rate": 9.889825144268029e-06, "loss": 0.9435, "step": 4094 }, { "epoch": 0.09, "learning_rate": 9.88974672444218e-06, "loss": 1.0513, "step": 4095 }, { "epoch": 0.09, "learning_rate": 9.88966827702871e-06, "loss": 0.973, "step": 4096 }, { "epoch": 0.1, "learning_rate": 9.889589802028065e-06, "loss": 0.87, "step": 4097 }, { "epoch": 0.1, "learning_rate": 9.889511299440686e-06, "loss": 1.1237, "step": 4098 }, { "epoch": 0.1, "learning_rate": 9.889432769267018e-06, "loss": 0.9368, "step": 4099 }, { "epoch": 0.1, "learning_rate": 9.889354211507503e-06, "loss": 1.1945, "step": 4100 }, { "epoch": 0.1, "learning_rate": 9.889275626162583e-06, "loss": 0.9292, "step": 4101 }, { "epoch": 0.1, "learning_rate": 9.889197013232703e-06, "loss": 1.0399, "step": 4102 }, { "epoch": 0.1, "learning_rate": 9.889118372718308e-06, "loss": 0.8965, "step": 4103 }, { "epoch": 0.1, "learning_rate": 9.889039704619837e-06, "loss": 1.1551, "step": 4104 }, { "epoch": 0.1, "learning_rate": 9.888961008937737e-06, "loss": 0.9668, "step": 4105 }, { "epoch": 0.1, "learning_rate": 9.888882285672451e-06, "loss": 1.0705, "step": 4106 }, { "epoch": 0.1, "learning_rate": 9.888803534824425e-06, "loss": 1.1881, "step": 4107 }, { "epoch": 0.1, "learning_rate": 9.888724756394104e-06, "loss": 1.0711, "step": 4108 }, { "epoch": 0.1, "learning_rate": 9.888645950381928e-06, "loss": 1.2945, "step": 4109 }, { "epoch": 0.1, "learning_rate": 9.888567116788344e-06, "loss": 1.0858, "step": 4110 }, { "epoch": 0.1, "learning_rate": 9.888488255613797e-06, "loss": 0.7731, "step": 4111 }, { "epoch": 0.1, "learning_rate": 9.88840936685873e-06, "loss": 0.7935, "step": 4112 }, { "epoch": 0.1, "learning_rate": 9.888330450523593e-06, "loss": 1.0679, "step": 4113 }, { "epoch": 0.1, "learning_rate": 9.888251506608828e-06, "loss": 0.9075, "step": 4114 }, { "epoch": 0.1, "learning_rate": 9.888172535114878e-06, "loss": 1.0257, "step": 4115 }, { "epoch": 0.1, "learning_rate": 9.888093536042192e-06, "loss": 1.3304, "step": 4116 }, { "epoch": 0.1, "learning_rate": 9.888014509391216e-06, "loss": 1.352, "step": 4117 }, { "epoch": 0.1, "learning_rate": 9.887935455162393e-06, "loss": 1.2752, "step": 4118 }, { "epoch": 0.1, "learning_rate": 9.887856373356172e-06, "loss": 1.3623, "step": 4119 }, { "epoch": 0.1, "learning_rate": 9.887777263972998e-06, "loss": 0.8469, "step": 4120 }, { "epoch": 0.1, "learning_rate": 9.887698127013315e-06, "loss": 0.9765, "step": 4121 }, { "epoch": 0.1, "learning_rate": 9.887618962477572e-06, "loss": 0.862, "step": 4122 }, { "epoch": 0.1, "learning_rate": 9.887539770366218e-06, "loss": 1.1958, "step": 4123 }, { "epoch": 0.1, "learning_rate": 9.887460550679696e-06, "loss": 1.0707, "step": 4124 }, { "epoch": 0.1, "learning_rate": 9.887381303418453e-06, "loss": 1.0628, "step": 4125 }, { "epoch": 0.1, "learning_rate": 9.887302028582937e-06, "loss": 1.1911, "step": 4126 }, { "epoch": 0.1, "learning_rate": 9.887222726173595e-06, "loss": 1.062, "step": 4127 }, { "epoch": 0.1, "learning_rate": 9.887143396190877e-06, "loss": 1.4385, "step": 4128 }, { "epoch": 0.1, "learning_rate": 9.887064038635226e-06, "loss": 1.0543, "step": 4129 }, { "epoch": 0.1, "learning_rate": 9.886984653507093e-06, "loss": 1.1635, "step": 4130 }, { "epoch": 0.1, "learning_rate": 9.886905240806926e-06, "loss": 1.0794, "step": 4131 }, { "epoch": 0.1, "learning_rate": 9.886825800535172e-06, "loss": 1.1184, "step": 4132 }, { "epoch": 0.1, "learning_rate": 9.886746332692277e-06, "loss": 1.2268, "step": 4133 }, { "epoch": 0.1, "learning_rate": 9.886666837278694e-06, "loss": 1.131, "step": 4134 }, { "epoch": 0.1, "learning_rate": 9.886587314294867e-06, "loss": 0.9431, "step": 4135 }, { "epoch": 0.1, "learning_rate": 9.886507763741248e-06, "loss": 1.2009, "step": 4136 }, { "epoch": 0.1, "learning_rate": 9.886428185618284e-06, "loss": 1.184, "step": 4137 }, { "epoch": 0.1, "learning_rate": 9.886348579926425e-06, "loss": 1.143, "step": 4138 }, { "epoch": 0.1, "learning_rate": 9.88626894666612e-06, "loss": 1.1308, "step": 4139 }, { "epoch": 0.1, "learning_rate": 9.886189285837818e-06, "loss": 0.9705, "step": 4140 }, { "epoch": 0.1, "learning_rate": 9.886109597441968e-06, "loss": 1.1202, "step": 4141 }, { "epoch": 0.1, "learning_rate": 9.88602988147902e-06, "loss": 1.1003, "step": 4142 }, { "epoch": 0.1, "learning_rate": 9.885950137949425e-06, "loss": 0.9121, "step": 4143 }, { "epoch": 0.1, "learning_rate": 9.88587036685363e-06, "loss": 0.8833, "step": 4144 }, { "epoch": 0.1, "learning_rate": 9.885790568192087e-06, "loss": 1.2659, "step": 4145 }, { "epoch": 0.1, "learning_rate": 9.885710741965246e-06, "loss": 1.1116, "step": 4146 }, { "epoch": 0.1, "learning_rate": 9.885630888173559e-06, "loss": 1.0479, "step": 4147 }, { "epoch": 0.1, "learning_rate": 9.885551006817472e-06, "loss": 1.0698, "step": 4148 }, { "epoch": 0.1, "learning_rate": 9.88547109789744e-06, "loss": 1.0524, "step": 4149 }, { "epoch": 0.1, "learning_rate": 9.885391161413913e-06, "loss": 1.0389, "step": 4150 }, { "epoch": 0.1, "learning_rate": 9.88531119736734e-06, "loss": 1.0128, "step": 4151 }, { "epoch": 0.1, "learning_rate": 9.885231205758175e-06, "loss": 0.8722, "step": 4152 }, { "epoch": 0.1, "learning_rate": 9.885151186586865e-06, "loss": 0.8356, "step": 4153 }, { "epoch": 0.1, "learning_rate": 9.885071139853868e-06, "loss": 1.0332, "step": 4154 }, { "epoch": 0.1, "learning_rate": 9.88499106555963e-06, "loss": 0.8632, "step": 4155 }, { "epoch": 0.1, "learning_rate": 9.884910963704604e-06, "loss": 0.997, "step": 4156 }, { "epoch": 0.1, "learning_rate": 9.884830834289244e-06, "loss": 1.0675, "step": 4157 }, { "epoch": 0.1, "learning_rate": 9.884750677314e-06, "loss": 1.0744, "step": 4158 }, { "epoch": 0.1, "learning_rate": 9.884670492779325e-06, "loss": 0.973, "step": 4159 }, { "epoch": 0.1, "learning_rate": 9.884590280685671e-06, "loss": 0.9373, "step": 4160 }, { "epoch": 0.1, "learning_rate": 9.884510041033492e-06, "loss": 1.0899, "step": 4161 }, { "epoch": 0.1, "learning_rate": 9.884429773823238e-06, "loss": 1.1523, "step": 4162 }, { "epoch": 0.1, "learning_rate": 9.884349479055365e-06, "loss": 0.8237, "step": 4163 }, { "epoch": 0.1, "learning_rate": 9.884269156730324e-06, "loss": 1.1092, "step": 4164 }, { "epoch": 0.1, "learning_rate": 9.884188806848569e-06, "loss": 1.0017, "step": 4165 }, { "epoch": 0.1, "learning_rate": 9.884108429410553e-06, "loss": 1.1282, "step": 4166 }, { "epoch": 0.1, "learning_rate": 9.884028024416728e-06, "loss": 1.182, "step": 4167 }, { "epoch": 0.1, "learning_rate": 9.88394759186755e-06, "loss": 0.8772, "step": 4168 }, { "epoch": 0.1, "learning_rate": 9.883867131763473e-06, "loss": 1.1407, "step": 4169 }, { "epoch": 0.1, "learning_rate": 9.88378664410495e-06, "loss": 1.1418, "step": 4170 }, { "epoch": 0.1, "learning_rate": 9.883706128892432e-06, "loss": 1.2921, "step": 4171 }, { "epoch": 0.1, "learning_rate": 9.883625586126377e-06, "loss": 1.0924, "step": 4172 }, { "epoch": 0.1, "learning_rate": 9.883545015807242e-06, "loss": 1.0928, "step": 4173 }, { "epoch": 0.1, "learning_rate": 9.883464417935475e-06, "loss": 0.9551, "step": 4174 }, { "epoch": 0.1, "learning_rate": 9.883383792511533e-06, "loss": 0.9962, "step": 4175 }, { "epoch": 0.1, "learning_rate": 9.883303139535875e-06, "loss": 1.2802, "step": 4176 }, { "epoch": 0.1, "learning_rate": 9.88322245900895e-06, "loss": 1.174, "step": 4177 }, { "epoch": 0.1, "learning_rate": 9.883141750931217e-06, "loss": 0.8687, "step": 4178 }, { "epoch": 0.1, "learning_rate": 9.883061015303133e-06, "loss": 0.9187, "step": 4179 }, { "epoch": 0.1, "learning_rate": 9.882980252125147e-06, "loss": 1.2024, "step": 4180 }, { "epoch": 0.1, "learning_rate": 9.882899461397722e-06, "loss": 1.4422, "step": 4181 }, { "epoch": 0.1, "learning_rate": 9.882818643121307e-06, "loss": 0.9619, "step": 4182 }, { "epoch": 0.1, "learning_rate": 9.882737797296364e-06, "loss": 1.1356, "step": 4183 }, { "epoch": 0.1, "learning_rate": 9.882656923923346e-06, "loss": 1.1269, "step": 4184 }, { "epoch": 0.1, "learning_rate": 9.882576023002708e-06, "loss": 1.2107, "step": 4185 }, { "epoch": 0.1, "learning_rate": 9.88249509453491e-06, "loss": 1.091, "step": 4186 }, { "epoch": 0.1, "learning_rate": 9.882414138520406e-06, "loss": 1.2955, "step": 4187 }, { "epoch": 0.1, "learning_rate": 9.882333154959654e-06, "loss": 0.9619, "step": 4188 }, { "epoch": 0.1, "learning_rate": 9.88225214385311e-06, "loss": 0.9379, "step": 4189 }, { "epoch": 0.1, "learning_rate": 9.882171105201232e-06, "loss": 1.1945, "step": 4190 }, { "epoch": 0.1, "learning_rate": 9.882090039004475e-06, "loss": 0.984, "step": 4191 }, { "epoch": 0.1, "learning_rate": 9.8820089452633e-06, "loss": 1.1433, "step": 4192 }, { "epoch": 0.1, "learning_rate": 9.881927823978164e-06, "loss": 1.1734, "step": 4193 }, { "epoch": 0.1, "learning_rate": 9.88184667514952e-06, "loss": 1.0612, "step": 4194 }, { "epoch": 0.1, "learning_rate": 9.881765498777831e-06, "loss": 1.0459, "step": 4195 }, { "epoch": 0.1, "learning_rate": 9.881684294863552e-06, "loss": 1.2647, "step": 4196 }, { "epoch": 0.1, "learning_rate": 9.881603063407144e-06, "loss": 1.0784, "step": 4197 }, { "epoch": 0.1, "learning_rate": 9.881521804409063e-06, "loss": 0.9666, "step": 4198 }, { "epoch": 0.1, "learning_rate": 9.881440517869765e-06, "loss": 0.8453, "step": 4199 }, { "epoch": 0.1, "learning_rate": 9.881359203789716e-06, "loss": 1.0239, "step": 4200 }, { "epoch": 0.1, "learning_rate": 9.881277862169367e-06, "loss": 1.0954, "step": 4201 }, { "epoch": 0.1, "learning_rate": 9.881196493009181e-06, "loss": 1.059, "step": 4202 }, { "epoch": 0.1, "learning_rate": 9.881115096309618e-06, "loss": 1.2307, "step": 4203 }, { "epoch": 0.1, "learning_rate": 9.881033672071136e-06, "loss": 0.717, "step": 4204 }, { "epoch": 0.1, "learning_rate": 9.880952220294192e-06, "loss": 0.9285, "step": 4205 }, { "epoch": 0.1, "learning_rate": 9.880870740979249e-06, "loss": 1.3136, "step": 4206 }, { "epoch": 0.1, "learning_rate": 9.880789234126764e-06, "loss": 1.0836, "step": 4207 }, { "epoch": 0.1, "learning_rate": 9.8807076997372e-06, "loss": 0.9384, "step": 4208 }, { "epoch": 0.1, "learning_rate": 9.880626137811013e-06, "loss": 1.0259, "step": 4209 }, { "epoch": 0.1, "learning_rate": 9.880544548348667e-06, "loss": 1.1061, "step": 4210 }, { "epoch": 0.1, "learning_rate": 9.880462931350619e-06, "loss": 1.0606, "step": 4211 }, { "epoch": 0.1, "learning_rate": 9.880381286817334e-06, "loss": 1.015, "step": 4212 }, { "epoch": 0.1, "learning_rate": 9.880299614749267e-06, "loss": 0.8893, "step": 4213 }, { "epoch": 0.1, "learning_rate": 9.880217915146882e-06, "loss": 1.0848, "step": 4214 }, { "epoch": 0.1, "learning_rate": 9.880136188010639e-06, "loss": 1.1678, "step": 4215 }, { "epoch": 0.1, "learning_rate": 9.880054433341e-06, "loss": 1.0003, "step": 4216 }, { "epoch": 0.1, "learning_rate": 9.879972651138428e-06, "loss": 1.1341, "step": 4217 }, { "epoch": 0.1, "learning_rate": 9.87989084140338e-06, "loss": 1.4147, "step": 4218 }, { "epoch": 0.1, "learning_rate": 9.87980900413632e-06, "loss": 0.9684, "step": 4219 }, { "epoch": 0.1, "learning_rate": 9.87972713933771e-06, "loss": 0.9546, "step": 4220 }, { "epoch": 0.1, "learning_rate": 9.87964524700801e-06, "loss": 1.0424, "step": 4221 }, { "epoch": 0.1, "learning_rate": 9.879563327147685e-06, "loss": 0.9151, "step": 4222 }, { "epoch": 0.1, "learning_rate": 9.879481379757197e-06, "loss": 1.141, "step": 4223 }, { "epoch": 0.1, "learning_rate": 9.879399404837005e-06, "loss": 1.2432, "step": 4224 }, { "epoch": 0.1, "learning_rate": 9.879317402387572e-06, "loss": 1.0238, "step": 4225 }, { "epoch": 0.1, "learning_rate": 9.879235372409364e-06, "loss": 1.0396, "step": 4226 }, { "epoch": 0.1, "learning_rate": 9.879153314902841e-06, "loss": 1.0348, "step": 4227 }, { "epoch": 0.1, "learning_rate": 9.87907122986847e-06, "loss": 0.9853, "step": 4228 }, { "epoch": 0.1, "learning_rate": 9.878989117306707e-06, "loss": 0.9398, "step": 4229 }, { "epoch": 0.1, "learning_rate": 9.878906977218021e-06, "loss": 1.3225, "step": 4230 }, { "epoch": 0.1, "learning_rate": 9.878824809602873e-06, "loss": 1.0848, "step": 4231 }, { "epoch": 0.1, "learning_rate": 9.878742614461728e-06, "loss": 0.8372, "step": 4232 }, { "epoch": 0.1, "learning_rate": 9.87866039179505e-06, "loss": 1.4483, "step": 4233 }, { "epoch": 0.1, "learning_rate": 9.8785781416033e-06, "loss": 1.0864, "step": 4234 }, { "epoch": 0.1, "learning_rate": 9.878495863886945e-06, "loss": 1.1141, "step": 4235 }, { "epoch": 0.1, "learning_rate": 9.878413558646447e-06, "loss": 1.16, "step": 4236 }, { "epoch": 0.1, "learning_rate": 9.878331225882272e-06, "loss": 1.2843, "step": 4237 }, { "epoch": 0.1, "learning_rate": 9.878248865594886e-06, "loss": 0.8971, "step": 4238 }, { "epoch": 0.1, "learning_rate": 9.87816647778475e-06, "loss": 1.1681, "step": 4239 }, { "epoch": 0.1, "learning_rate": 9.878084062452331e-06, "loss": 1.0511, "step": 4240 }, { "epoch": 0.1, "learning_rate": 9.878001619598093e-06, "loss": 0.9293, "step": 4241 }, { "epoch": 0.1, "learning_rate": 9.877919149222502e-06, "loss": 0.941, "step": 4242 }, { "epoch": 0.1, "learning_rate": 9.877836651326023e-06, "loss": 0.96, "step": 4243 }, { "epoch": 0.1, "learning_rate": 9.87775412590912e-06, "loss": 1.0842, "step": 4244 }, { "epoch": 0.1, "learning_rate": 9.877671572972262e-06, "loss": 1.1271, "step": 4245 }, { "epoch": 0.1, "learning_rate": 9.877588992515912e-06, "loss": 1.0836, "step": 4246 }, { "epoch": 0.1, "learning_rate": 9.877506384540537e-06, "loss": 0.8482, "step": 4247 }, { "epoch": 0.1, "learning_rate": 9.877423749046601e-06, "loss": 1.119, "step": 4248 }, { "epoch": 0.1, "learning_rate": 9.877341086034575e-06, "loss": 0.8711, "step": 4249 }, { "epoch": 0.1, "learning_rate": 9.87725839550492e-06, "loss": 1.267, "step": 4250 }, { "epoch": 0.1, "learning_rate": 9.877175677458106e-06, "loss": 1.0679, "step": 4251 }, { "epoch": 0.1, "learning_rate": 9.877092931894599e-06, "loss": 0.9242, "step": 4252 }, { "epoch": 0.1, "learning_rate": 9.877010158814864e-06, "loss": 1.0366, "step": 4253 }, { "epoch": 0.1, "learning_rate": 9.87692735821937e-06, "loss": 0.9802, "step": 4254 }, { "epoch": 0.1, "learning_rate": 9.876844530108584e-06, "loss": 1.0889, "step": 4255 }, { "epoch": 0.1, "learning_rate": 9.876761674482973e-06, "loss": 1.0262, "step": 4256 }, { "epoch": 0.1, "learning_rate": 9.876678791343004e-06, "loss": 1.1567, "step": 4257 }, { "epoch": 0.1, "learning_rate": 9.876595880689143e-06, "loss": 1.15, "step": 4258 }, { "epoch": 0.1, "learning_rate": 9.876512942521864e-06, "loss": 1.0316, "step": 4259 }, { "epoch": 0.1, "learning_rate": 9.876429976841628e-06, "loss": 1.3047, "step": 4260 }, { "epoch": 0.1, "learning_rate": 9.876346983648906e-06, "loss": 1.1002, "step": 4261 }, { "epoch": 0.1, "learning_rate": 9.876263962944166e-06, "loss": 0.9725, "step": 4262 }, { "epoch": 0.1, "learning_rate": 9.876180914727875e-06, "loss": 0.8243, "step": 4263 }, { "epoch": 0.1, "learning_rate": 9.876097839000505e-06, "loss": 1.1138, "step": 4264 }, { "epoch": 0.1, "learning_rate": 9.876014735762522e-06, "loss": 1.3227, "step": 4265 }, { "epoch": 0.1, "learning_rate": 9.875931605014395e-06, "loss": 1.0389, "step": 4266 }, { "epoch": 0.1, "learning_rate": 9.875848446756595e-06, "loss": 0.9039, "step": 4267 }, { "epoch": 0.1, "learning_rate": 9.87576526098959e-06, "loss": 1.2172, "step": 4268 }, { "epoch": 0.1, "learning_rate": 9.875682047713847e-06, "loss": 1.0288, "step": 4269 }, { "epoch": 0.1, "learning_rate": 9.875598806929837e-06, "loss": 0.9858, "step": 4270 }, { "epoch": 0.1, "learning_rate": 9.875515538638033e-06, "loss": 1.2923, "step": 4271 }, { "epoch": 0.1, "learning_rate": 9.8754322428389e-06, "loss": 0.9749, "step": 4272 }, { "epoch": 0.1, "learning_rate": 9.875348919532913e-06, "loss": 1.1745, "step": 4273 }, { "epoch": 0.1, "learning_rate": 9.875265568720536e-06, "loss": 1.2525, "step": 4274 }, { "epoch": 0.1, "learning_rate": 9.875182190402241e-06, "loss": 0.8877, "step": 4275 }, { "epoch": 0.1, "learning_rate": 9.875098784578504e-06, "loss": 1.0016, "step": 4276 }, { "epoch": 0.1, "learning_rate": 9.875015351249786e-06, "loss": 0.6903, "step": 4277 }, { "epoch": 0.1, "learning_rate": 9.874931890416568e-06, "loss": 0.9707, "step": 4278 }, { "epoch": 0.1, "learning_rate": 9.874848402079312e-06, "loss": 0.9392, "step": 4279 }, { "epoch": 0.1, "learning_rate": 9.874764886238495e-06, "loss": 1.0965, "step": 4280 }, { "epoch": 0.1, "learning_rate": 9.874681342894585e-06, "loss": 1.0715, "step": 4281 }, { "epoch": 0.1, "learning_rate": 9.874597772048055e-06, "loss": 1.1319, "step": 4282 }, { "epoch": 0.1, "learning_rate": 9.874514173699376e-06, "loss": 1.055, "step": 4283 }, { "epoch": 0.1, "learning_rate": 9.874430547849022e-06, "loss": 1.2788, "step": 4284 }, { "epoch": 0.1, "learning_rate": 9.874346894497459e-06, "loss": 1.2029, "step": 4285 }, { "epoch": 0.1, "learning_rate": 9.874263213645164e-06, "loss": 0.8449, "step": 4286 }, { "epoch": 0.1, "learning_rate": 9.874179505292606e-06, "loss": 0.9644, "step": 4287 }, { "epoch": 0.1, "learning_rate": 9.87409576944026e-06, "loss": 1.1108, "step": 4288 }, { "epoch": 0.1, "learning_rate": 9.874012006088595e-06, "loss": 1.2904, "step": 4289 }, { "epoch": 0.1, "learning_rate": 9.873928215238089e-06, "loss": 0.847, "step": 4290 }, { "epoch": 0.1, "learning_rate": 9.87384439688921e-06, "loss": 1.0292, "step": 4291 }, { "epoch": 0.1, "learning_rate": 9.873760551042433e-06, "loss": 1.1903, "step": 4292 }, { "epoch": 0.1, "learning_rate": 9.87367667769823e-06, "loss": 0.7734, "step": 4293 }, { "epoch": 0.1, "learning_rate": 9.873592776857075e-06, "loss": 1.0251, "step": 4294 }, { "epoch": 0.1, "learning_rate": 9.87350884851944e-06, "loss": 1.1201, "step": 4295 }, { "epoch": 0.1, "learning_rate": 9.8734248926858e-06, "loss": 0.67, "step": 4296 }, { "epoch": 0.1, "learning_rate": 9.87334090935663e-06, "loss": 1.1603, "step": 4297 }, { "epoch": 0.1, "learning_rate": 9.8732568985324e-06, "loss": 1.0531, "step": 4298 }, { "epoch": 0.1, "learning_rate": 9.873172860213587e-06, "loss": 1.038, "step": 4299 }, { "epoch": 0.1, "learning_rate": 9.873088794400665e-06, "loss": 1.2409, "step": 4300 }, { "epoch": 0.1, "learning_rate": 9.873004701094106e-06, "loss": 1.1721, "step": 4301 }, { "epoch": 0.1, "learning_rate": 9.872920580294386e-06, "loss": 1.1567, "step": 4302 }, { "epoch": 0.1, "learning_rate": 9.87283643200198e-06, "loss": 1.0836, "step": 4303 }, { "epoch": 0.1, "learning_rate": 9.872752256217363e-06, "loss": 0.9292, "step": 4304 }, { "epoch": 0.1, "learning_rate": 9.872668052941008e-06, "loss": 1.3351, "step": 4305 }, { "epoch": 0.1, "learning_rate": 9.872583822173392e-06, "loss": 1.3431, "step": 4306 }, { "epoch": 0.1, "learning_rate": 9.87249956391499e-06, "loss": 1.0176, "step": 4307 }, { "epoch": 0.1, "learning_rate": 9.872415278166277e-06, "loss": 1.0859, "step": 4308 }, { "epoch": 0.1, "learning_rate": 9.872330964927725e-06, "loss": 1.2567, "step": 4309 }, { "epoch": 0.1, "learning_rate": 9.872246624199817e-06, "loss": 1.3557, "step": 4310 }, { "epoch": 0.1, "learning_rate": 9.872162255983024e-06, "loss": 0.8796, "step": 4311 }, { "epoch": 0.1, "learning_rate": 9.872077860277822e-06, "loss": 1.0353, "step": 4312 }, { "epoch": 0.1, "learning_rate": 9.87199343708469e-06, "loss": 1.1769, "step": 4313 }, { "epoch": 0.1, "learning_rate": 9.871908986404099e-06, "loss": 1.1434, "step": 4314 }, { "epoch": 0.1, "learning_rate": 9.871824508236531e-06, "loss": 0.946, "step": 4315 }, { "epoch": 0.1, "learning_rate": 9.871740002582461e-06, "loss": 1.1487, "step": 4316 }, { "epoch": 0.1, "learning_rate": 9.871655469442366e-06, "loss": 1.233, "step": 4317 }, { "epoch": 0.1, "learning_rate": 9.871570908816721e-06, "loss": 1.1266, "step": 4318 }, { "epoch": 0.1, "learning_rate": 9.871486320706003e-06, "loss": 0.8881, "step": 4319 }, { "epoch": 0.1, "learning_rate": 9.871401705110693e-06, "loss": 1.0479, "step": 4320 }, { "epoch": 0.1, "learning_rate": 9.871317062031265e-06, "loss": 1.2362, "step": 4321 }, { "epoch": 0.1, "learning_rate": 9.871232391468197e-06, "loss": 0.9584, "step": 4322 }, { "epoch": 0.1, "learning_rate": 9.871147693421967e-06, "loss": 0.9386, "step": 4323 }, { "epoch": 0.1, "learning_rate": 9.871062967893055e-06, "loss": 1.0444, "step": 4324 }, { "epoch": 0.1, "learning_rate": 9.870978214881934e-06, "loss": 0.8858, "step": 4325 }, { "epoch": 0.1, "learning_rate": 9.870893434389088e-06, "loss": 1.0251, "step": 4326 }, { "epoch": 0.1, "learning_rate": 9.870808626414992e-06, "loss": 1.1726, "step": 4327 }, { "epoch": 0.1, "learning_rate": 9.870723790960123e-06, "loss": 1.3189, "step": 4328 }, { "epoch": 0.1, "learning_rate": 9.870638928024964e-06, "loss": 1.2945, "step": 4329 }, { "epoch": 0.1, "learning_rate": 9.87055403760999e-06, "loss": 1.1307, "step": 4330 }, { "epoch": 0.1, "learning_rate": 9.870469119715683e-06, "loss": 0.7528, "step": 4331 }, { "epoch": 0.1, "learning_rate": 9.870384174342519e-06, "loss": 1.1025, "step": 4332 }, { "epoch": 0.1, "learning_rate": 9.87029920149098e-06, "loss": 0.7723, "step": 4333 }, { "epoch": 0.1, "learning_rate": 9.870214201161544e-06, "loss": 1.2197, "step": 4334 }, { "epoch": 0.1, "learning_rate": 9.87012917335469e-06, "loss": 1.2203, "step": 4335 }, { "epoch": 0.1, "learning_rate": 9.870044118070898e-06, "loss": 0.9449, "step": 4336 }, { "epoch": 0.1, "learning_rate": 9.869959035310649e-06, "loss": 1.1208, "step": 4337 }, { "epoch": 0.1, "learning_rate": 9.869873925074422e-06, "loss": 1.0638, "step": 4338 }, { "epoch": 0.1, "learning_rate": 9.869788787362699e-06, "loss": 1.1595, "step": 4339 }, { "epoch": 0.1, "learning_rate": 9.869703622175957e-06, "loss": 1.1457, "step": 4340 }, { "epoch": 0.1, "learning_rate": 9.86961842951468e-06, "loss": 0.9685, "step": 4341 }, { "epoch": 0.1, "learning_rate": 9.869533209379346e-06, "loss": 1.0828, "step": 4342 }, { "epoch": 0.1, "learning_rate": 9.869447961770437e-06, "loss": 1.096, "step": 4343 }, { "epoch": 0.1, "learning_rate": 9.869362686688435e-06, "loss": 1.0572, "step": 4344 }, { "epoch": 0.1, "learning_rate": 9.869277384133818e-06, "loss": 1.1722, "step": 4345 }, { "epoch": 0.1, "learning_rate": 9.86919205410707e-06, "loss": 1.1861, "step": 4346 }, { "epoch": 0.1, "learning_rate": 9.869106696608673e-06, "loss": 0.9486, "step": 4347 }, { "epoch": 0.1, "learning_rate": 9.869021311639106e-06, "loss": 1.1835, "step": 4348 }, { "epoch": 0.1, "learning_rate": 9.86893589919885e-06, "loss": 1.2195, "step": 4349 }, { "epoch": 0.1, "learning_rate": 9.868850459288392e-06, "loss": 1.1212, "step": 4350 }, { "epoch": 0.1, "learning_rate": 9.86876499190821e-06, "loss": 1.0809, "step": 4351 }, { "epoch": 0.1, "learning_rate": 9.868679497058786e-06, "loss": 1.0927, "step": 4352 }, { "epoch": 0.1, "learning_rate": 9.868593974740606e-06, "loss": 1.064, "step": 4353 }, { "epoch": 0.1, "learning_rate": 9.868508424954147e-06, "loss": 1.111, "step": 4354 }, { "epoch": 0.1, "learning_rate": 9.868422847699896e-06, "loss": 1.1482, "step": 4355 }, { "epoch": 0.1, "learning_rate": 9.868337242978334e-06, "loss": 0.9455, "step": 4356 }, { "epoch": 0.1, "learning_rate": 9.868251610789945e-06, "loss": 1.0058, "step": 4357 }, { "epoch": 0.1, "learning_rate": 9.868165951135212e-06, "loss": 0.8873, "step": 4358 }, { "epoch": 0.1, "learning_rate": 9.868080264014616e-06, "loss": 0.8661, "step": 4359 }, { "epoch": 0.1, "learning_rate": 9.867994549428643e-06, "loss": 1.1127, "step": 4360 }, { "epoch": 0.1, "learning_rate": 9.867908807377778e-06, "loss": 1.1575, "step": 4361 }, { "epoch": 0.1, "learning_rate": 9.8678230378625e-06, "loss": 1.112, "step": 4362 }, { "epoch": 0.1, "learning_rate": 9.867737240883297e-06, "loss": 1.1545, "step": 4363 }, { "epoch": 0.1, "learning_rate": 9.867651416440651e-06, "loss": 0.9928, "step": 4364 }, { "epoch": 0.1, "learning_rate": 9.867565564535046e-06, "loss": 1.1914, "step": 4365 }, { "epoch": 0.1, "learning_rate": 9.867479685166968e-06, "loss": 1.0132, "step": 4366 }, { "epoch": 0.1, "learning_rate": 9.8673937783369e-06, "loss": 1.08, "step": 4367 }, { "epoch": 0.1, "learning_rate": 9.867307844045329e-06, "loss": 0.9826, "step": 4368 }, { "epoch": 0.1, "learning_rate": 9.867221882292737e-06, "loss": 1.0534, "step": 4369 }, { "epoch": 0.1, "learning_rate": 9.867135893079611e-06, "loss": 0.8507, "step": 4370 }, { "epoch": 0.1, "learning_rate": 9.867049876406435e-06, "loss": 1.0067, "step": 4371 }, { "epoch": 0.1, "learning_rate": 9.866963832273696e-06, "loss": 1.2358, "step": 4372 }, { "epoch": 0.1, "learning_rate": 9.866877760681874e-06, "loss": 1.1712, "step": 4373 }, { "epoch": 0.1, "learning_rate": 9.866791661631462e-06, "loss": 0.8967, "step": 4374 }, { "epoch": 0.1, "learning_rate": 9.866705535122943e-06, "loss": 1.1763, "step": 4375 }, { "epoch": 0.1, "learning_rate": 9.866619381156801e-06, "loss": 1.2342, "step": 4376 }, { "epoch": 0.1, "learning_rate": 9.866533199733523e-06, "loss": 1.0547, "step": 4377 }, { "epoch": 0.1, "learning_rate": 9.866446990853597e-06, "loss": 1.0925, "step": 4378 }, { "epoch": 0.1, "learning_rate": 9.866360754517508e-06, "loss": 1.2008, "step": 4379 }, { "epoch": 0.1, "learning_rate": 9.86627449072574e-06, "loss": 0.9359, "step": 4380 }, { "epoch": 0.1, "learning_rate": 9.866188199478786e-06, "loss": 1.0282, "step": 4381 }, { "epoch": 0.1, "learning_rate": 9.866101880777128e-06, "loss": 1.11, "step": 4382 }, { "epoch": 0.1, "learning_rate": 9.866015534621254e-06, "loss": 1.1733, "step": 4383 }, { "epoch": 0.1, "learning_rate": 9.86592916101165e-06, "loss": 0.9352, "step": 4384 }, { "epoch": 0.1, "learning_rate": 9.865842759948807e-06, "loss": 1.2071, "step": 4385 }, { "epoch": 0.1, "learning_rate": 9.865756331433209e-06, "loss": 1.048, "step": 4386 }, { "epoch": 0.1, "learning_rate": 9.865669875465344e-06, "loss": 1.0999, "step": 4387 }, { "epoch": 0.1, "learning_rate": 9.8655833920457e-06, "loss": 1.1081, "step": 4388 }, { "epoch": 0.1, "learning_rate": 9.865496881174768e-06, "loss": 0.9962, "step": 4389 }, { "epoch": 0.1, "learning_rate": 9.865410342853033e-06, "loss": 1.1589, "step": 4390 }, { "epoch": 0.1, "learning_rate": 9.865323777080982e-06, "loss": 1.0788, "step": 4391 }, { "epoch": 0.1, "learning_rate": 9.865237183859107e-06, "loss": 0.799, "step": 4392 }, { "epoch": 0.1, "learning_rate": 9.865150563187893e-06, "loss": 0.9959, "step": 4393 }, { "epoch": 0.1, "learning_rate": 9.865063915067832e-06, "loss": 1.0922, "step": 4394 }, { "epoch": 0.1, "learning_rate": 9.864977239499411e-06, "loss": 1.305, "step": 4395 }, { "epoch": 0.1, "learning_rate": 9.864890536483119e-06, "loss": 0.9242, "step": 4396 }, { "epoch": 0.1, "learning_rate": 9.864803806019445e-06, "loss": 0.981, "step": 4397 }, { "epoch": 0.1, "learning_rate": 9.86471704810888e-06, "loss": 1.0403, "step": 4398 }, { "epoch": 0.1, "learning_rate": 9.864630262751911e-06, "loss": 0.9869, "step": 4399 }, { "epoch": 0.1, "learning_rate": 9.86454344994903e-06, "loss": 1.3662, "step": 4400 }, { "epoch": 0.1, "learning_rate": 9.864456609700726e-06, "loss": 1.2329, "step": 4401 }, { "epoch": 0.1, "learning_rate": 9.864369742007487e-06, "loss": 1.2212, "step": 4402 }, { "epoch": 0.1, "learning_rate": 9.864282846869806e-06, "loss": 1.0245, "step": 4403 }, { "epoch": 0.1, "learning_rate": 9.864195924288172e-06, "loss": 0.9791, "step": 4404 }, { "epoch": 0.1, "learning_rate": 9.864108974263076e-06, "loss": 1.0515, "step": 4405 }, { "epoch": 0.1, "learning_rate": 9.864021996795008e-06, "loss": 1.2269, "step": 4406 }, { "epoch": 0.1, "learning_rate": 9.863934991884457e-06, "loss": 0.7249, "step": 4407 }, { "epoch": 0.1, "learning_rate": 9.863847959531917e-06, "loss": 1.1102, "step": 4408 }, { "epoch": 0.1, "learning_rate": 9.863760899737878e-06, "loss": 1.1996, "step": 4409 }, { "epoch": 0.1, "learning_rate": 9.86367381250283e-06, "loss": 0.8844, "step": 4410 }, { "epoch": 0.1, "learning_rate": 9.863586697827265e-06, "loss": 0.9599, "step": 4411 }, { "epoch": 0.1, "learning_rate": 9.863499555711676e-06, "loss": 0.8985, "step": 4412 }, { "epoch": 0.1, "learning_rate": 9.863412386156553e-06, "loss": 1.0049, "step": 4413 }, { "epoch": 0.1, "learning_rate": 9.863325189162387e-06, "loss": 0.9679, "step": 4414 }, { "epoch": 0.1, "learning_rate": 9.863237964729671e-06, "loss": 0.9463, "step": 4415 }, { "epoch": 0.1, "learning_rate": 9.863150712858897e-06, "loss": 0.8145, "step": 4416 }, { "epoch": 0.1, "learning_rate": 9.863063433550559e-06, "loss": 1.0755, "step": 4417 }, { "epoch": 0.1, "learning_rate": 9.862976126805148e-06, "loss": 1.1895, "step": 4418 }, { "epoch": 0.1, "learning_rate": 9.862888792623155e-06, "loss": 1.2334, "step": 4419 }, { "epoch": 0.1, "learning_rate": 9.862801431005076e-06, "loss": 1.2044, "step": 4420 }, { "epoch": 0.1, "learning_rate": 9.8627140419514e-06, "loss": 0.963, "step": 4421 }, { "epoch": 0.1, "learning_rate": 9.862626625462624e-06, "loss": 1.194, "step": 4422 }, { "epoch": 0.1, "learning_rate": 9.862539181539238e-06, "loss": 0.9237, "step": 4423 }, { "epoch": 0.1, "learning_rate": 9.862451710181737e-06, "loss": 0.7945, "step": 4424 }, { "epoch": 0.1, "learning_rate": 9.862364211390613e-06, "loss": 1.2383, "step": 4425 }, { "epoch": 0.1, "learning_rate": 9.862276685166364e-06, "loss": 1.2938, "step": 4426 }, { "epoch": 0.1, "learning_rate": 9.862189131509478e-06, "loss": 1.0261, "step": 4427 }, { "epoch": 0.1, "learning_rate": 9.862101550420453e-06, "loss": 0.8276, "step": 4428 }, { "epoch": 0.1, "learning_rate": 9.862013941899782e-06, "loss": 0.9764, "step": 4429 }, { "epoch": 0.1, "learning_rate": 9.861926305947957e-06, "loss": 1.085, "step": 4430 }, { "epoch": 0.1, "learning_rate": 9.861838642565477e-06, "loss": 0.974, "step": 4431 }, { "epoch": 0.1, "learning_rate": 9.861750951752833e-06, "loss": 1.0901, "step": 4432 }, { "epoch": 0.1, "learning_rate": 9.86166323351052e-06, "loss": 1.1272, "step": 4433 }, { "epoch": 0.1, "learning_rate": 9.861575487839035e-06, "loss": 1.263, "step": 4434 }, { "epoch": 0.1, "learning_rate": 9.86148771473887e-06, "loss": 1.1557, "step": 4435 }, { "epoch": 0.1, "learning_rate": 9.861399914210525e-06, "loss": 0.9893, "step": 4436 }, { "epoch": 0.1, "learning_rate": 9.86131208625449e-06, "loss": 1.0707, "step": 4437 }, { "epoch": 0.1, "learning_rate": 9.861224230871263e-06, "loss": 0.9509, "step": 4438 }, { "epoch": 0.1, "learning_rate": 9.86113634806134e-06, "loss": 1.1691, "step": 4439 }, { "epoch": 0.1, "learning_rate": 9.861048437825217e-06, "loss": 1.1568, "step": 4440 }, { "epoch": 0.1, "learning_rate": 9.860960500163387e-06, "loss": 0.9516, "step": 4441 }, { "epoch": 0.1, "learning_rate": 9.860872535076351e-06, "loss": 1.1688, "step": 4442 }, { "epoch": 0.1, "learning_rate": 9.860784542564603e-06, "loss": 0.9901, "step": 4443 }, { "epoch": 0.1, "learning_rate": 9.860696522628638e-06, "loss": 1.0675, "step": 4444 }, { "epoch": 0.1, "learning_rate": 9.860608475268955e-06, "loss": 1.1635, "step": 4445 }, { "epoch": 0.1, "learning_rate": 9.860520400486049e-06, "loss": 1.2543, "step": 4446 }, { "epoch": 0.1, "learning_rate": 9.860432298280417e-06, "loss": 1.0543, "step": 4447 }, { "epoch": 0.1, "learning_rate": 9.860344168652557e-06, "loss": 1.2338, "step": 4448 }, { "epoch": 0.1, "learning_rate": 9.860256011602965e-06, "loss": 1.0625, "step": 4449 }, { "epoch": 0.1, "learning_rate": 9.860167827132141e-06, "loss": 0.9601, "step": 4450 }, { "epoch": 0.1, "learning_rate": 9.860079615240579e-06, "loss": 0.8062, "step": 4451 }, { "epoch": 0.1, "learning_rate": 9.85999137592878e-06, "loss": 0.8101, "step": 4452 }, { "epoch": 0.1, "learning_rate": 9.859903109197238e-06, "loss": 1.2235, "step": 4453 }, { "epoch": 0.1, "learning_rate": 9.859814815046454e-06, "loss": 1.2147, "step": 4454 }, { "epoch": 0.1, "learning_rate": 9.859726493476927e-06, "loss": 0.9757, "step": 4455 }, { "epoch": 0.1, "learning_rate": 9.859638144489152e-06, "loss": 0.8365, "step": 4456 }, { "epoch": 0.1, "learning_rate": 9.859549768083629e-06, "loss": 1.0756, "step": 4457 }, { "epoch": 0.1, "learning_rate": 9.859461364260858e-06, "loss": 1.0636, "step": 4458 }, { "epoch": 0.1, "learning_rate": 9.859372933021336e-06, "loss": 1.0892, "step": 4459 }, { "epoch": 0.1, "learning_rate": 9.859284474365562e-06, "loss": 1.0551, "step": 4460 }, { "epoch": 0.1, "learning_rate": 9.859195988294036e-06, "loss": 1.0962, "step": 4461 }, { "epoch": 0.1, "learning_rate": 9.859107474807257e-06, "loss": 1.1359, "step": 4462 }, { "epoch": 0.1, "learning_rate": 9.859018933905725e-06, "loss": 0.9253, "step": 4463 }, { "epoch": 0.1, "learning_rate": 9.858930365589935e-06, "loss": 1.1374, "step": 4464 }, { "epoch": 0.1, "learning_rate": 9.858841769860394e-06, "loss": 0.9948, "step": 4465 }, { "epoch": 0.1, "learning_rate": 9.858753146717597e-06, "loss": 1.1727, "step": 4466 }, { "epoch": 0.1, "learning_rate": 9.858664496162045e-06, "loss": 1.229, "step": 4467 }, { "epoch": 0.1, "learning_rate": 9.858575818194237e-06, "loss": 1.1433, "step": 4468 }, { "epoch": 0.1, "learning_rate": 9.858487112814678e-06, "loss": 0.7991, "step": 4469 }, { "epoch": 0.1, "learning_rate": 9.858398380023864e-06, "loss": 0.8765, "step": 4470 }, { "epoch": 0.1, "learning_rate": 9.858309619822297e-06, "loss": 1.0084, "step": 4471 }, { "epoch": 0.1, "learning_rate": 9.858220832210477e-06, "loss": 0.8638, "step": 4472 }, { "epoch": 0.1, "learning_rate": 9.858132017188905e-06, "loss": 1.0594, "step": 4473 }, { "epoch": 0.1, "learning_rate": 9.858043174758083e-06, "loss": 1.2525, "step": 4474 }, { "epoch": 0.1, "learning_rate": 9.857954304918512e-06, "loss": 0.897, "step": 4475 }, { "epoch": 0.1, "learning_rate": 9.857865407670693e-06, "loss": 1.0163, "step": 4476 }, { "epoch": 0.1, "learning_rate": 9.857776483015129e-06, "loss": 1.0964, "step": 4477 }, { "epoch": 0.1, "learning_rate": 9.857687530952318e-06, "loss": 1.0111, "step": 4478 }, { "epoch": 0.1, "learning_rate": 9.857598551482767e-06, "loss": 0.9891, "step": 4479 }, { "epoch": 0.1, "learning_rate": 9.857509544606975e-06, "loss": 0.8848, "step": 4480 }, { "epoch": 0.1, "learning_rate": 9.857420510325444e-06, "loss": 1.2056, "step": 4481 }, { "epoch": 0.1, "learning_rate": 9.857331448638676e-06, "loss": 1.0746, "step": 4482 }, { "epoch": 0.1, "learning_rate": 9.857242359547174e-06, "loss": 0.9796, "step": 4483 }, { "epoch": 0.1, "learning_rate": 9.857153243051443e-06, "loss": 0.847, "step": 4484 }, { "epoch": 0.1, "learning_rate": 9.857064099151983e-06, "loss": 1.0698, "step": 4485 }, { "epoch": 0.1, "learning_rate": 9.856974927849297e-06, "loss": 1.144, "step": 4486 }, { "epoch": 0.1, "learning_rate": 9.85688572914389e-06, "loss": 1.2018, "step": 4487 }, { "epoch": 0.1, "learning_rate": 9.856796503036263e-06, "loss": 1.044, "step": 4488 }, { "epoch": 0.1, "learning_rate": 9.856707249526922e-06, "loss": 1.0633, "step": 4489 }, { "epoch": 0.1, "learning_rate": 9.85661796861637e-06, "loss": 1.0593, "step": 4490 }, { "epoch": 0.1, "learning_rate": 9.856528660305106e-06, "loss": 0.8145, "step": 4491 }, { "epoch": 0.1, "learning_rate": 9.85643932459364e-06, "loss": 1.095, "step": 4492 }, { "epoch": 0.1, "learning_rate": 9.856349961482472e-06, "loss": 0.9889, "step": 4493 }, { "epoch": 0.1, "learning_rate": 9.856260570972109e-06, "loss": 0.938, "step": 4494 }, { "epoch": 0.1, "learning_rate": 9.856171153063054e-06, "loss": 0.9945, "step": 4495 }, { "epoch": 0.1, "learning_rate": 9.856081707755813e-06, "loss": 1.082, "step": 4496 }, { "epoch": 0.1, "learning_rate": 9.855992235050889e-06, "loss": 0.8652, "step": 4497 }, { "epoch": 0.1, "learning_rate": 9.855902734948786e-06, "loss": 1.2116, "step": 4498 }, { "epoch": 0.1, "learning_rate": 9.855813207450009e-06, "loss": 1.0021, "step": 4499 }, { "epoch": 0.1, "learning_rate": 9.855723652555068e-06, "loss": 0.993, "step": 4500 }, { "epoch": 0.1, "learning_rate": 9.85563407026446e-06, "loss": 0.9146, "step": 4501 }, { "epoch": 0.1, "learning_rate": 9.855544460578696e-06, "loss": 0.9596, "step": 4502 }, { "epoch": 0.1, "learning_rate": 9.855454823498282e-06, "loss": 1.5316, "step": 4503 }, { "epoch": 0.1, "learning_rate": 9.855365159023722e-06, "loss": 0.6777, "step": 4504 }, { "epoch": 0.1, "learning_rate": 9.85527546715552e-06, "loss": 1.1065, "step": 4505 }, { "epoch": 0.1, "learning_rate": 9.855185747894187e-06, "loss": 0.9394, "step": 4506 }, { "epoch": 0.1, "learning_rate": 9.855096001240225e-06, "loss": 1.2527, "step": 4507 }, { "epoch": 0.1, "learning_rate": 9.855006227194141e-06, "loss": 1.1214, "step": 4508 }, { "epoch": 0.1, "learning_rate": 9.854916425756442e-06, "loss": 0.8829, "step": 4509 }, { "epoch": 0.1, "learning_rate": 9.854826596927635e-06, "loss": 1.12, "step": 4510 }, { "epoch": 0.1, "learning_rate": 9.854736740708228e-06, "loss": 1.0143, "step": 4511 }, { "epoch": 0.1, "learning_rate": 9.854646857098726e-06, "loss": 1.215, "step": 4512 }, { "epoch": 0.1, "learning_rate": 9.854556946099636e-06, "loss": 1.1397, "step": 4513 }, { "epoch": 0.1, "learning_rate": 9.854467007711466e-06, "loss": 0.8044, "step": 4514 }, { "epoch": 0.1, "learning_rate": 9.854377041934721e-06, "loss": 0.9698, "step": 4515 }, { "epoch": 0.1, "learning_rate": 9.854287048769915e-06, "loss": 0.8761, "step": 4516 }, { "epoch": 0.1, "learning_rate": 9.854197028217549e-06, "loss": 0.7246, "step": 4517 }, { "epoch": 0.1, "learning_rate": 9.854106980278136e-06, "loss": 1.1695, "step": 4518 }, { "epoch": 0.1, "learning_rate": 9.854016904952179e-06, "loss": 0.9226, "step": 4519 }, { "epoch": 0.1, "learning_rate": 9.85392680224019e-06, "loss": 1.1858, "step": 4520 }, { "epoch": 0.1, "learning_rate": 9.853836672142676e-06, "loss": 1.0828, "step": 4521 }, { "epoch": 0.1, "learning_rate": 9.853746514660145e-06, "loss": 0.958, "step": 4522 }, { "epoch": 0.1, "learning_rate": 9.853656329793108e-06, "loss": 1.0875, "step": 4523 }, { "epoch": 0.1, "learning_rate": 9.853566117542071e-06, "loss": 1.0323, "step": 4524 }, { "epoch": 0.1, "learning_rate": 9.853475877907544e-06, "loss": 1.0781, "step": 4525 }, { "epoch": 0.1, "learning_rate": 9.853385610890036e-06, "loss": 1.1783, "step": 4526 }, { "epoch": 0.1, "learning_rate": 9.853295316490057e-06, "loss": 1.2796, "step": 4527 }, { "epoch": 0.11, "learning_rate": 9.853204994708117e-06, "loss": 1.1815, "step": 4528 }, { "epoch": 0.11, "learning_rate": 9.853114645544723e-06, "loss": 0.9245, "step": 4529 }, { "epoch": 0.11, "learning_rate": 9.853024269000386e-06, "loss": 1.1024, "step": 4530 }, { "epoch": 0.11, "learning_rate": 9.852933865075617e-06, "loss": 1.0679, "step": 4531 }, { "epoch": 0.11, "learning_rate": 9.852843433770925e-06, "loss": 0.9915, "step": 4532 }, { "epoch": 0.11, "learning_rate": 9.85275297508682e-06, "loss": 0.9254, "step": 4533 }, { "epoch": 0.11, "learning_rate": 9.852662489023814e-06, "loss": 0.9779, "step": 4534 }, { "epoch": 0.11, "learning_rate": 9.852571975582415e-06, "loss": 1.0018, "step": 4535 }, { "epoch": 0.11, "learning_rate": 9.852481434763135e-06, "loss": 1.4038, "step": 4536 }, { "epoch": 0.11, "learning_rate": 9.852390866566486e-06, "loss": 1.1681, "step": 4537 }, { "epoch": 0.11, "learning_rate": 9.852300270992978e-06, "loss": 0.8944, "step": 4538 }, { "epoch": 0.11, "learning_rate": 9.85220964804312e-06, "loss": 1.068, "step": 4539 }, { "epoch": 0.11, "learning_rate": 9.852118997717426e-06, "loss": 0.9084, "step": 4540 }, { "epoch": 0.11, "learning_rate": 9.852028320016408e-06, "loss": 1.2559, "step": 4541 }, { "epoch": 0.11, "learning_rate": 9.851937614940576e-06, "loss": 1.2654, "step": 4542 }, { "epoch": 0.11, "learning_rate": 9.851846882490441e-06, "loss": 1.1468, "step": 4543 }, { "epoch": 0.11, "learning_rate": 9.851756122666516e-06, "loss": 0.9624, "step": 4544 }, { "epoch": 0.11, "learning_rate": 9.851665335469313e-06, "loss": 1.3109, "step": 4545 }, { "epoch": 0.11, "learning_rate": 9.851574520899345e-06, "loss": 1.1519, "step": 4546 }, { "epoch": 0.11, "learning_rate": 9.851483678957122e-06, "loss": 1.1438, "step": 4547 }, { "epoch": 0.11, "learning_rate": 9.85139280964316e-06, "loss": 1.1317, "step": 4548 }, { "epoch": 0.11, "learning_rate": 9.851301912957968e-06, "loss": 1.3738, "step": 4549 }, { "epoch": 0.11, "learning_rate": 9.85121098890206e-06, "loss": 1.2416, "step": 4550 }, { "epoch": 0.11, "learning_rate": 9.851120037475952e-06, "loss": 1.1155, "step": 4551 }, { "epoch": 0.11, "learning_rate": 9.851029058680154e-06, "loss": 1.023, "step": 4552 }, { "epoch": 0.11, "learning_rate": 9.85093805251518e-06, "loss": 1.1634, "step": 4553 }, { "epoch": 0.11, "learning_rate": 9.850847018981543e-06, "loss": 1.2475, "step": 4554 }, { "epoch": 0.11, "learning_rate": 9.850755958079757e-06, "loss": 1.1186, "step": 4555 }, { "epoch": 0.11, "learning_rate": 9.850664869810336e-06, "loss": 1.0404, "step": 4556 }, { "epoch": 0.11, "learning_rate": 9.850573754173794e-06, "loss": 1.3113, "step": 4557 }, { "epoch": 0.11, "learning_rate": 9.850482611170644e-06, "loss": 1.0618, "step": 4558 }, { "epoch": 0.11, "learning_rate": 9.850391440801402e-06, "loss": 1.0647, "step": 4559 }, { "epoch": 0.11, "learning_rate": 9.850300243066582e-06, "loss": 0.9823, "step": 4560 }, { "epoch": 0.11, "learning_rate": 9.850209017966696e-06, "loss": 0.9027, "step": 4561 }, { "epoch": 0.11, "learning_rate": 9.850117765502262e-06, "loss": 1.0763, "step": 4562 }, { "epoch": 0.11, "learning_rate": 9.850026485673794e-06, "loss": 0.7466, "step": 4563 }, { "epoch": 0.11, "learning_rate": 9.849935178481805e-06, "loss": 0.9205, "step": 4564 }, { "epoch": 0.11, "learning_rate": 9.849843843926812e-06, "loss": 0.8003, "step": 4565 }, { "epoch": 0.11, "learning_rate": 9.849752482009329e-06, "loss": 0.9719, "step": 4566 }, { "epoch": 0.11, "learning_rate": 9.849661092729874e-06, "loss": 0.9609, "step": 4567 }, { "epoch": 0.11, "learning_rate": 9.84956967608896e-06, "loss": 1.0824, "step": 4568 }, { "epoch": 0.11, "learning_rate": 9.849478232087105e-06, "loss": 0.9257, "step": 4569 }, { "epoch": 0.11, "learning_rate": 9.849386760724823e-06, "loss": 0.9256, "step": 4570 }, { "epoch": 0.11, "learning_rate": 9.84929526200263e-06, "loss": 1.2128, "step": 4571 }, { "epoch": 0.11, "learning_rate": 9.849203735921044e-06, "loss": 1.0141, "step": 4572 }, { "epoch": 0.11, "learning_rate": 9.84911218248058e-06, "loss": 1.0508, "step": 4573 }, { "epoch": 0.11, "learning_rate": 9.849020601681756e-06, "loss": 0.8155, "step": 4574 }, { "epoch": 0.11, "learning_rate": 9.848928993525086e-06, "loss": 1.0388, "step": 4575 }, { "epoch": 0.11, "learning_rate": 9.84883735801109e-06, "loss": 1.1338, "step": 4576 }, { "epoch": 0.11, "learning_rate": 9.848745695140281e-06, "loss": 0.9257, "step": 4577 }, { "epoch": 0.11, "learning_rate": 9.848654004913181e-06, "loss": 1.1903, "step": 4578 }, { "epoch": 0.11, "learning_rate": 9.848562287330303e-06, "loss": 1.2172, "step": 4579 }, { "epoch": 0.11, "learning_rate": 9.848470542392168e-06, "loss": 0.9188, "step": 4580 }, { "epoch": 0.11, "learning_rate": 9.848378770099291e-06, "loss": 0.9825, "step": 4581 }, { "epoch": 0.11, "learning_rate": 9.84828697045219e-06, "loss": 0.9739, "step": 4582 }, { "epoch": 0.11, "learning_rate": 9.848195143451385e-06, "loss": 1.2579, "step": 4583 }, { "epoch": 0.11, "learning_rate": 9.848103289097393e-06, "loss": 1.0293, "step": 4584 }, { "epoch": 0.11, "learning_rate": 9.848011407390731e-06, "loss": 1.1555, "step": 4585 }, { "epoch": 0.11, "learning_rate": 9.847919498331919e-06, "loss": 0.9301, "step": 4586 }, { "epoch": 0.11, "learning_rate": 9.847827561921476e-06, "loss": 1.1966, "step": 4587 }, { "epoch": 0.11, "learning_rate": 9.847735598159918e-06, "loss": 0.904, "step": 4588 }, { "epoch": 0.11, "learning_rate": 9.847643607047766e-06, "loss": 1.2262, "step": 4589 }, { "epoch": 0.11, "learning_rate": 9.84755158858554e-06, "loss": 1.0199, "step": 4590 }, { "epoch": 0.11, "learning_rate": 9.847459542773755e-06, "loss": 1.0664, "step": 4591 }, { "epoch": 0.11, "learning_rate": 9.847367469612935e-06, "loss": 0.9948, "step": 4592 }, { "epoch": 0.11, "learning_rate": 9.847275369103597e-06, "loss": 1.0, "step": 4593 }, { "epoch": 0.11, "learning_rate": 9.847183241246259e-06, "loss": 0.7987, "step": 4594 }, { "epoch": 0.11, "learning_rate": 9.847091086041446e-06, "loss": 0.9567, "step": 4595 }, { "epoch": 0.11, "learning_rate": 9.846998903489672e-06, "loss": 1.0519, "step": 4596 }, { "epoch": 0.11, "learning_rate": 9.846906693591462e-06, "loss": 0.9258, "step": 4597 }, { "epoch": 0.11, "learning_rate": 9.846814456347334e-06, "loss": 1.296, "step": 4598 }, { "epoch": 0.11, "learning_rate": 9.846722191757807e-06, "loss": 1.193, "step": 4599 }, { "epoch": 0.11, "learning_rate": 9.846629899823404e-06, "loss": 1.1119, "step": 4600 }, { "epoch": 0.11, "learning_rate": 9.846537580544645e-06, "loss": 1.0904, "step": 4601 }, { "epoch": 0.11, "learning_rate": 9.84644523392205e-06, "loss": 1.1197, "step": 4602 }, { "epoch": 0.11, "learning_rate": 9.84635285995614e-06, "loss": 1.0458, "step": 4603 }, { "epoch": 0.11, "learning_rate": 9.84626045864744e-06, "loss": 0.7687, "step": 4604 }, { "epoch": 0.11, "learning_rate": 9.846168029996465e-06, "loss": 0.8947, "step": 4605 }, { "epoch": 0.11, "learning_rate": 9.84607557400374e-06, "loss": 0.9684, "step": 4606 }, { "epoch": 0.11, "learning_rate": 9.845983090669787e-06, "loss": 1.2592, "step": 4607 }, { "epoch": 0.11, "learning_rate": 9.845890579995127e-06, "loss": 1.1233, "step": 4608 }, { "epoch": 0.11, "learning_rate": 9.845798041980282e-06, "loss": 0.8335, "step": 4609 }, { "epoch": 0.11, "learning_rate": 9.845705476625773e-06, "loss": 0.9861, "step": 4610 }, { "epoch": 0.11, "learning_rate": 9.845612883932126e-06, "loss": 0.925, "step": 4611 }, { "epoch": 0.11, "learning_rate": 9.845520263899858e-06, "loss": 0.8207, "step": 4612 }, { "epoch": 0.11, "learning_rate": 9.845427616529495e-06, "loss": 0.9727, "step": 4613 }, { "epoch": 0.11, "learning_rate": 9.84533494182156e-06, "loss": 1.1376, "step": 4614 }, { "epoch": 0.11, "learning_rate": 9.845242239776574e-06, "loss": 0.8773, "step": 4615 }, { "epoch": 0.11, "learning_rate": 9.84514951039506e-06, "loss": 1.0674, "step": 4616 }, { "epoch": 0.11, "learning_rate": 9.845056753677543e-06, "loss": 1.1059, "step": 4617 }, { "epoch": 0.11, "learning_rate": 9.844963969624546e-06, "loss": 1.1303, "step": 4618 }, { "epoch": 0.11, "learning_rate": 9.84487115823659e-06, "loss": 1.1831, "step": 4619 }, { "epoch": 0.11, "learning_rate": 9.844778319514201e-06, "loss": 1.0329, "step": 4620 }, { "epoch": 0.11, "learning_rate": 9.844685453457902e-06, "loss": 1.1416, "step": 4621 }, { "epoch": 0.11, "learning_rate": 9.84459256006822e-06, "loss": 1.0374, "step": 4622 }, { "epoch": 0.11, "learning_rate": 9.844499639345674e-06, "loss": 1.2151, "step": 4623 }, { "epoch": 0.11, "learning_rate": 9.844406691290791e-06, "loss": 0.938, "step": 4624 }, { "epoch": 0.11, "learning_rate": 9.844313715904094e-06, "loss": 1.1788, "step": 4625 }, { "epoch": 0.11, "learning_rate": 9.84422071318611e-06, "loss": 0.9914, "step": 4626 }, { "epoch": 0.11, "learning_rate": 9.844127683137361e-06, "loss": 1.1736, "step": 4627 }, { "epoch": 0.11, "learning_rate": 9.844034625758374e-06, "loss": 1.1808, "step": 4628 }, { "epoch": 0.11, "learning_rate": 9.843941541049672e-06, "loss": 0.9172, "step": 4629 }, { "epoch": 0.11, "learning_rate": 9.843848429011785e-06, "loss": 1.0212, "step": 4630 }, { "epoch": 0.11, "learning_rate": 9.843755289645231e-06, "loss": 1.0771, "step": 4631 }, { "epoch": 0.11, "learning_rate": 9.843662122950539e-06, "loss": 1.0025, "step": 4632 }, { "epoch": 0.11, "learning_rate": 9.843568928928235e-06, "loss": 1.0965, "step": 4633 }, { "epoch": 0.11, "learning_rate": 9.843475707578847e-06, "loss": 0.8113, "step": 4634 }, { "epoch": 0.11, "learning_rate": 9.843382458902897e-06, "loss": 1.2151, "step": 4635 }, { "epoch": 0.11, "learning_rate": 9.843289182900911e-06, "loss": 1.011, "step": 4636 }, { "epoch": 0.11, "learning_rate": 9.843195879573418e-06, "loss": 0.8548, "step": 4637 }, { "epoch": 0.11, "learning_rate": 9.843102548920944e-06, "loss": 0.8872, "step": 4638 }, { "epoch": 0.11, "learning_rate": 9.843009190944015e-06, "loss": 0.954, "step": 4639 }, { "epoch": 0.11, "learning_rate": 9.842915805643156e-06, "loss": 0.9705, "step": 4640 }, { "epoch": 0.11, "learning_rate": 9.842822393018897e-06, "loss": 1.152, "step": 4641 }, { "epoch": 0.11, "learning_rate": 9.842728953071763e-06, "loss": 1.0988, "step": 4642 }, { "epoch": 0.11, "learning_rate": 9.842635485802281e-06, "loss": 1.2558, "step": 4643 }, { "epoch": 0.11, "learning_rate": 9.84254199121098e-06, "loss": 0.8765, "step": 4644 }, { "epoch": 0.11, "learning_rate": 9.842448469298386e-06, "loss": 1.204, "step": 4645 }, { "epoch": 0.11, "learning_rate": 9.842354920065028e-06, "loss": 1.222, "step": 4646 }, { "epoch": 0.11, "learning_rate": 9.84226134351143e-06, "loss": 1.1019, "step": 4647 }, { "epoch": 0.11, "learning_rate": 9.842167739638126e-06, "loss": 1.0052, "step": 4648 }, { "epoch": 0.11, "learning_rate": 9.842074108445639e-06, "loss": 1.0686, "step": 4649 }, { "epoch": 0.11, "learning_rate": 9.841980449934501e-06, "loss": 1.3336, "step": 4650 }, { "epoch": 0.11, "learning_rate": 9.841886764105237e-06, "loss": 1.1172, "step": 4651 }, { "epoch": 0.11, "learning_rate": 9.84179305095838e-06, "loss": 1.0168, "step": 4652 }, { "epoch": 0.11, "learning_rate": 9.841699310494452e-06, "loss": 1.1218, "step": 4653 }, { "epoch": 0.11, "learning_rate": 9.841605542713989e-06, "loss": 1.1005, "step": 4654 }, { "epoch": 0.11, "learning_rate": 9.841511747617514e-06, "loss": 0.9442, "step": 4655 }, { "epoch": 0.11, "learning_rate": 9.84141792520556e-06, "loss": 1.1111, "step": 4656 }, { "epoch": 0.11, "learning_rate": 9.841324075478658e-06, "loss": 0.9459, "step": 4657 }, { "epoch": 0.11, "learning_rate": 9.841230198437333e-06, "loss": 1.0281, "step": 4658 }, { "epoch": 0.11, "learning_rate": 9.841136294082116e-06, "loss": 0.9997, "step": 4659 }, { "epoch": 0.11, "learning_rate": 9.841042362413537e-06, "loss": 0.8455, "step": 4660 }, { "epoch": 0.11, "learning_rate": 9.840948403432127e-06, "loss": 1.1992, "step": 4661 }, { "epoch": 0.11, "learning_rate": 9.840854417138416e-06, "loss": 1.1566, "step": 4662 }, { "epoch": 0.11, "learning_rate": 9.840760403532933e-06, "loss": 1.066, "step": 4663 }, { "epoch": 0.11, "learning_rate": 9.84066636261621e-06, "loss": 0.9656, "step": 4664 }, { "epoch": 0.11, "learning_rate": 9.840572294388775e-06, "loss": 1.2495, "step": 4665 }, { "epoch": 0.11, "learning_rate": 9.84047819885116e-06, "loss": 1.144, "step": 4666 }, { "epoch": 0.11, "learning_rate": 9.8403840760039e-06, "loss": 0.9247, "step": 4667 }, { "epoch": 0.11, "learning_rate": 9.840289925847518e-06, "loss": 1.0674, "step": 4668 }, { "epoch": 0.11, "learning_rate": 9.840195748382551e-06, "loss": 0.8327, "step": 4669 }, { "epoch": 0.11, "learning_rate": 9.840101543609529e-06, "loss": 0.9837, "step": 4670 }, { "epoch": 0.11, "learning_rate": 9.840007311528984e-06, "loss": 1.1153, "step": 4671 }, { "epoch": 0.11, "learning_rate": 9.839913052141445e-06, "loss": 1.0469, "step": 4672 }, { "epoch": 0.11, "learning_rate": 9.839818765447448e-06, "loss": 0.8548, "step": 4673 }, { "epoch": 0.11, "learning_rate": 9.839724451447521e-06, "loss": 0.9981, "step": 4674 }, { "epoch": 0.11, "learning_rate": 9.8396301101422e-06, "loss": 0.8657, "step": 4675 }, { "epoch": 0.11, "learning_rate": 9.839535741532014e-06, "loss": 1.105, "step": 4676 }, { "epoch": 0.11, "learning_rate": 9.839441345617496e-06, "loss": 0.7964, "step": 4677 }, { "epoch": 0.11, "learning_rate": 9.83934692239918e-06, "loss": 1.1678, "step": 4678 }, { "epoch": 0.11, "learning_rate": 9.839252471877596e-06, "loss": 1.2015, "step": 4679 }, { "epoch": 0.11, "learning_rate": 9.83915799405328e-06, "loss": 0.9768, "step": 4680 }, { "epoch": 0.11, "learning_rate": 9.839063488926763e-06, "loss": 1.1838, "step": 4681 }, { "epoch": 0.11, "learning_rate": 9.83896895649858e-06, "loss": 0.9042, "step": 4682 }, { "epoch": 0.11, "learning_rate": 9.838874396769264e-06, "loss": 1.0468, "step": 4683 }, { "epoch": 0.11, "learning_rate": 9.838779809739346e-06, "loss": 1.1486, "step": 4684 }, { "epoch": 0.11, "learning_rate": 9.838685195409363e-06, "loss": 0.8772, "step": 4685 }, { "epoch": 0.11, "learning_rate": 9.838590553779845e-06, "loss": 0.891, "step": 4686 }, { "epoch": 0.11, "learning_rate": 9.83849588485133e-06, "loss": 1.2241, "step": 4687 }, { "epoch": 0.11, "learning_rate": 9.83840118862435e-06, "loss": 1.0252, "step": 4688 }, { "epoch": 0.11, "learning_rate": 9.83830646509944e-06, "loss": 1.3133, "step": 4689 }, { "epoch": 0.11, "learning_rate": 9.838211714277133e-06, "loss": 0.9293, "step": 4690 }, { "epoch": 0.11, "learning_rate": 9.838116936157966e-06, "loss": 1.1923, "step": 4691 }, { "epoch": 0.11, "learning_rate": 9.838022130742471e-06, "loss": 0.7959, "step": 4692 }, { "epoch": 0.11, "learning_rate": 9.837927298031185e-06, "loss": 0.9269, "step": 4693 }, { "epoch": 0.11, "learning_rate": 9.837832438024642e-06, "loss": 1.0806, "step": 4694 }, { "epoch": 0.11, "learning_rate": 9.837737550723377e-06, "loss": 1.2701, "step": 4695 }, { "epoch": 0.11, "learning_rate": 9.837642636127927e-06, "loss": 1.0768, "step": 4696 }, { "epoch": 0.11, "learning_rate": 9.837547694238824e-06, "loss": 1.0808, "step": 4697 }, { "epoch": 0.11, "learning_rate": 9.837452725056609e-06, "loss": 0.9601, "step": 4698 }, { "epoch": 0.11, "learning_rate": 9.837357728581813e-06, "loss": 0.9094, "step": 4699 }, { "epoch": 0.11, "learning_rate": 9.837262704814974e-06, "loss": 0.9112, "step": 4700 }, { "epoch": 0.11, "learning_rate": 9.837167653756628e-06, "loss": 1.0257, "step": 4701 }, { "epoch": 0.11, "learning_rate": 9.837072575407312e-06, "loss": 0.9416, "step": 4702 }, { "epoch": 0.11, "learning_rate": 9.83697746976756e-06, "loss": 1.0256, "step": 4703 }, { "epoch": 0.11, "learning_rate": 9.836882336837911e-06, "loss": 0.9364, "step": 4704 }, { "epoch": 0.11, "learning_rate": 9.8367871766189e-06, "loss": 1.3288, "step": 4705 }, { "epoch": 0.11, "learning_rate": 9.836691989111066e-06, "loss": 0.9881, "step": 4706 }, { "epoch": 0.11, "learning_rate": 9.836596774314944e-06, "loss": 1.4394, "step": 4707 }, { "epoch": 0.11, "learning_rate": 9.836501532231071e-06, "loss": 1.0243, "step": 4708 }, { "epoch": 0.11, "learning_rate": 9.836406262859988e-06, "loss": 1.1369, "step": 4709 }, { "epoch": 0.11, "learning_rate": 9.836310966202228e-06, "loss": 1.2568, "step": 4710 }, { "epoch": 0.11, "learning_rate": 9.836215642258331e-06, "loss": 1.066, "step": 4711 }, { "epoch": 0.11, "learning_rate": 9.836120291028834e-06, "loss": 1.0004, "step": 4712 }, { "epoch": 0.11, "learning_rate": 9.836024912514275e-06, "loss": 1.2414, "step": 4713 }, { "epoch": 0.11, "learning_rate": 9.835929506715193e-06, "loss": 1.0569, "step": 4714 }, { "epoch": 0.11, "learning_rate": 9.835834073632125e-06, "loss": 0.9226, "step": 4715 }, { "epoch": 0.11, "learning_rate": 9.83573861326561e-06, "loss": 0.9613, "step": 4716 }, { "epoch": 0.11, "learning_rate": 9.835643125616188e-06, "loss": 1.0387, "step": 4717 }, { "epoch": 0.11, "learning_rate": 9.835547610684395e-06, "loss": 0.8977, "step": 4718 }, { "epoch": 0.11, "learning_rate": 9.835452068470772e-06, "loss": 0.998, "step": 4719 }, { "epoch": 0.11, "learning_rate": 9.835356498975856e-06, "loss": 1.261, "step": 4720 }, { "epoch": 0.11, "learning_rate": 9.83526090220019e-06, "loss": 1.1221, "step": 4721 }, { "epoch": 0.11, "learning_rate": 9.83516527814431e-06, "loss": 0.8859, "step": 4722 }, { "epoch": 0.11, "learning_rate": 9.835069626808755e-06, "loss": 1.2213, "step": 4723 }, { "epoch": 0.11, "learning_rate": 9.834973948194068e-06, "loss": 1.1042, "step": 4724 }, { "epoch": 0.11, "learning_rate": 9.834878242300786e-06, "loss": 1.2309, "step": 4725 }, { "epoch": 0.11, "learning_rate": 9.83478250912945e-06, "loss": 0.9341, "step": 4726 }, { "epoch": 0.11, "learning_rate": 9.8346867486806e-06, "loss": 1.169, "step": 4727 }, { "epoch": 0.11, "learning_rate": 9.834590960954776e-06, "loss": 1.0875, "step": 4728 }, { "epoch": 0.11, "learning_rate": 9.834495145952517e-06, "loss": 1.1521, "step": 4729 }, { "epoch": 0.11, "learning_rate": 9.834399303674367e-06, "loss": 1.1049, "step": 4730 }, { "epoch": 0.11, "learning_rate": 9.834303434120864e-06, "loss": 1.0182, "step": 4731 }, { "epoch": 0.11, "learning_rate": 9.834207537292552e-06, "loss": 0.7973, "step": 4732 }, { "epoch": 0.11, "learning_rate": 9.834111613189968e-06, "loss": 1.0043, "step": 4733 }, { "epoch": 0.11, "learning_rate": 9.834015661813656e-06, "loss": 0.9876, "step": 4734 }, { "epoch": 0.11, "learning_rate": 9.833919683164155e-06, "loss": 1.1208, "step": 4735 }, { "epoch": 0.11, "learning_rate": 9.83382367724201e-06, "loss": 1.0608, "step": 4736 }, { "epoch": 0.11, "learning_rate": 9.833727644047759e-06, "loss": 1.11, "step": 4737 }, { "epoch": 0.11, "learning_rate": 9.833631583581946e-06, "loss": 0.8948, "step": 4738 }, { "epoch": 0.11, "learning_rate": 9.833535495845112e-06, "loss": 1.1552, "step": 4739 }, { "epoch": 0.11, "learning_rate": 9.833439380837802e-06, "loss": 0.7852, "step": 4740 }, { "epoch": 0.11, "learning_rate": 9.833343238560554e-06, "loss": 1.0391, "step": 4741 }, { "epoch": 0.11, "learning_rate": 9.83324706901391e-06, "loss": 1.0616, "step": 4742 }, { "epoch": 0.11, "learning_rate": 9.833150872198417e-06, "loss": 0.9289, "step": 4743 }, { "epoch": 0.11, "learning_rate": 9.833054648114615e-06, "loss": 1.0499, "step": 4744 }, { "epoch": 0.11, "learning_rate": 9.832958396763049e-06, "loss": 1.0522, "step": 4745 }, { "epoch": 0.11, "learning_rate": 9.832862118144259e-06, "loss": 1.2018, "step": 4746 }, { "epoch": 0.11, "learning_rate": 9.832765812258788e-06, "loss": 0.9615, "step": 4747 }, { "epoch": 0.11, "learning_rate": 9.832669479107183e-06, "loss": 1.1902, "step": 4748 }, { "epoch": 0.11, "learning_rate": 9.832573118689986e-06, "loss": 1.131, "step": 4749 }, { "epoch": 0.11, "learning_rate": 9.83247673100774e-06, "loss": 1.1399, "step": 4750 }, { "epoch": 0.11, "learning_rate": 9.832380316060987e-06, "loss": 0.9914, "step": 4751 }, { "epoch": 0.11, "learning_rate": 9.832283873850276e-06, "loss": 1.1381, "step": 4752 }, { "epoch": 0.11, "learning_rate": 9.832187404376146e-06, "loss": 1.0355, "step": 4753 }, { "epoch": 0.11, "learning_rate": 9.832090907639145e-06, "loss": 1.2056, "step": 4754 }, { "epoch": 0.11, "learning_rate": 9.831994383639813e-06, "loss": 1.0744, "step": 4755 }, { "epoch": 0.11, "learning_rate": 9.831897832378701e-06, "loss": 1.1416, "step": 4756 }, { "epoch": 0.11, "learning_rate": 9.831801253856348e-06, "loss": 1.0792, "step": 4757 }, { "epoch": 0.11, "learning_rate": 9.8317046480733e-06, "loss": 0.8965, "step": 4758 }, { "epoch": 0.11, "learning_rate": 9.831608015030104e-06, "loss": 0.9166, "step": 4759 }, { "epoch": 0.11, "learning_rate": 9.831511354727304e-06, "loss": 1.1366, "step": 4760 }, { "epoch": 0.11, "learning_rate": 9.831414667165447e-06, "loss": 0.86, "step": 4761 }, { "epoch": 0.11, "learning_rate": 9.831317952345077e-06, "loss": 1.2048, "step": 4762 }, { "epoch": 0.11, "learning_rate": 9.831221210266736e-06, "loss": 1.4117, "step": 4763 }, { "epoch": 0.11, "learning_rate": 9.831124440930977e-06, "loss": 1.0888, "step": 4764 }, { "epoch": 0.11, "learning_rate": 9.831027644338343e-06, "loss": 0.8154, "step": 4765 }, { "epoch": 0.11, "learning_rate": 9.830930820489377e-06, "loss": 0.9943, "step": 4766 }, { "epoch": 0.11, "learning_rate": 9.83083396938463e-06, "loss": 0.8591, "step": 4767 }, { "epoch": 0.11, "learning_rate": 9.830737091024646e-06, "loss": 1.01, "step": 4768 }, { "epoch": 0.11, "learning_rate": 9.830640185409972e-06, "loss": 1.151, "step": 4769 }, { "epoch": 0.11, "learning_rate": 9.830543252541153e-06, "loss": 0.9812, "step": 4770 }, { "epoch": 0.11, "learning_rate": 9.83044629241874e-06, "loss": 0.9688, "step": 4771 }, { "epoch": 0.11, "learning_rate": 9.830349305043277e-06, "loss": 0.9778, "step": 4772 }, { "epoch": 0.11, "learning_rate": 9.83025229041531e-06, "loss": 1.0801, "step": 4773 }, { "epoch": 0.11, "learning_rate": 9.83015524853539e-06, "loss": 1.1656, "step": 4774 }, { "epoch": 0.11, "learning_rate": 9.830058179404061e-06, "loss": 1.0834, "step": 4775 }, { "epoch": 0.11, "learning_rate": 9.829961083021874e-06, "loss": 1.0, "step": 4776 }, { "epoch": 0.11, "learning_rate": 9.829863959389373e-06, "loss": 1.1742, "step": 4777 }, { "epoch": 0.11, "learning_rate": 9.829766808507111e-06, "loss": 1.0902, "step": 4778 }, { "epoch": 0.11, "learning_rate": 9.829669630375631e-06, "loss": 1.2867, "step": 4779 }, { "epoch": 0.11, "learning_rate": 9.829572424995485e-06, "loss": 1.014, "step": 4780 }, { "epoch": 0.11, "learning_rate": 9.82947519236722e-06, "loss": 0.9868, "step": 4781 }, { "epoch": 0.11, "learning_rate": 9.829377932491382e-06, "loss": 1.3011, "step": 4782 }, { "epoch": 0.11, "learning_rate": 9.829280645368524e-06, "loss": 0.7586, "step": 4783 }, { "epoch": 0.11, "learning_rate": 9.829183330999192e-06, "loss": 0.8442, "step": 4784 }, { "epoch": 0.11, "learning_rate": 9.829085989383937e-06, "loss": 1.021, "step": 4785 }, { "epoch": 0.11, "learning_rate": 9.828988620523307e-06, "loss": 1.1114, "step": 4786 }, { "epoch": 0.11, "learning_rate": 9.828891224417853e-06, "loss": 0.9426, "step": 4787 }, { "epoch": 0.11, "learning_rate": 9.828793801068122e-06, "loss": 1.1603, "step": 4788 }, { "epoch": 0.11, "learning_rate": 9.828696350474665e-06, "loss": 1.1171, "step": 4789 }, { "epoch": 0.11, "learning_rate": 9.82859887263803e-06, "loss": 0.9787, "step": 4790 }, { "epoch": 0.11, "learning_rate": 9.828501367558772e-06, "loss": 1.2569, "step": 4791 }, { "epoch": 0.11, "learning_rate": 9.828403835237435e-06, "loss": 0.9523, "step": 4792 }, { "epoch": 0.11, "learning_rate": 9.828306275674572e-06, "loss": 1.0384, "step": 4793 }, { "epoch": 0.11, "learning_rate": 9.828208688870736e-06, "loss": 0.786, "step": 4794 }, { "epoch": 0.11, "learning_rate": 9.828111074826472e-06, "loss": 1.1575, "step": 4795 }, { "epoch": 0.11, "learning_rate": 9.828013433542335e-06, "loss": 0.9067, "step": 4796 }, { "epoch": 0.11, "learning_rate": 9.827915765018874e-06, "loss": 0.9684, "step": 4797 }, { "epoch": 0.11, "learning_rate": 9.827818069256641e-06, "loss": 1.1393, "step": 4798 }, { "epoch": 0.11, "learning_rate": 9.827720346256188e-06, "loss": 1.1466, "step": 4799 }, { "epoch": 0.11, "learning_rate": 9.827622596018065e-06, "loss": 1.221, "step": 4800 }, { "epoch": 0.11, "learning_rate": 9.827524818542822e-06, "loss": 1.0259, "step": 4801 }, { "epoch": 0.11, "learning_rate": 9.827427013831014e-06, "loss": 1.0399, "step": 4802 }, { "epoch": 0.11, "learning_rate": 9.82732918188319e-06, "loss": 1.0781, "step": 4803 }, { "epoch": 0.11, "learning_rate": 9.827231322699905e-06, "loss": 0.9004, "step": 4804 }, { "epoch": 0.11, "learning_rate": 9.827133436281705e-06, "loss": 1.001, "step": 4805 }, { "epoch": 0.11, "learning_rate": 9.82703552262915e-06, "loss": 0.9033, "step": 4806 }, { "epoch": 0.11, "learning_rate": 9.826937581742787e-06, "loss": 1.044, "step": 4807 }, { "epoch": 0.11, "learning_rate": 9.826839613623173e-06, "loss": 1.1196, "step": 4808 }, { "epoch": 0.11, "learning_rate": 9.826741618270857e-06, "loss": 0.9002, "step": 4809 }, { "epoch": 0.11, "learning_rate": 9.826643595686394e-06, "loss": 1.4547, "step": 4810 }, { "epoch": 0.11, "learning_rate": 9.826545545870333e-06, "loss": 1.1233, "step": 4811 }, { "epoch": 0.11, "learning_rate": 9.826447468823234e-06, "loss": 0.9239, "step": 4812 }, { "epoch": 0.11, "learning_rate": 9.826349364545644e-06, "loss": 1.0502, "step": 4813 }, { "epoch": 0.11, "learning_rate": 9.82625123303812e-06, "loss": 1.0296, "step": 4814 }, { "epoch": 0.11, "learning_rate": 9.826153074301217e-06, "loss": 0.8487, "step": 4815 }, { "epoch": 0.11, "learning_rate": 9.826054888335483e-06, "loss": 0.8583, "step": 4816 }, { "epoch": 0.11, "learning_rate": 9.825956675141478e-06, "loss": 1.2933, "step": 4817 }, { "epoch": 0.11, "learning_rate": 9.825858434719754e-06, "loss": 1.1714, "step": 4818 }, { "epoch": 0.11, "learning_rate": 9.825760167070863e-06, "loss": 1.1246, "step": 4819 }, { "epoch": 0.11, "learning_rate": 9.825661872195362e-06, "loss": 1.538, "step": 4820 }, { "epoch": 0.11, "learning_rate": 9.825563550093806e-06, "loss": 0.923, "step": 4821 }, { "epoch": 0.11, "learning_rate": 9.825465200766748e-06, "loss": 1.1286, "step": 4822 }, { "epoch": 0.11, "learning_rate": 9.825366824214743e-06, "loss": 0.9986, "step": 4823 }, { "epoch": 0.11, "learning_rate": 9.825268420438347e-06, "loss": 1.2663, "step": 4824 }, { "epoch": 0.11, "learning_rate": 9.825169989438117e-06, "loss": 1.1323, "step": 4825 }, { "epoch": 0.11, "learning_rate": 9.825071531214603e-06, "loss": 1.0077, "step": 4826 }, { "epoch": 0.11, "learning_rate": 9.824973045768364e-06, "loss": 1.2894, "step": 4827 }, { "epoch": 0.11, "learning_rate": 9.824874533099957e-06, "loss": 1.122, "step": 4828 }, { "epoch": 0.11, "learning_rate": 9.824775993209935e-06, "loss": 0.8631, "step": 4829 }, { "epoch": 0.11, "learning_rate": 9.824677426098855e-06, "loss": 0.9904, "step": 4830 }, { "epoch": 0.11, "learning_rate": 9.824578831767273e-06, "loss": 1.1022, "step": 4831 }, { "epoch": 0.11, "learning_rate": 9.824480210215747e-06, "loss": 0.9312, "step": 4832 }, { "epoch": 0.11, "learning_rate": 9.824381561444828e-06, "loss": 0.9515, "step": 4833 }, { "epoch": 0.11, "learning_rate": 9.824282885455081e-06, "loss": 0.9026, "step": 4834 }, { "epoch": 0.11, "learning_rate": 9.824184182247056e-06, "loss": 1.3674, "step": 4835 }, { "epoch": 0.11, "learning_rate": 9.824085451821313e-06, "loss": 1.1058, "step": 4836 }, { "epoch": 0.11, "learning_rate": 9.823986694178406e-06, "loss": 0.8671, "step": 4837 }, { "epoch": 0.11, "learning_rate": 9.823887909318894e-06, "loss": 1.1645, "step": 4838 }, { "epoch": 0.11, "learning_rate": 9.823789097243337e-06, "loss": 1.1309, "step": 4839 }, { "epoch": 0.11, "learning_rate": 9.823690257952288e-06, "loss": 0.9169, "step": 4840 }, { "epoch": 0.11, "learning_rate": 9.823591391446308e-06, "loss": 0.8322, "step": 4841 }, { "epoch": 0.11, "learning_rate": 9.823492497725953e-06, "loss": 1.1295, "step": 4842 }, { "epoch": 0.11, "learning_rate": 9.82339357679178e-06, "loss": 1.0484, "step": 4843 }, { "epoch": 0.11, "learning_rate": 9.823294628644352e-06, "loss": 1.0657, "step": 4844 }, { "epoch": 0.11, "learning_rate": 9.82319565328422e-06, "loss": 1.2592, "step": 4845 }, { "epoch": 0.11, "learning_rate": 9.823096650711948e-06, "loss": 1.0243, "step": 4846 }, { "epoch": 0.11, "learning_rate": 9.822997620928092e-06, "loss": 1.0725, "step": 4847 }, { "epoch": 0.11, "learning_rate": 9.822898563933213e-06, "loss": 1.4573, "step": 4848 }, { "epoch": 0.11, "learning_rate": 9.822799479727866e-06, "loss": 0.9736, "step": 4849 }, { "epoch": 0.11, "learning_rate": 9.822700368312616e-06, "loss": 1.1632, "step": 4850 }, { "epoch": 0.11, "learning_rate": 9.822601229688016e-06, "loss": 1.0702, "step": 4851 }, { "epoch": 0.11, "learning_rate": 9.822502063854629e-06, "loss": 1.0281, "step": 4852 }, { "epoch": 0.11, "learning_rate": 9.82240287081301e-06, "loss": 0.9547, "step": 4853 }, { "epoch": 0.11, "learning_rate": 9.822303650563727e-06, "loss": 0.841, "step": 4854 }, { "epoch": 0.11, "learning_rate": 9.822204403107332e-06, "loss": 1.1065, "step": 4855 }, { "epoch": 0.11, "learning_rate": 9.822105128444389e-06, "loss": 1.1012, "step": 4856 }, { "epoch": 0.11, "learning_rate": 9.822005826575455e-06, "loss": 1.0933, "step": 4857 }, { "epoch": 0.11, "learning_rate": 9.821906497501093e-06, "loss": 0.929, "step": 4858 }, { "epoch": 0.11, "learning_rate": 9.821807141221863e-06, "loss": 0.9192, "step": 4859 }, { "epoch": 0.11, "learning_rate": 9.821707757738326e-06, "loss": 1.0454, "step": 4860 }, { "epoch": 0.11, "learning_rate": 9.82160834705104e-06, "loss": 1.0916, "step": 4861 }, { "epoch": 0.11, "learning_rate": 9.821508909160569e-06, "loss": 1.051, "step": 4862 }, { "epoch": 0.11, "learning_rate": 9.821409444067472e-06, "loss": 1.1079, "step": 4863 }, { "epoch": 0.11, "learning_rate": 9.821309951772312e-06, "loss": 1.3939, "step": 4864 }, { "epoch": 0.11, "learning_rate": 9.821210432275646e-06, "loss": 1.2416, "step": 4865 }, { "epoch": 0.11, "learning_rate": 9.821110885578041e-06, "loss": 1.2349, "step": 4866 }, { "epoch": 0.11, "learning_rate": 9.821011311680057e-06, "loss": 1.1644, "step": 4867 }, { "epoch": 0.11, "learning_rate": 9.820911710582253e-06, "loss": 1.3102, "step": 4868 }, { "epoch": 0.11, "learning_rate": 9.820812082285196e-06, "loss": 0.9136, "step": 4869 }, { "epoch": 0.11, "learning_rate": 9.820712426789443e-06, "loss": 1.1643, "step": 4870 }, { "epoch": 0.11, "learning_rate": 9.820612744095557e-06, "loss": 1.3268, "step": 4871 }, { "epoch": 0.11, "learning_rate": 9.820513034204104e-06, "loss": 1.3645, "step": 4872 }, { "epoch": 0.11, "learning_rate": 9.820413297115645e-06, "loss": 1.0396, "step": 4873 }, { "epoch": 0.11, "learning_rate": 9.820313532830741e-06, "loss": 1.1273, "step": 4874 }, { "epoch": 0.11, "learning_rate": 9.820213741349956e-06, "loss": 1.1977, "step": 4875 }, { "epoch": 0.11, "learning_rate": 9.820113922673853e-06, "loss": 1.1492, "step": 4876 }, { "epoch": 0.11, "learning_rate": 9.820014076802996e-06, "loss": 0.9647, "step": 4877 }, { "epoch": 0.11, "learning_rate": 9.819914203737945e-06, "loss": 1.0392, "step": 4878 }, { "epoch": 0.11, "learning_rate": 9.819814303479268e-06, "loss": 1.5934, "step": 4879 }, { "epoch": 0.11, "learning_rate": 9.819714376027524e-06, "loss": 1.114, "step": 4880 }, { "epoch": 0.11, "learning_rate": 9.819614421383282e-06, "loss": 0.8686, "step": 4881 }, { "epoch": 0.11, "learning_rate": 9.819514439547104e-06, "loss": 1.1339, "step": 4882 }, { "epoch": 0.11, "learning_rate": 9.819414430519552e-06, "loss": 1.0272, "step": 4883 }, { "epoch": 0.11, "learning_rate": 9.81931439430119e-06, "loss": 1.0577, "step": 4884 }, { "epoch": 0.11, "learning_rate": 9.819214330892586e-06, "loss": 0.7781, "step": 4885 }, { "epoch": 0.11, "learning_rate": 9.819114240294301e-06, "loss": 1.0153, "step": 4886 }, { "epoch": 0.11, "learning_rate": 9.819014122506902e-06, "loss": 1.0303, "step": 4887 }, { "epoch": 0.11, "learning_rate": 9.818913977530955e-06, "loss": 1.0579, "step": 4888 }, { "epoch": 0.11, "learning_rate": 9.81881380536702e-06, "loss": 1.1436, "step": 4889 }, { "epoch": 0.11, "learning_rate": 9.818713606015667e-06, "loss": 0.9254, "step": 4890 }, { "epoch": 0.11, "learning_rate": 9.81861337947746e-06, "loss": 0.9343, "step": 4891 }, { "epoch": 0.11, "learning_rate": 9.818513125752962e-06, "loss": 0.9887, "step": 4892 }, { "epoch": 0.11, "learning_rate": 9.818412844842744e-06, "loss": 1.0856, "step": 4893 }, { "epoch": 0.11, "learning_rate": 9.818312536747367e-06, "loss": 1.0596, "step": 4894 }, { "epoch": 0.11, "learning_rate": 9.818212201467396e-06, "loss": 1.3783, "step": 4895 }, { "epoch": 0.11, "learning_rate": 9.818111839003402e-06, "loss": 0.9986, "step": 4896 }, { "epoch": 0.11, "learning_rate": 9.818011449355949e-06, "loss": 1.0592, "step": 4897 }, { "epoch": 0.11, "learning_rate": 9.817911032525602e-06, "loss": 0.8886, "step": 4898 }, { "epoch": 0.11, "learning_rate": 9.817810588512929e-06, "loss": 0.8557, "step": 4899 }, { "epoch": 0.11, "learning_rate": 9.817710117318498e-06, "loss": 1.1824, "step": 4900 }, { "epoch": 0.11, "learning_rate": 9.817609618942872e-06, "loss": 0.9596, "step": 4901 }, { "epoch": 0.11, "learning_rate": 9.817509093386621e-06, "loss": 0.9156, "step": 4902 }, { "epoch": 0.11, "learning_rate": 9.81740854065031e-06, "loss": 1.2682, "step": 4903 }, { "epoch": 0.11, "learning_rate": 9.81730796073451e-06, "loss": 1.1482, "step": 4904 }, { "epoch": 0.11, "learning_rate": 9.817207353639785e-06, "loss": 0.8179, "step": 4905 }, { "epoch": 0.11, "learning_rate": 9.817106719366704e-06, "loss": 1.04, "step": 4906 }, { "epoch": 0.11, "learning_rate": 9.817006057915835e-06, "loss": 1.1361, "step": 4907 }, { "epoch": 0.11, "learning_rate": 9.816905369287743e-06, "loss": 0.9873, "step": 4908 }, { "epoch": 0.11, "learning_rate": 9.816804653483001e-06, "loss": 0.9805, "step": 4909 }, { "epoch": 0.11, "learning_rate": 9.816703910502175e-06, "loss": 1.2106, "step": 4910 }, { "epoch": 0.11, "learning_rate": 9.816603140345833e-06, "loss": 0.9913, "step": 4911 }, { "epoch": 0.11, "learning_rate": 9.816502343014542e-06, "loss": 1.0378, "step": 4912 }, { "epoch": 0.11, "learning_rate": 9.816401518508873e-06, "loss": 1.1237, "step": 4913 }, { "epoch": 0.11, "learning_rate": 9.816300666829396e-06, "loss": 1.0816, "step": 4914 }, { "epoch": 0.11, "learning_rate": 9.816199787976677e-06, "loss": 0.8629, "step": 4915 }, { "epoch": 0.11, "learning_rate": 9.816098881951286e-06, "loss": 1.0758, "step": 4916 }, { "epoch": 0.11, "learning_rate": 9.815997948753792e-06, "loss": 1.0048, "step": 4917 }, { "epoch": 0.11, "learning_rate": 9.815896988384768e-06, "loss": 0.9977, "step": 4918 }, { "epoch": 0.11, "learning_rate": 9.815796000844779e-06, "loss": 1.0706, "step": 4919 }, { "epoch": 0.11, "learning_rate": 9.815694986134397e-06, "loss": 0.7954, "step": 4920 }, { "epoch": 0.11, "learning_rate": 9.81559394425419e-06, "loss": 1.2219, "step": 4921 }, { "epoch": 0.11, "learning_rate": 9.81549287520473e-06, "loss": 1.1493, "step": 4922 }, { "epoch": 0.11, "learning_rate": 9.815391778986589e-06, "loss": 0.909, "step": 4923 }, { "epoch": 0.11, "learning_rate": 9.815290655600333e-06, "loss": 1.1123, "step": 4924 }, { "epoch": 0.11, "learning_rate": 9.815189505046534e-06, "loss": 1.1149, "step": 4925 }, { "epoch": 0.11, "learning_rate": 9.815088327325766e-06, "loss": 1.1156, "step": 4926 }, { "epoch": 0.11, "learning_rate": 9.814987122438595e-06, "loss": 1.1961, "step": 4927 }, { "epoch": 0.11, "learning_rate": 9.814885890385595e-06, "loss": 0.9232, "step": 4928 }, { "epoch": 0.11, "learning_rate": 9.814784631167335e-06, "loss": 0.9983, "step": 4929 }, { "epoch": 0.11, "learning_rate": 9.81468334478439e-06, "loss": 1.0216, "step": 4930 }, { "epoch": 0.11, "learning_rate": 9.814582031237328e-06, "loss": 1.0113, "step": 4931 }, { "epoch": 0.11, "learning_rate": 9.81448069052672e-06, "loss": 1.0106, "step": 4932 }, { "epoch": 0.11, "learning_rate": 9.814379322653142e-06, "loss": 0.9002, "step": 4933 }, { "epoch": 0.11, "learning_rate": 9.814277927617162e-06, "loss": 1.1867, "step": 4934 }, { "epoch": 0.11, "learning_rate": 9.814176505419353e-06, "loss": 0.9051, "step": 4935 }, { "epoch": 0.11, "learning_rate": 9.814075056060287e-06, "loss": 1.1354, "step": 4936 }, { "epoch": 0.11, "learning_rate": 9.81397357954054e-06, "loss": 0.9757, "step": 4937 }, { "epoch": 0.11, "learning_rate": 9.81387207586068e-06, "loss": 1.2557, "step": 4938 }, { "epoch": 0.11, "learning_rate": 9.81377054502128e-06, "loss": 1.2489, "step": 4939 }, { "epoch": 0.11, "learning_rate": 9.813668987022916e-06, "loss": 1.0214, "step": 4940 }, { "epoch": 0.11, "learning_rate": 9.813567401866157e-06, "loss": 1.2055, "step": 4941 }, { "epoch": 0.11, "learning_rate": 9.81346578955158e-06, "loss": 1.0642, "step": 4942 }, { "epoch": 0.11, "learning_rate": 9.813364150079754e-06, "loss": 0.9616, "step": 4943 }, { "epoch": 0.11, "learning_rate": 9.813262483451257e-06, "loss": 1.1628, "step": 4944 }, { "epoch": 0.11, "learning_rate": 9.81316078966666e-06, "loss": 1.125, "step": 4945 }, { "epoch": 0.11, "learning_rate": 9.813059068726538e-06, "loss": 1.0017, "step": 4946 }, { "epoch": 0.11, "learning_rate": 9.812957320631462e-06, "loss": 1.2364, "step": 4947 }, { "epoch": 0.11, "learning_rate": 9.81285554538201e-06, "loss": 0.7565, "step": 4948 }, { "epoch": 0.11, "learning_rate": 9.812753742978753e-06, "loss": 0.9682, "step": 4949 }, { "epoch": 0.11, "learning_rate": 9.812651913422268e-06, "loss": 1.2865, "step": 4950 }, { "epoch": 0.11, "learning_rate": 9.812550056713128e-06, "loss": 0.9695, "step": 4951 }, { "epoch": 0.11, "learning_rate": 9.812448172851907e-06, "loss": 1.1303, "step": 4952 }, { "epoch": 0.11, "learning_rate": 9.812346261839182e-06, "loss": 1.1666, "step": 4953 }, { "epoch": 0.11, "learning_rate": 9.812244323675526e-06, "loss": 1.257, "step": 4954 }, { "epoch": 0.11, "learning_rate": 9.812142358361516e-06, "loss": 1.1314, "step": 4955 }, { "epoch": 0.11, "learning_rate": 9.812040365897725e-06, "loss": 1.2849, "step": 4956 }, { "epoch": 0.11, "learning_rate": 9.811938346284728e-06, "loss": 0.8982, "step": 4957 }, { "epoch": 0.11, "learning_rate": 9.811836299523105e-06, "loss": 1.0011, "step": 4958 }, { "epoch": 0.12, "learning_rate": 9.811734225613427e-06, "loss": 1.1058, "step": 4959 }, { "epoch": 0.12, "learning_rate": 9.811632124556273e-06, "loss": 0.8336, "step": 4960 }, { "epoch": 0.12, "learning_rate": 9.811529996352217e-06, "loss": 1.1246, "step": 4961 }, { "epoch": 0.12, "learning_rate": 9.811427841001837e-06, "loss": 0.7776, "step": 4962 }, { "epoch": 0.12, "learning_rate": 9.811325658505708e-06, "loss": 1.0289, "step": 4963 }, { "epoch": 0.12, "learning_rate": 9.811223448864407e-06, "loss": 1.0671, "step": 4964 }, { "epoch": 0.12, "learning_rate": 9.81112121207851e-06, "loss": 1.075, "step": 4965 }, { "epoch": 0.12, "learning_rate": 9.811018948148594e-06, "loss": 1.0895, "step": 4966 }, { "epoch": 0.12, "learning_rate": 9.810916657075238e-06, "loss": 0.8671, "step": 4967 }, { "epoch": 0.12, "learning_rate": 9.810814338859016e-06, "loss": 0.9457, "step": 4968 }, { "epoch": 0.12, "learning_rate": 9.810711993500506e-06, "loss": 0.9413, "step": 4969 }, { "epoch": 0.12, "learning_rate": 9.81060962100029e-06, "loss": 1.0437, "step": 4970 }, { "epoch": 0.12, "learning_rate": 9.810507221358938e-06, "loss": 1.1958, "step": 4971 }, { "epoch": 0.12, "learning_rate": 9.810404794577031e-06, "loss": 0.8771, "step": 4972 }, { "epoch": 0.12, "learning_rate": 9.81030234065515e-06, "loss": 1.0453, "step": 4973 }, { "epoch": 0.12, "learning_rate": 9.81019985959387e-06, "loss": 0.9612, "step": 4974 }, { "epoch": 0.12, "learning_rate": 9.810097351393768e-06, "loss": 1.1381, "step": 4975 }, { "epoch": 0.12, "learning_rate": 9.809994816055426e-06, "loss": 1.0869, "step": 4976 }, { "epoch": 0.12, "learning_rate": 9.809892253579418e-06, "loss": 1.0112, "step": 4977 }, { "epoch": 0.12, "learning_rate": 9.809789663966327e-06, "loss": 1.0324, "step": 4978 }, { "epoch": 0.12, "learning_rate": 9.80968704721673e-06, "loss": 1.2346, "step": 4979 }, { "epoch": 0.12, "learning_rate": 9.809584403331205e-06, "loss": 1.1252, "step": 4980 }, { "epoch": 0.12, "learning_rate": 9.80948173231033e-06, "loss": 1.0428, "step": 4981 }, { "epoch": 0.12, "learning_rate": 9.80937903415469e-06, "loss": 1.1136, "step": 4982 }, { "epoch": 0.12, "learning_rate": 9.809276308864857e-06, "loss": 1.0277, "step": 4983 }, { "epoch": 0.12, "learning_rate": 9.809173556441417e-06, "loss": 0.9966, "step": 4984 }, { "epoch": 0.12, "learning_rate": 9.809070776884945e-06, "loss": 0.9625, "step": 4985 }, { "epoch": 0.12, "learning_rate": 9.808967970196026e-06, "loss": 1.1343, "step": 4986 }, { "epoch": 0.12, "learning_rate": 9.808865136375235e-06, "loss": 0.9406, "step": 4987 }, { "epoch": 0.12, "learning_rate": 9.808762275423152e-06, "loss": 0.99, "step": 4988 }, { "epoch": 0.12, "learning_rate": 9.80865938734036e-06, "loss": 1.0856, "step": 4989 }, { "epoch": 0.12, "learning_rate": 9.808556472127441e-06, "loss": 1.2605, "step": 4990 }, { "epoch": 0.12, "learning_rate": 9.808453529784972e-06, "loss": 1.1191, "step": 4991 }, { "epoch": 0.12, "learning_rate": 9.808350560313535e-06, "loss": 0.6472, "step": 4992 }, { "epoch": 0.12, "learning_rate": 9.808247563713712e-06, "loss": 1.059, "step": 4993 }, { "epoch": 0.12, "learning_rate": 9.808144539986083e-06, "loss": 0.9603, "step": 4994 }, { "epoch": 0.12, "learning_rate": 9.808041489131229e-06, "loss": 0.9356, "step": 4995 }, { "epoch": 0.12, "learning_rate": 9.807938411149734e-06, "loss": 0.921, "step": 4996 }, { "epoch": 0.12, "learning_rate": 9.807835306042176e-06, "loss": 0.8896, "step": 4997 }, { "epoch": 0.12, "learning_rate": 9.807732173809137e-06, "loss": 1.0751, "step": 4998 }, { "epoch": 0.12, "learning_rate": 9.8076290144512e-06, "loss": 0.9275, "step": 4999 }, { "epoch": 0.12, "learning_rate": 9.807525827968948e-06, "loss": 1.2088, "step": 5000 }, { "epoch": 0.12, "learning_rate": 9.807422614362965e-06, "loss": 0.815, "step": 5001 }, { "epoch": 0.12, "learning_rate": 9.807319373633828e-06, "loss": 1.0044, "step": 5002 }, { "epoch": 0.12, "learning_rate": 9.807216105782123e-06, "loss": 0.9744, "step": 5003 }, { "epoch": 0.12, "learning_rate": 9.80711281080843e-06, "loss": 1.0539, "step": 5004 }, { "epoch": 0.12, "learning_rate": 9.807009488713336e-06, "loss": 0.8783, "step": 5005 }, { "epoch": 0.12, "learning_rate": 9.806906139497418e-06, "loss": 1.0849, "step": 5006 }, { "epoch": 0.12, "learning_rate": 9.806802763161266e-06, "loss": 0.9507, "step": 5007 }, { "epoch": 0.12, "learning_rate": 9.806699359705458e-06, "loss": 0.8508, "step": 5008 }, { "epoch": 0.12, "learning_rate": 9.80659592913058e-06, "loss": 1.3654, "step": 5009 }, { "epoch": 0.12, "learning_rate": 9.806492471437215e-06, "loss": 1.0039, "step": 5010 }, { "epoch": 0.12, "learning_rate": 9.806388986625944e-06, "loss": 0.9189, "step": 5011 }, { "epoch": 0.12, "learning_rate": 9.806285474697354e-06, "loss": 1.136, "step": 5012 }, { "epoch": 0.12, "learning_rate": 9.80618193565203e-06, "loss": 1.133, "step": 5013 }, { "epoch": 0.12, "learning_rate": 9.806078369490555e-06, "loss": 1.1865, "step": 5014 }, { "epoch": 0.12, "learning_rate": 9.80597477621351e-06, "loss": 1.4007, "step": 5015 }, { "epoch": 0.12, "learning_rate": 9.805871155821485e-06, "loss": 1.1725, "step": 5016 }, { "epoch": 0.12, "learning_rate": 9.805767508315061e-06, "loss": 1.0508, "step": 5017 }, { "epoch": 0.12, "learning_rate": 9.805663833694822e-06, "loss": 1.0091, "step": 5018 }, { "epoch": 0.12, "learning_rate": 9.805560131961355e-06, "loss": 0.9199, "step": 5019 }, { "epoch": 0.12, "learning_rate": 9.805456403115246e-06, "loss": 0.9912, "step": 5020 }, { "epoch": 0.12, "learning_rate": 9.805352647157078e-06, "loss": 0.9276, "step": 5021 }, { "epoch": 0.12, "learning_rate": 9.805248864087437e-06, "loss": 1.2803, "step": 5022 }, { "epoch": 0.12, "learning_rate": 9.805145053906908e-06, "loss": 0.9343, "step": 5023 }, { "epoch": 0.12, "learning_rate": 9.80504121661608e-06, "loss": 0.8692, "step": 5024 }, { "epoch": 0.12, "learning_rate": 9.804937352215535e-06, "loss": 1.3074, "step": 5025 }, { "epoch": 0.12, "learning_rate": 9.80483346070586e-06, "loss": 1.1617, "step": 5026 }, { "epoch": 0.12, "learning_rate": 9.804729542087641e-06, "loss": 1.2565, "step": 5027 }, { "epoch": 0.12, "learning_rate": 9.804625596361466e-06, "loss": 1.1558, "step": 5028 }, { "epoch": 0.12, "learning_rate": 9.804521623527918e-06, "loss": 1.0588, "step": 5029 }, { "epoch": 0.12, "learning_rate": 9.804417623587587e-06, "loss": 1.0702, "step": 5030 }, { "epoch": 0.12, "learning_rate": 9.80431359654106e-06, "loss": 0.9001, "step": 5031 }, { "epoch": 0.12, "learning_rate": 9.804209542388921e-06, "loss": 0.8961, "step": 5032 }, { "epoch": 0.12, "learning_rate": 9.804105461131759e-06, "loss": 0.7835, "step": 5033 }, { "epoch": 0.12, "learning_rate": 9.80400135277016e-06, "loss": 1.0663, "step": 5034 }, { "epoch": 0.12, "learning_rate": 9.803897217304713e-06, "loss": 1.0702, "step": 5035 }, { "epoch": 0.12, "learning_rate": 9.803793054736004e-06, "loss": 1.0519, "step": 5036 }, { "epoch": 0.12, "learning_rate": 9.803688865064621e-06, "loss": 1.0917, "step": 5037 }, { "epoch": 0.12, "learning_rate": 9.803584648291154e-06, "loss": 0.8893, "step": 5038 }, { "epoch": 0.12, "learning_rate": 9.803480404416188e-06, "loss": 1.1306, "step": 5039 }, { "epoch": 0.12, "learning_rate": 9.803376133440313e-06, "loss": 1.2193, "step": 5040 }, { "epoch": 0.12, "learning_rate": 9.803271835364115e-06, "loss": 0.972, "step": 5041 }, { "epoch": 0.12, "learning_rate": 9.803167510188186e-06, "loss": 0.9426, "step": 5042 }, { "epoch": 0.12, "learning_rate": 9.803063157913111e-06, "loss": 0.9276, "step": 5043 }, { "epoch": 0.12, "learning_rate": 9.80295877853948e-06, "loss": 1.247, "step": 5044 }, { "epoch": 0.12, "learning_rate": 9.802854372067885e-06, "loss": 1.0672, "step": 5045 }, { "epoch": 0.12, "learning_rate": 9.80274993849891e-06, "loss": 0.9956, "step": 5046 }, { "epoch": 0.12, "learning_rate": 9.802645477833147e-06, "loss": 1.092, "step": 5047 }, { "epoch": 0.12, "learning_rate": 9.802540990071185e-06, "loss": 0.8571, "step": 5048 }, { "epoch": 0.12, "learning_rate": 9.802436475213613e-06, "loss": 1.1011, "step": 5049 }, { "epoch": 0.12, "learning_rate": 9.802331933261022e-06, "loss": 1.0115, "step": 5050 }, { "epoch": 0.12, "learning_rate": 9.802227364214e-06, "loss": 0.8968, "step": 5051 }, { "epoch": 0.12, "learning_rate": 9.802122768073138e-06, "loss": 1.0001, "step": 5052 }, { "epoch": 0.12, "learning_rate": 9.802018144839027e-06, "loss": 1.0598, "step": 5053 }, { "epoch": 0.12, "learning_rate": 9.801913494512253e-06, "loss": 1.0158, "step": 5054 }, { "epoch": 0.12, "learning_rate": 9.801808817093414e-06, "loss": 1.2278, "step": 5055 }, { "epoch": 0.12, "learning_rate": 9.801704112583095e-06, "loss": 0.9049, "step": 5056 }, { "epoch": 0.12, "learning_rate": 9.801599380981886e-06, "loss": 0.946, "step": 5057 }, { "epoch": 0.12, "learning_rate": 9.801494622290381e-06, "loss": 0.9451, "step": 5058 }, { "epoch": 0.12, "learning_rate": 9.801389836509172e-06, "loss": 0.8694, "step": 5059 }, { "epoch": 0.12, "learning_rate": 9.801285023638846e-06, "loss": 0.9531, "step": 5060 }, { "epoch": 0.12, "learning_rate": 9.801180183679996e-06, "loss": 0.872, "step": 5061 }, { "epoch": 0.12, "learning_rate": 9.801075316633215e-06, "loss": 1.2542, "step": 5062 }, { "epoch": 0.12, "learning_rate": 9.800970422499095e-06, "loss": 1.2482, "step": 5063 }, { "epoch": 0.12, "learning_rate": 9.800865501278224e-06, "loss": 0.9952, "step": 5064 }, { "epoch": 0.12, "learning_rate": 9.800760552971197e-06, "loss": 1.1283, "step": 5065 }, { "epoch": 0.12, "learning_rate": 9.800655577578607e-06, "loss": 1.0143, "step": 5066 }, { "epoch": 0.12, "learning_rate": 9.800550575101041e-06, "loss": 0.9996, "step": 5067 }, { "epoch": 0.12, "learning_rate": 9.8004455455391e-06, "loss": 1.1791, "step": 5068 }, { "epoch": 0.12, "learning_rate": 9.80034048889337e-06, "loss": 1.2473, "step": 5069 }, { "epoch": 0.12, "learning_rate": 9.800235405164445e-06, "loss": 1.2119, "step": 5070 }, { "epoch": 0.12, "learning_rate": 9.800130294352918e-06, "loss": 1.0008, "step": 5071 }, { "epoch": 0.12, "learning_rate": 9.800025156459382e-06, "loss": 0.8901, "step": 5072 }, { "epoch": 0.12, "learning_rate": 9.799919991484431e-06, "loss": 1.188, "step": 5073 }, { "epoch": 0.12, "learning_rate": 9.799814799428658e-06, "loss": 1.1111, "step": 5074 }, { "epoch": 0.12, "learning_rate": 9.799709580292658e-06, "loss": 0.8965, "step": 5075 }, { "epoch": 0.12, "learning_rate": 9.79960433407702e-06, "loss": 1.1625, "step": 5076 }, { "epoch": 0.12, "learning_rate": 9.799499060782343e-06, "loss": 0.6565, "step": 5077 }, { "epoch": 0.12, "learning_rate": 9.79939376040922e-06, "loss": 0.8848, "step": 5078 }, { "epoch": 0.12, "learning_rate": 9.79928843295824e-06, "loss": 1.3745, "step": 5079 }, { "epoch": 0.12, "learning_rate": 9.799183078430004e-06, "loss": 1.0747, "step": 5080 }, { "epoch": 0.12, "learning_rate": 9.799077696825103e-06, "loss": 0.871, "step": 5081 }, { "epoch": 0.12, "learning_rate": 9.798972288144131e-06, "loss": 0.9861, "step": 5082 }, { "epoch": 0.12, "learning_rate": 9.798866852387685e-06, "loss": 1.1251, "step": 5083 }, { "epoch": 0.12, "learning_rate": 9.798761389556358e-06, "loss": 1.1651, "step": 5084 }, { "epoch": 0.12, "learning_rate": 9.798655899650746e-06, "loss": 1.1919, "step": 5085 }, { "epoch": 0.12, "learning_rate": 9.798550382671443e-06, "loss": 1.1611, "step": 5086 }, { "epoch": 0.12, "learning_rate": 9.798444838619047e-06, "loss": 1.1071, "step": 5087 }, { "epoch": 0.12, "learning_rate": 9.79833926749415e-06, "loss": 1.1308, "step": 5088 }, { "epoch": 0.12, "learning_rate": 9.79823366929735e-06, "loss": 1.0927, "step": 5089 }, { "epoch": 0.12, "learning_rate": 9.79812804402924e-06, "loss": 1.1466, "step": 5090 }, { "epoch": 0.12, "learning_rate": 9.79802239169042e-06, "loss": 0.9927, "step": 5091 }, { "epoch": 0.12, "learning_rate": 9.797916712281485e-06, "loss": 0.9512, "step": 5092 }, { "epoch": 0.12, "learning_rate": 9.79781100580303e-06, "loss": 0.9244, "step": 5093 }, { "epoch": 0.12, "learning_rate": 9.797705272255649e-06, "loss": 0.6933, "step": 5094 }, { "epoch": 0.12, "learning_rate": 9.797599511639943e-06, "loss": 1.1374, "step": 5095 }, { "epoch": 0.12, "learning_rate": 9.797493723956505e-06, "loss": 1.0913, "step": 5096 }, { "epoch": 0.12, "learning_rate": 9.797387909205936e-06, "loss": 1.0621, "step": 5097 }, { "epoch": 0.12, "learning_rate": 9.797282067388831e-06, "loss": 1.2803, "step": 5098 }, { "epoch": 0.12, "learning_rate": 9.797176198505786e-06, "loss": 1.0322, "step": 5099 }, { "epoch": 0.12, "learning_rate": 9.797070302557398e-06, "loss": 0.9699, "step": 5100 }, { "epoch": 0.12, "learning_rate": 9.796964379544267e-06, "loss": 1.137, "step": 5101 }, { "epoch": 0.12, "learning_rate": 9.79685842946699e-06, "loss": 1.0165, "step": 5102 }, { "epoch": 0.12, "learning_rate": 9.796752452326164e-06, "loss": 1.2094, "step": 5103 }, { "epoch": 0.12, "learning_rate": 9.796646448122384e-06, "loss": 1.0051, "step": 5104 }, { "epoch": 0.12, "learning_rate": 9.796540416856255e-06, "loss": 1.1513, "step": 5105 }, { "epoch": 0.12, "learning_rate": 9.796434358528368e-06, "loss": 1.011, "step": 5106 }, { "epoch": 0.12, "learning_rate": 9.796328273139326e-06, "loss": 1.0232, "step": 5107 }, { "epoch": 0.12, "learning_rate": 9.796222160689726e-06, "loss": 0.9757, "step": 5108 }, { "epoch": 0.12, "learning_rate": 9.796116021180167e-06, "loss": 0.906, "step": 5109 }, { "epoch": 0.12, "learning_rate": 9.796009854611248e-06, "loss": 0.902, "step": 5110 }, { "epoch": 0.12, "learning_rate": 9.795903660983567e-06, "loss": 1.1268, "step": 5111 }, { "epoch": 0.12, "learning_rate": 9.795797440297723e-06, "loss": 1.0955, "step": 5112 }, { "epoch": 0.12, "learning_rate": 9.795691192554318e-06, "loss": 0.6825, "step": 5113 }, { "epoch": 0.12, "learning_rate": 9.795584917753948e-06, "loss": 0.9894, "step": 5114 }, { "epoch": 0.12, "learning_rate": 9.795478615897215e-06, "loss": 1.073, "step": 5115 }, { "epoch": 0.12, "learning_rate": 9.795372286984716e-06, "loss": 1.342, "step": 5116 }, { "epoch": 0.12, "learning_rate": 9.795265931017055e-06, "loss": 1.0251, "step": 5117 }, { "epoch": 0.12, "learning_rate": 9.79515954799483e-06, "loss": 1.2522, "step": 5118 }, { "epoch": 0.12, "learning_rate": 9.79505313791864e-06, "loss": 0.8795, "step": 5119 }, { "epoch": 0.12, "learning_rate": 9.794946700789084e-06, "loss": 1.0077, "step": 5120 }, { "epoch": 0.12, "learning_rate": 9.79484023660677e-06, "loss": 1.0732, "step": 5121 }, { "epoch": 0.12, "learning_rate": 9.794733745372288e-06, "loss": 1.1499, "step": 5122 }, { "epoch": 0.12, "learning_rate": 9.794627227086248e-06, "loss": 1.083, "step": 5123 }, { "epoch": 0.12, "learning_rate": 9.794520681749247e-06, "loss": 1.288, "step": 5124 }, { "epoch": 0.12, "learning_rate": 9.794414109361885e-06, "loss": 0.8903, "step": 5125 }, { "epoch": 0.12, "learning_rate": 9.794307509924766e-06, "loss": 1.1173, "step": 5126 }, { "epoch": 0.12, "learning_rate": 9.79420088343849e-06, "loss": 1.1311, "step": 5127 }, { "epoch": 0.12, "learning_rate": 9.794094229903656e-06, "loss": 1.0648, "step": 5128 }, { "epoch": 0.12, "learning_rate": 9.79398754932087e-06, "loss": 1.1707, "step": 5129 }, { "epoch": 0.12, "learning_rate": 9.793880841690736e-06, "loss": 1.059, "step": 5130 }, { "epoch": 0.12, "learning_rate": 9.79377410701385e-06, "loss": 1.2129, "step": 5131 }, { "epoch": 0.12, "learning_rate": 9.793667345290815e-06, "loss": 1.1057, "step": 5132 }, { "epoch": 0.12, "learning_rate": 9.793560556522235e-06, "loss": 1.2002, "step": 5133 }, { "epoch": 0.12, "learning_rate": 9.793453740708713e-06, "loss": 0.8947, "step": 5134 }, { "epoch": 0.12, "learning_rate": 9.793346897850852e-06, "loss": 1.0106, "step": 5135 }, { "epoch": 0.12, "learning_rate": 9.793240027949254e-06, "loss": 1.2012, "step": 5136 }, { "epoch": 0.12, "learning_rate": 9.793133131004521e-06, "loss": 0.9814, "step": 5137 }, { "epoch": 0.12, "learning_rate": 9.793026207017257e-06, "loss": 0.9699, "step": 5138 }, { "epoch": 0.12, "learning_rate": 9.792919255988066e-06, "loss": 0.9465, "step": 5139 }, { "epoch": 0.12, "learning_rate": 9.792812277917548e-06, "loss": 0.9777, "step": 5140 }, { "epoch": 0.12, "learning_rate": 9.792705272806311e-06, "loss": 0.8599, "step": 5141 }, { "epoch": 0.12, "learning_rate": 9.792598240654957e-06, "loss": 0.925, "step": 5142 }, { "epoch": 0.12, "learning_rate": 9.79249118146409e-06, "loss": 0.6833, "step": 5143 }, { "epoch": 0.12, "learning_rate": 9.792384095234312e-06, "loss": 0.9401, "step": 5144 }, { "epoch": 0.12, "learning_rate": 9.79227698196623e-06, "loss": 1.103, "step": 5145 }, { "epoch": 0.12, "learning_rate": 9.792169841660449e-06, "loss": 0.9621, "step": 5146 }, { "epoch": 0.12, "learning_rate": 9.792062674317568e-06, "loss": 1.1991, "step": 5147 }, { "epoch": 0.12, "learning_rate": 9.791955479938198e-06, "loss": 0.9909, "step": 5148 }, { "epoch": 0.12, "learning_rate": 9.79184825852294e-06, "loss": 0.9673, "step": 5149 }, { "epoch": 0.12, "learning_rate": 9.791741010072401e-06, "loss": 0.8936, "step": 5150 }, { "epoch": 0.12, "learning_rate": 9.791633734587185e-06, "loss": 0.8504, "step": 5151 }, { "epoch": 0.12, "learning_rate": 9.791526432067897e-06, "loss": 0.8433, "step": 5152 }, { "epoch": 0.12, "learning_rate": 9.791419102515143e-06, "loss": 0.9241, "step": 5153 }, { "epoch": 0.12, "learning_rate": 9.791311745929528e-06, "loss": 1.0801, "step": 5154 }, { "epoch": 0.12, "learning_rate": 9.791204362311658e-06, "loss": 1.0635, "step": 5155 }, { "epoch": 0.12, "learning_rate": 9.791096951662139e-06, "loss": 1.0698, "step": 5156 }, { "epoch": 0.12, "learning_rate": 9.790989513981578e-06, "loss": 0.9432, "step": 5157 }, { "epoch": 0.12, "learning_rate": 9.790882049270579e-06, "loss": 1.27, "step": 5158 }, { "epoch": 0.12, "learning_rate": 9.790774557529749e-06, "loss": 1.2063, "step": 5159 }, { "epoch": 0.12, "learning_rate": 9.790667038759695e-06, "loss": 1.0378, "step": 5160 }, { "epoch": 0.12, "learning_rate": 9.790559492961024e-06, "loss": 0.9369, "step": 5161 }, { "epoch": 0.12, "learning_rate": 9.79045192013434e-06, "loss": 0.8181, "step": 5162 }, { "epoch": 0.12, "learning_rate": 9.790344320280256e-06, "loss": 1.0304, "step": 5163 }, { "epoch": 0.12, "learning_rate": 9.790236693399373e-06, "loss": 1.1434, "step": 5164 }, { "epoch": 0.12, "learning_rate": 9.7901290394923e-06, "loss": 0.9477, "step": 5165 }, { "epoch": 0.12, "learning_rate": 9.790021358559645e-06, "loss": 1.0999, "step": 5166 }, { "epoch": 0.12, "learning_rate": 9.789913650602017e-06, "loss": 1.0946, "step": 5167 }, { "epoch": 0.12, "learning_rate": 9.78980591562002e-06, "loss": 0.9539, "step": 5168 }, { "epoch": 0.12, "learning_rate": 9.789698153614265e-06, "loss": 0.9097, "step": 5169 }, { "epoch": 0.12, "learning_rate": 9.789590364585357e-06, "loss": 0.9784, "step": 5170 }, { "epoch": 0.12, "learning_rate": 9.78948254853391e-06, "loss": 1.252, "step": 5171 }, { "epoch": 0.12, "learning_rate": 9.789374705460523e-06, "loss": 0.7549, "step": 5172 }, { "epoch": 0.12, "learning_rate": 9.789266835365812e-06, "loss": 0.6964, "step": 5173 }, { "epoch": 0.12, "learning_rate": 9.789158938250386e-06, "loss": 1.2102, "step": 5174 }, { "epoch": 0.12, "learning_rate": 9.789051014114847e-06, "loss": 0.9568, "step": 5175 }, { "epoch": 0.12, "learning_rate": 9.78894306295981e-06, "loss": 1.2768, "step": 5176 }, { "epoch": 0.12, "learning_rate": 9.78883508478588e-06, "loss": 1.1444, "step": 5177 }, { "epoch": 0.12, "learning_rate": 9.788727079593669e-06, "loss": 0.9366, "step": 5178 }, { "epoch": 0.12, "learning_rate": 9.788619047383787e-06, "loss": 1.2941, "step": 5179 }, { "epoch": 0.12, "learning_rate": 9.788510988156841e-06, "loss": 0.9721, "step": 5180 }, { "epoch": 0.12, "learning_rate": 9.788402901913443e-06, "loss": 1.0711, "step": 5181 }, { "epoch": 0.12, "learning_rate": 9.788294788654201e-06, "loss": 1.1368, "step": 5182 }, { "epoch": 0.12, "learning_rate": 9.788186648379724e-06, "loss": 0.8697, "step": 5183 }, { "epoch": 0.12, "learning_rate": 9.788078481090625e-06, "loss": 1.0623, "step": 5184 }, { "epoch": 0.12, "learning_rate": 9.787970286787512e-06, "loss": 1.1163, "step": 5185 }, { "epoch": 0.12, "learning_rate": 9.787862065470996e-06, "loss": 1.031, "step": 5186 }, { "epoch": 0.12, "learning_rate": 9.78775381714169e-06, "loss": 0.957, "step": 5187 }, { "epoch": 0.12, "learning_rate": 9.787645541800202e-06, "loss": 1.1398, "step": 5188 }, { "epoch": 0.12, "learning_rate": 9.787537239447143e-06, "loss": 1.3057, "step": 5189 }, { "epoch": 0.12, "learning_rate": 9.787428910083122e-06, "loss": 1.0155, "step": 5190 }, { "epoch": 0.12, "learning_rate": 9.787320553708756e-06, "loss": 0.9651, "step": 5191 }, { "epoch": 0.12, "learning_rate": 9.78721217032465e-06, "loss": 0.8766, "step": 5192 }, { "epoch": 0.12, "learning_rate": 9.787103759931422e-06, "loss": 1.2308, "step": 5193 }, { "epoch": 0.12, "learning_rate": 9.78699532252968e-06, "loss": 0.8369, "step": 5194 }, { "epoch": 0.12, "learning_rate": 9.786886858120035e-06, "loss": 1.1445, "step": 5195 }, { "epoch": 0.12, "learning_rate": 9.7867783667031e-06, "loss": 1.195, "step": 5196 }, { "epoch": 0.12, "learning_rate": 9.786669848279486e-06, "loss": 0.7245, "step": 5197 }, { "epoch": 0.12, "learning_rate": 9.786561302849809e-06, "loss": 1.1332, "step": 5198 }, { "epoch": 0.12, "learning_rate": 9.786452730414676e-06, "loss": 0.9058, "step": 5199 }, { "epoch": 0.12, "learning_rate": 9.786344130974702e-06, "loss": 1.234, "step": 5200 }, { "epoch": 0.12, "learning_rate": 9.786235504530503e-06, "loss": 1.0216, "step": 5201 }, { "epoch": 0.12, "learning_rate": 9.786126851082687e-06, "loss": 1.03, "step": 5202 }, { "epoch": 0.12, "learning_rate": 9.786018170631868e-06, "loss": 0.903, "step": 5203 }, { "epoch": 0.12, "learning_rate": 9.785909463178663e-06, "loss": 0.8136, "step": 5204 }, { "epoch": 0.12, "learning_rate": 9.785800728723678e-06, "loss": 1.1504, "step": 5205 }, { "epoch": 0.12, "learning_rate": 9.785691967267535e-06, "loss": 0.9574, "step": 5206 }, { "epoch": 0.12, "learning_rate": 9.78558317881084e-06, "loss": 1.4383, "step": 5207 }, { "epoch": 0.12, "learning_rate": 9.785474363354212e-06, "loss": 1.3228, "step": 5208 }, { "epoch": 0.12, "learning_rate": 9.785365520898263e-06, "loss": 1.0094, "step": 5209 }, { "epoch": 0.12, "learning_rate": 9.785256651443608e-06, "loss": 1.0456, "step": 5210 }, { "epoch": 0.12, "learning_rate": 9.78514775499086e-06, "loss": 0.8726, "step": 5211 }, { "epoch": 0.12, "learning_rate": 9.785038831540633e-06, "loss": 1.3034, "step": 5212 }, { "epoch": 0.12, "learning_rate": 9.784929881093542e-06, "loss": 1.2153, "step": 5213 }, { "epoch": 0.12, "learning_rate": 9.784820903650203e-06, "loss": 1.2209, "step": 5214 }, { "epoch": 0.12, "learning_rate": 9.78471189921123e-06, "loss": 0.947, "step": 5215 }, { "epoch": 0.12, "learning_rate": 9.784602867777238e-06, "loss": 0.8451, "step": 5216 }, { "epoch": 0.12, "learning_rate": 9.784493809348843e-06, "loss": 0.7832, "step": 5217 }, { "epoch": 0.12, "learning_rate": 9.784384723926658e-06, "loss": 1.0879, "step": 5218 }, { "epoch": 0.12, "learning_rate": 9.7842756115113e-06, "loss": 1.1333, "step": 5219 }, { "epoch": 0.12, "learning_rate": 9.784166472103385e-06, "loss": 1.0357, "step": 5220 }, { "epoch": 0.12, "learning_rate": 9.784057305703527e-06, "loss": 1.1398, "step": 5221 }, { "epoch": 0.12, "learning_rate": 9.783948112312343e-06, "loss": 1.0276, "step": 5222 }, { "epoch": 0.12, "learning_rate": 9.78383889193045e-06, "loss": 1.1254, "step": 5223 }, { "epoch": 0.12, "learning_rate": 9.783729644558464e-06, "loss": 1.0804, "step": 5224 }, { "epoch": 0.12, "learning_rate": 9.783620370197e-06, "loss": 1.1796, "step": 5225 }, { "epoch": 0.12, "learning_rate": 9.783511068846676e-06, "loss": 1.153, "step": 5226 }, { "epoch": 0.12, "learning_rate": 9.783401740508106e-06, "loss": 1.1862, "step": 5227 }, { "epoch": 0.12, "learning_rate": 9.78329238518191e-06, "loss": 0.9624, "step": 5228 }, { "epoch": 0.12, "learning_rate": 9.783183002868704e-06, "loss": 1.1421, "step": 5229 }, { "epoch": 0.12, "learning_rate": 9.783073593569104e-06, "loss": 0.9815, "step": 5230 }, { "epoch": 0.12, "learning_rate": 9.78296415728373e-06, "loss": 1.1083, "step": 5231 }, { "epoch": 0.12, "learning_rate": 9.782854694013194e-06, "loss": 1.0492, "step": 5232 }, { "epoch": 0.12, "learning_rate": 9.782745203758121e-06, "loss": 0.975, "step": 5233 }, { "epoch": 0.12, "learning_rate": 9.782635686519122e-06, "loss": 0.9899, "step": 5234 }, { "epoch": 0.12, "learning_rate": 9.78252614229682e-06, "loss": 1.2173, "step": 5235 }, { "epoch": 0.12, "learning_rate": 9.782416571091831e-06, "loss": 1.1679, "step": 5236 }, { "epoch": 0.12, "learning_rate": 9.782306972904772e-06, "loss": 0.8355, "step": 5237 }, { "epoch": 0.12, "learning_rate": 9.78219734773626e-06, "loss": 1.2423, "step": 5238 }, { "epoch": 0.12, "learning_rate": 9.782087695586919e-06, "loss": 1.0528, "step": 5239 }, { "epoch": 0.12, "learning_rate": 9.781978016457363e-06, "loss": 0.8665, "step": 5240 }, { "epoch": 0.12, "learning_rate": 9.781868310348214e-06, "loss": 1.1737, "step": 5241 }, { "epoch": 0.12, "learning_rate": 9.781758577260087e-06, "loss": 1.1125, "step": 5242 }, { "epoch": 0.12, "learning_rate": 9.781648817193606e-06, "loss": 1.0569, "step": 5243 }, { "epoch": 0.12, "learning_rate": 9.781539030149385e-06, "loss": 1.2215, "step": 5244 }, { "epoch": 0.12, "learning_rate": 9.781429216128046e-06, "loss": 1.0615, "step": 5245 }, { "epoch": 0.12, "learning_rate": 9.781319375130212e-06, "loss": 0.8655, "step": 5246 }, { "epoch": 0.12, "learning_rate": 9.781209507156496e-06, "loss": 1.0753, "step": 5247 }, { "epoch": 0.12, "learning_rate": 9.781099612207522e-06, "loss": 0.9267, "step": 5248 }, { "epoch": 0.12, "learning_rate": 9.780989690283912e-06, "loss": 0.9412, "step": 5249 }, { "epoch": 0.12, "learning_rate": 9.780879741386279e-06, "loss": 1.3175, "step": 5250 }, { "epoch": 0.12, "learning_rate": 9.78076976551525e-06, "loss": 0.8569, "step": 5251 }, { "epoch": 0.12, "learning_rate": 9.780659762671441e-06, "loss": 1.1021, "step": 5252 }, { "epoch": 0.12, "learning_rate": 9.780549732855477e-06, "loss": 1.037, "step": 5253 }, { "epoch": 0.12, "learning_rate": 9.780439676067977e-06, "loss": 0.8005, "step": 5254 }, { "epoch": 0.12, "learning_rate": 9.78032959230956e-06, "loss": 0.8555, "step": 5255 }, { "epoch": 0.12, "learning_rate": 9.78021948158085e-06, "loss": 1.1663, "step": 5256 }, { "epoch": 0.12, "learning_rate": 9.780109343882464e-06, "loss": 1.2904, "step": 5257 }, { "epoch": 0.12, "learning_rate": 9.77999917921503e-06, "loss": 1.0452, "step": 5258 }, { "epoch": 0.12, "learning_rate": 9.779888987579164e-06, "loss": 1.1316, "step": 5259 }, { "epoch": 0.12, "learning_rate": 9.779778768975489e-06, "loss": 0.8932, "step": 5260 }, { "epoch": 0.12, "learning_rate": 9.779668523404628e-06, "loss": 1.0746, "step": 5261 }, { "epoch": 0.12, "learning_rate": 9.779558250867202e-06, "loss": 0.9822, "step": 5262 }, { "epoch": 0.12, "learning_rate": 9.779447951363834e-06, "loss": 1.0075, "step": 5263 }, { "epoch": 0.12, "learning_rate": 9.779337624895144e-06, "loss": 0.9856, "step": 5264 }, { "epoch": 0.12, "learning_rate": 9.779227271461757e-06, "loss": 1.2929, "step": 5265 }, { "epoch": 0.12, "learning_rate": 9.779116891064296e-06, "loss": 1.1304, "step": 5266 }, { "epoch": 0.12, "learning_rate": 9.779006483703381e-06, "loss": 1.166, "step": 5267 }, { "epoch": 0.12, "learning_rate": 9.778896049379639e-06, "loss": 1.1684, "step": 5268 }, { "epoch": 0.12, "learning_rate": 9.778785588093689e-06, "loss": 0.7661, "step": 5269 }, { "epoch": 0.12, "learning_rate": 9.778675099846155e-06, "loss": 1.1129, "step": 5270 }, { "epoch": 0.12, "learning_rate": 9.778564584637663e-06, "loss": 1.5071, "step": 5271 }, { "epoch": 0.12, "learning_rate": 9.778454042468833e-06, "loss": 0.9122, "step": 5272 }, { "epoch": 0.12, "learning_rate": 9.77834347334029e-06, "loss": 1.0176, "step": 5273 }, { "epoch": 0.12, "learning_rate": 9.778232877252658e-06, "loss": 1.0058, "step": 5274 }, { "epoch": 0.12, "learning_rate": 9.778122254206563e-06, "loss": 1.0777, "step": 5275 }, { "epoch": 0.12, "learning_rate": 9.778011604202627e-06, "loss": 1.0143, "step": 5276 }, { "epoch": 0.12, "learning_rate": 9.777900927241472e-06, "loss": 1.1411, "step": 5277 }, { "epoch": 0.12, "learning_rate": 9.777790223323729e-06, "loss": 1.181, "step": 5278 }, { "epoch": 0.12, "learning_rate": 9.777679492450016e-06, "loss": 0.9056, "step": 5279 }, { "epoch": 0.12, "learning_rate": 9.77756873462096e-06, "loss": 1.0269, "step": 5280 }, { "epoch": 0.12, "learning_rate": 9.777457949837187e-06, "loss": 1.1453, "step": 5281 }, { "epoch": 0.12, "learning_rate": 9.77734713809932e-06, "loss": 1.181, "step": 5282 }, { "epoch": 0.12, "learning_rate": 9.777236299407988e-06, "loss": 1.1084, "step": 5283 }, { "epoch": 0.12, "learning_rate": 9.777125433763812e-06, "loss": 1.0113, "step": 5284 }, { "epoch": 0.12, "learning_rate": 9.77701454116742e-06, "loss": 1.0865, "step": 5285 }, { "epoch": 0.12, "learning_rate": 9.776903621619436e-06, "loss": 1.1624, "step": 5286 }, { "epoch": 0.12, "learning_rate": 9.776792675120486e-06, "loss": 0.9976, "step": 5287 }, { "epoch": 0.12, "learning_rate": 9.776681701671198e-06, "loss": 1.3435, "step": 5288 }, { "epoch": 0.12, "learning_rate": 9.776570701272197e-06, "loss": 1.0139, "step": 5289 }, { "epoch": 0.12, "learning_rate": 9.776459673924109e-06, "loss": 0.9973, "step": 5290 }, { "epoch": 0.12, "learning_rate": 9.776348619627558e-06, "loss": 1.3109, "step": 5291 }, { "epoch": 0.12, "learning_rate": 9.776237538383175e-06, "loss": 1.1019, "step": 5292 }, { "epoch": 0.12, "learning_rate": 9.776126430191585e-06, "loss": 0.9009, "step": 5293 }, { "epoch": 0.12, "learning_rate": 9.776015295053414e-06, "loss": 1.1194, "step": 5294 }, { "epoch": 0.12, "learning_rate": 9.775904132969289e-06, "loss": 1.1532, "step": 5295 }, { "epoch": 0.12, "learning_rate": 9.775792943939839e-06, "loss": 0.986, "step": 5296 }, { "epoch": 0.12, "learning_rate": 9.775681727965688e-06, "loss": 1.0364, "step": 5297 }, { "epoch": 0.12, "learning_rate": 9.775570485047469e-06, "loss": 1.2663, "step": 5298 }, { "epoch": 0.12, "learning_rate": 9.775459215185802e-06, "loss": 1.1197, "step": 5299 }, { "epoch": 0.12, "learning_rate": 9.775347918381322e-06, "loss": 1.054, "step": 5300 }, { "epoch": 0.12, "learning_rate": 9.775236594634653e-06, "loss": 1.0549, "step": 5301 }, { "epoch": 0.12, "learning_rate": 9.775125243946425e-06, "loss": 1.1854, "step": 5302 }, { "epoch": 0.12, "learning_rate": 9.775013866317263e-06, "loss": 1.0478, "step": 5303 }, { "epoch": 0.12, "learning_rate": 9.7749024617478e-06, "loss": 1.0645, "step": 5304 }, { "epoch": 0.12, "learning_rate": 9.77479103023866e-06, "loss": 1.0638, "step": 5305 }, { "epoch": 0.12, "learning_rate": 9.774679571790474e-06, "loss": 1.0441, "step": 5306 }, { "epoch": 0.12, "learning_rate": 9.774568086403871e-06, "loss": 0.996, "step": 5307 }, { "epoch": 0.12, "learning_rate": 9.774456574079481e-06, "loss": 0.9437, "step": 5308 }, { "epoch": 0.12, "learning_rate": 9.77434503481793e-06, "loss": 0.9382, "step": 5309 }, { "epoch": 0.12, "learning_rate": 9.774233468619849e-06, "loss": 1.1149, "step": 5310 }, { "epoch": 0.12, "learning_rate": 9.774121875485867e-06, "loss": 0.7824, "step": 5311 }, { "epoch": 0.12, "learning_rate": 9.774010255416616e-06, "loss": 1.137, "step": 5312 }, { "epoch": 0.12, "learning_rate": 9.773898608412723e-06, "loss": 1.1425, "step": 5313 }, { "epoch": 0.12, "learning_rate": 9.77378693447482e-06, "loss": 1.0368, "step": 5314 }, { "epoch": 0.12, "learning_rate": 9.773675233603534e-06, "loss": 1.1833, "step": 5315 }, { "epoch": 0.12, "learning_rate": 9.773563505799497e-06, "loss": 1.1933, "step": 5316 }, { "epoch": 0.12, "learning_rate": 9.773451751063342e-06, "loss": 0.9832, "step": 5317 }, { "epoch": 0.12, "learning_rate": 9.773339969395695e-06, "loss": 0.9477, "step": 5318 }, { "epoch": 0.12, "learning_rate": 9.773228160797187e-06, "loss": 0.9437, "step": 5319 }, { "epoch": 0.12, "learning_rate": 9.773116325268453e-06, "loss": 1.0112, "step": 5320 }, { "epoch": 0.12, "learning_rate": 9.773004462810119e-06, "loss": 0.7232, "step": 5321 }, { "epoch": 0.12, "learning_rate": 9.77289257342282e-06, "loss": 0.891, "step": 5322 }, { "epoch": 0.12, "learning_rate": 9.772780657107186e-06, "loss": 1.0803, "step": 5323 }, { "epoch": 0.12, "learning_rate": 9.772668713863848e-06, "loss": 1.0402, "step": 5324 }, { "epoch": 0.12, "learning_rate": 9.772556743693438e-06, "loss": 1.052, "step": 5325 }, { "epoch": 0.12, "learning_rate": 9.772444746596585e-06, "loss": 1.0511, "step": 5326 }, { "epoch": 0.12, "learning_rate": 9.772332722573928e-06, "loss": 0.9703, "step": 5327 }, { "epoch": 0.12, "learning_rate": 9.77222067162609e-06, "loss": 0.9315, "step": 5328 }, { "epoch": 0.12, "learning_rate": 9.77210859375371e-06, "loss": 0.9157, "step": 5329 }, { "epoch": 0.12, "learning_rate": 9.771996488957417e-06, "loss": 0.939, "step": 5330 }, { "epoch": 0.12, "learning_rate": 9.771884357237845e-06, "loss": 0.9407, "step": 5331 }, { "epoch": 0.12, "learning_rate": 9.771772198595626e-06, "loss": 1.1022, "step": 5332 }, { "epoch": 0.12, "learning_rate": 9.771660013031392e-06, "loss": 0.8891, "step": 5333 }, { "epoch": 0.12, "learning_rate": 9.771547800545778e-06, "loss": 1.3562, "step": 5334 }, { "epoch": 0.12, "learning_rate": 9.771435561139416e-06, "loss": 1.0059, "step": 5335 }, { "epoch": 0.12, "learning_rate": 9.771323294812936e-06, "loss": 1.1485, "step": 5336 }, { "epoch": 0.12, "learning_rate": 9.771211001566978e-06, "loss": 1.0157, "step": 5337 }, { "epoch": 0.12, "learning_rate": 9.77109868140217e-06, "loss": 1.0916, "step": 5338 }, { "epoch": 0.12, "learning_rate": 9.77098633431915e-06, "loss": 1.14, "step": 5339 }, { "epoch": 0.12, "learning_rate": 9.770873960318548e-06, "loss": 0.8726, "step": 5340 }, { "epoch": 0.12, "learning_rate": 9.770761559400999e-06, "loss": 0.7998, "step": 5341 }, { "epoch": 0.12, "learning_rate": 9.770649131567137e-06, "loss": 1.0217, "step": 5342 }, { "epoch": 0.12, "learning_rate": 9.770536676817601e-06, "loss": 1.0046, "step": 5343 }, { "epoch": 0.12, "learning_rate": 9.77042419515302e-06, "loss": 1.0603, "step": 5344 }, { "epoch": 0.12, "learning_rate": 9.770311686574028e-06, "loss": 1.2305, "step": 5345 }, { "epoch": 0.12, "learning_rate": 9.770199151081263e-06, "loss": 0.9027, "step": 5346 }, { "epoch": 0.12, "learning_rate": 9.77008658867536e-06, "loss": 0.9645, "step": 5347 }, { "epoch": 0.12, "learning_rate": 9.769973999356951e-06, "loss": 1.1213, "step": 5348 }, { "epoch": 0.12, "learning_rate": 9.769861383126676e-06, "loss": 0.9989, "step": 5349 }, { "epoch": 0.12, "learning_rate": 9.769748739985166e-06, "loss": 0.9344, "step": 5350 }, { "epoch": 0.12, "learning_rate": 9.769636069933057e-06, "loss": 0.9927, "step": 5351 }, { "epoch": 0.12, "learning_rate": 9.769523372970988e-06, "loss": 0.7538, "step": 5352 }, { "epoch": 0.12, "learning_rate": 9.769410649099592e-06, "loss": 1.1163, "step": 5353 }, { "epoch": 0.12, "learning_rate": 9.769297898319503e-06, "loss": 1.1298, "step": 5354 }, { "epoch": 0.12, "learning_rate": 9.769185120631361e-06, "loss": 1.2047, "step": 5355 }, { "epoch": 0.12, "learning_rate": 9.769072316035802e-06, "loss": 0.8594, "step": 5356 }, { "epoch": 0.12, "learning_rate": 9.768959484533461e-06, "loss": 0.9948, "step": 5357 }, { "epoch": 0.12, "learning_rate": 9.768846626124975e-06, "loss": 1.0349, "step": 5358 }, { "epoch": 0.12, "learning_rate": 9.768733740810981e-06, "loss": 0.9083, "step": 5359 }, { "epoch": 0.12, "learning_rate": 9.768620828592115e-06, "loss": 1.1774, "step": 5360 }, { "epoch": 0.12, "learning_rate": 9.768507889469014e-06, "loss": 1.1213, "step": 5361 }, { "epoch": 0.12, "learning_rate": 9.768394923442317e-06, "loss": 1.2344, "step": 5362 }, { "epoch": 0.12, "learning_rate": 9.76828193051266e-06, "loss": 1.0346, "step": 5363 }, { "epoch": 0.12, "learning_rate": 9.76816891068068e-06, "loss": 1.1187, "step": 5364 }, { "epoch": 0.12, "learning_rate": 9.768055863947015e-06, "loss": 0.8917, "step": 5365 }, { "epoch": 0.12, "learning_rate": 9.767942790312304e-06, "loss": 1.0842, "step": 5366 }, { "epoch": 0.12, "learning_rate": 9.767829689777184e-06, "loss": 1.111, "step": 5367 }, { "epoch": 0.12, "learning_rate": 9.767716562342294e-06, "loss": 1.0953, "step": 5368 }, { "epoch": 0.12, "learning_rate": 9.76760340800827e-06, "loss": 0.9301, "step": 5369 }, { "epoch": 0.12, "learning_rate": 9.767490226775753e-06, "loss": 1.0947, "step": 5370 }, { "epoch": 0.12, "learning_rate": 9.767377018645382e-06, "loss": 1.0674, "step": 5371 }, { "epoch": 0.12, "learning_rate": 9.76726378361779e-06, "loss": 1.029, "step": 5372 }, { "epoch": 0.12, "learning_rate": 9.767150521693623e-06, "loss": 1.0154, "step": 5373 }, { "epoch": 0.12, "learning_rate": 9.767037232873516e-06, "loss": 0.8598, "step": 5374 }, { "epoch": 0.12, "learning_rate": 9.766923917158108e-06, "loss": 0.9603, "step": 5375 }, { "epoch": 0.12, "learning_rate": 9.766810574548042e-06, "loss": 0.8916, "step": 5376 }, { "epoch": 0.12, "learning_rate": 9.766697205043953e-06, "loss": 0.9835, "step": 5377 }, { "epoch": 0.12, "learning_rate": 9.766583808646484e-06, "loss": 0.9416, "step": 5378 }, { "epoch": 0.12, "learning_rate": 9.766470385356272e-06, "loss": 0.913, "step": 5379 }, { "epoch": 0.12, "learning_rate": 9.766356935173959e-06, "loss": 0.8838, "step": 5380 }, { "epoch": 0.12, "learning_rate": 9.766243458100186e-06, "loss": 1.0595, "step": 5381 }, { "epoch": 0.12, "learning_rate": 9.766129954135588e-06, "loss": 1.1636, "step": 5382 }, { "epoch": 0.12, "learning_rate": 9.766016423280814e-06, "loss": 0.9578, "step": 5383 }, { "epoch": 0.12, "learning_rate": 9.765902865536495e-06, "loss": 1.0314, "step": 5384 }, { "epoch": 0.12, "learning_rate": 9.765789280903277e-06, "loss": 1.183, "step": 5385 }, { "epoch": 0.12, "learning_rate": 9.765675669381802e-06, "loss": 0.8387, "step": 5386 }, { "epoch": 0.12, "learning_rate": 9.765562030972708e-06, "loss": 1.3925, "step": 5387 }, { "epoch": 0.12, "learning_rate": 9.765448365676637e-06, "loss": 1.1123, "step": 5388 }, { "epoch": 0.12, "learning_rate": 9.76533467349423e-06, "loss": 0.9533, "step": 5389 }, { "epoch": 0.13, "learning_rate": 9.76522095442613e-06, "loss": 1.0812, "step": 5390 }, { "epoch": 0.13, "learning_rate": 9.765107208472977e-06, "loss": 0.9618, "step": 5391 }, { "epoch": 0.13, "learning_rate": 9.764993435635412e-06, "loss": 0.9774, "step": 5392 }, { "epoch": 0.13, "learning_rate": 9.76487963591408e-06, "loss": 1.0454, "step": 5393 }, { "epoch": 0.13, "learning_rate": 9.76476580930962e-06, "loss": 0.9954, "step": 5394 }, { "epoch": 0.13, "learning_rate": 9.764651955822677e-06, "loss": 0.9393, "step": 5395 }, { "epoch": 0.13, "learning_rate": 9.764538075453892e-06, "loss": 1.081, "step": 5396 }, { "epoch": 0.13, "learning_rate": 9.764424168203904e-06, "loss": 1.1515, "step": 5397 }, { "epoch": 0.13, "learning_rate": 9.76431023407336e-06, "loss": 1.036, "step": 5398 }, { "epoch": 0.13, "learning_rate": 9.764196273062903e-06, "loss": 0.9608, "step": 5399 }, { "epoch": 0.13, "learning_rate": 9.764082285173175e-06, "loss": 1.0808, "step": 5400 }, { "epoch": 0.13, "learning_rate": 9.763968270404819e-06, "loss": 1.2525, "step": 5401 }, { "epoch": 0.13, "learning_rate": 9.763854228758477e-06, "loss": 0.9991, "step": 5402 }, { "epoch": 0.13, "learning_rate": 9.763740160234794e-06, "loss": 1.0496, "step": 5403 }, { "epoch": 0.13, "learning_rate": 9.763626064834411e-06, "loss": 1.1873, "step": 5404 }, { "epoch": 0.13, "learning_rate": 9.763511942557976e-06, "loss": 1.1444, "step": 5405 }, { "epoch": 0.13, "learning_rate": 9.763397793406131e-06, "loss": 1.1759, "step": 5406 }, { "epoch": 0.13, "learning_rate": 9.763283617379517e-06, "loss": 1.1531, "step": 5407 }, { "epoch": 0.13, "learning_rate": 9.763169414478783e-06, "loss": 0.7217, "step": 5408 }, { "epoch": 0.13, "learning_rate": 9.76305518470457e-06, "loss": 1.0855, "step": 5409 }, { "epoch": 0.13, "learning_rate": 9.762940928057524e-06, "loss": 1.0212, "step": 5410 }, { "epoch": 0.13, "learning_rate": 9.762826644538292e-06, "loss": 1.1575, "step": 5411 }, { "epoch": 0.13, "learning_rate": 9.762712334147513e-06, "loss": 1.0078, "step": 5412 }, { "epoch": 0.13, "learning_rate": 9.762597996885836e-06, "loss": 0.807, "step": 5413 }, { "epoch": 0.13, "learning_rate": 9.762483632753903e-06, "loss": 1.0952, "step": 5414 }, { "epoch": 0.13, "learning_rate": 9.762369241752365e-06, "loss": 1.0429, "step": 5415 }, { "epoch": 0.13, "learning_rate": 9.76225482388186e-06, "loss": 0.8947, "step": 5416 }, { "epoch": 0.13, "learning_rate": 9.762140379143039e-06, "loss": 1.1601, "step": 5417 }, { "epoch": 0.13, "learning_rate": 9.762025907536547e-06, "loss": 0.9182, "step": 5418 }, { "epoch": 0.13, "learning_rate": 9.761911409063028e-06, "loss": 1.243, "step": 5419 }, { "epoch": 0.13, "learning_rate": 9.761796883723127e-06, "loss": 0.9661, "step": 5420 }, { "epoch": 0.13, "learning_rate": 9.761682331517494e-06, "loss": 0.8298, "step": 5421 }, { "epoch": 0.13, "learning_rate": 9.761567752446772e-06, "loss": 0.9247, "step": 5422 }, { "epoch": 0.13, "learning_rate": 9.761453146511608e-06, "loss": 0.8639, "step": 5423 }, { "epoch": 0.13, "learning_rate": 9.76133851371265e-06, "loss": 0.7899, "step": 5424 }, { "epoch": 0.13, "learning_rate": 9.761223854050546e-06, "loss": 1.1354, "step": 5425 }, { "epoch": 0.13, "learning_rate": 9.76110916752594e-06, "loss": 1.1301, "step": 5426 }, { "epoch": 0.13, "learning_rate": 9.760994454139476e-06, "loss": 0.9051, "step": 5427 }, { "epoch": 0.13, "learning_rate": 9.760879713891808e-06, "loss": 1.2692, "step": 5428 }, { "epoch": 0.13, "learning_rate": 9.760764946783582e-06, "loss": 1.2683, "step": 5429 }, { "epoch": 0.13, "learning_rate": 9.760650152815443e-06, "loss": 1.0865, "step": 5430 }, { "epoch": 0.13, "learning_rate": 9.76053533198804e-06, "loss": 1.1721, "step": 5431 }, { "epoch": 0.13, "learning_rate": 9.760420484302018e-06, "loss": 1.1668, "step": 5432 }, { "epoch": 0.13, "learning_rate": 9.76030560975803e-06, "loss": 0.9945, "step": 5433 }, { "epoch": 0.13, "learning_rate": 9.760190708356721e-06, "loss": 1.0786, "step": 5434 }, { "epoch": 0.13, "learning_rate": 9.760075780098738e-06, "loss": 0.8081, "step": 5435 }, { "epoch": 0.13, "learning_rate": 9.759960824984732e-06, "loss": 1.0861, "step": 5436 }, { "epoch": 0.13, "learning_rate": 9.759845843015352e-06, "loss": 1.0836, "step": 5437 }, { "epoch": 0.13, "learning_rate": 9.759730834191246e-06, "loss": 0.806, "step": 5438 }, { "epoch": 0.13, "learning_rate": 9.759615798513062e-06, "loss": 1.1625, "step": 5439 }, { "epoch": 0.13, "learning_rate": 9.759500735981448e-06, "loss": 0.961, "step": 5440 }, { "epoch": 0.13, "learning_rate": 9.759385646597055e-06, "loss": 1.1077, "step": 5441 }, { "epoch": 0.13, "learning_rate": 9.759270530360533e-06, "loss": 1.0356, "step": 5442 }, { "epoch": 0.13, "learning_rate": 9.75915538727253e-06, "loss": 0.8665, "step": 5443 }, { "epoch": 0.13, "learning_rate": 9.759040217333694e-06, "loss": 0.9656, "step": 5444 }, { "epoch": 0.13, "learning_rate": 9.75892502054468e-06, "loss": 1.0355, "step": 5445 }, { "epoch": 0.13, "learning_rate": 9.758809796906132e-06, "loss": 1.1176, "step": 5446 }, { "epoch": 0.13, "learning_rate": 9.758694546418705e-06, "loss": 1.0609, "step": 5447 }, { "epoch": 0.13, "learning_rate": 9.758579269083046e-06, "loss": 0.9137, "step": 5448 }, { "epoch": 0.13, "learning_rate": 9.758463964899806e-06, "loss": 0.9401, "step": 5449 }, { "epoch": 0.13, "learning_rate": 9.758348633869638e-06, "loss": 0.8821, "step": 5450 }, { "epoch": 0.13, "learning_rate": 9.75823327599319e-06, "loss": 1.0156, "step": 5451 }, { "epoch": 0.13, "learning_rate": 9.758117891271112e-06, "loss": 1.041, "step": 5452 }, { "epoch": 0.13, "learning_rate": 9.758002479704056e-06, "loss": 0.9941, "step": 5453 }, { "epoch": 0.13, "learning_rate": 9.757887041292675e-06, "loss": 1.1864, "step": 5454 }, { "epoch": 0.13, "learning_rate": 9.75777157603762e-06, "loss": 1.1498, "step": 5455 }, { "epoch": 0.13, "learning_rate": 9.75765608393954e-06, "loss": 0.9151, "step": 5456 }, { "epoch": 0.13, "learning_rate": 9.757540564999088e-06, "loss": 1.1239, "step": 5457 }, { "epoch": 0.13, "learning_rate": 9.757425019216917e-06, "loss": 1.1566, "step": 5458 }, { "epoch": 0.13, "learning_rate": 9.757309446593676e-06, "loss": 1.1733, "step": 5459 }, { "epoch": 0.13, "learning_rate": 9.75719384713002e-06, "loss": 1.0369, "step": 5460 }, { "epoch": 0.13, "learning_rate": 9.757078220826599e-06, "loss": 1.0491, "step": 5461 }, { "epoch": 0.13, "learning_rate": 9.756962567684066e-06, "loss": 0.8142, "step": 5462 }, { "epoch": 0.13, "learning_rate": 9.756846887703074e-06, "loss": 0.7605, "step": 5463 }, { "epoch": 0.13, "learning_rate": 9.756731180884276e-06, "loss": 0.9793, "step": 5464 }, { "epoch": 0.13, "learning_rate": 9.756615447228324e-06, "loss": 0.9043, "step": 5465 }, { "epoch": 0.13, "learning_rate": 9.756499686735871e-06, "loss": 1.0684, "step": 5466 }, { "epoch": 0.13, "learning_rate": 9.756383899407572e-06, "loss": 1.0883, "step": 5467 }, { "epoch": 0.13, "learning_rate": 9.756268085244075e-06, "loss": 1.1421, "step": 5468 }, { "epoch": 0.13, "learning_rate": 9.75615224424604e-06, "loss": 0.8951, "step": 5469 }, { "epoch": 0.13, "learning_rate": 9.756036376414114e-06, "loss": 1.1143, "step": 5470 }, { "epoch": 0.13, "learning_rate": 9.75592048174896e-06, "loss": 1.2574, "step": 5471 }, { "epoch": 0.13, "learning_rate": 9.755804560251222e-06, "loss": 1.0004, "step": 5472 }, { "epoch": 0.13, "learning_rate": 9.755688611921559e-06, "loss": 1.2081, "step": 5473 }, { "epoch": 0.13, "learning_rate": 9.755572636760623e-06, "loss": 1.2995, "step": 5474 }, { "epoch": 0.13, "learning_rate": 9.755456634769072e-06, "loss": 1.1366, "step": 5475 }, { "epoch": 0.13, "learning_rate": 9.755340605947557e-06, "loss": 1.0411, "step": 5476 }, { "epoch": 0.13, "learning_rate": 9.755224550296735e-06, "loss": 0.983, "step": 5477 }, { "epoch": 0.13, "learning_rate": 9.755108467817258e-06, "loss": 1.0977, "step": 5478 }, { "epoch": 0.13, "learning_rate": 9.754992358509784e-06, "loss": 0.9799, "step": 5479 }, { "epoch": 0.13, "learning_rate": 9.754876222374964e-06, "loss": 1.2626, "step": 5480 }, { "epoch": 0.13, "learning_rate": 9.754760059413457e-06, "loss": 1.1713, "step": 5481 }, { "epoch": 0.13, "learning_rate": 9.754643869625919e-06, "loss": 1.2693, "step": 5482 }, { "epoch": 0.13, "learning_rate": 9.754527653013002e-06, "loss": 1.135, "step": 5483 }, { "epoch": 0.13, "learning_rate": 9.754411409575364e-06, "loss": 0.975, "step": 5484 }, { "epoch": 0.13, "learning_rate": 9.754295139313659e-06, "loss": 1.1331, "step": 5485 }, { "epoch": 0.13, "learning_rate": 9.754178842228546e-06, "loss": 1.0883, "step": 5486 }, { "epoch": 0.13, "learning_rate": 9.754062518320677e-06, "loss": 0.8349, "step": 5487 }, { "epoch": 0.13, "learning_rate": 9.753946167590712e-06, "loss": 1.09, "step": 5488 }, { "epoch": 0.13, "learning_rate": 9.753829790039306e-06, "loss": 0.934, "step": 5489 }, { "epoch": 0.13, "learning_rate": 9.753713385667116e-06, "loss": 1.1712, "step": 5490 }, { "epoch": 0.13, "learning_rate": 9.753596954474797e-06, "loss": 0.9752, "step": 5491 }, { "epoch": 0.13, "learning_rate": 9.75348049646301e-06, "loss": 1.1255, "step": 5492 }, { "epoch": 0.13, "learning_rate": 9.753364011632407e-06, "loss": 1.2781, "step": 5493 }, { "epoch": 0.13, "learning_rate": 9.753247499983649e-06, "loss": 1.0888, "step": 5494 }, { "epoch": 0.13, "learning_rate": 9.753130961517392e-06, "loss": 0.7743, "step": 5495 }, { "epoch": 0.13, "learning_rate": 9.753014396234292e-06, "loss": 0.7777, "step": 5496 }, { "epoch": 0.13, "learning_rate": 9.752897804135009e-06, "loss": 1.173, "step": 5497 }, { "epoch": 0.13, "learning_rate": 9.7527811852202e-06, "loss": 0.9948, "step": 5498 }, { "epoch": 0.13, "learning_rate": 9.752664539490523e-06, "loss": 0.9879, "step": 5499 }, { "epoch": 0.13, "learning_rate": 9.752547866946636e-06, "loss": 0.8488, "step": 5500 }, { "epoch": 0.13, "learning_rate": 9.752431167589195e-06, "loss": 0.8623, "step": 5501 }, { "epoch": 0.13, "learning_rate": 9.752314441418864e-06, "loss": 1.194, "step": 5502 }, { "epoch": 0.13, "learning_rate": 9.752197688436295e-06, "loss": 1.1308, "step": 5503 }, { "epoch": 0.13, "learning_rate": 9.752080908642153e-06, "loss": 0.9278, "step": 5504 }, { "epoch": 0.13, "learning_rate": 9.751964102037091e-06, "loss": 0.9552, "step": 5505 }, { "epoch": 0.13, "learning_rate": 9.751847268621772e-06, "loss": 0.7471, "step": 5506 }, { "epoch": 0.13, "learning_rate": 9.751730408396855e-06, "loss": 1.0554, "step": 5507 }, { "epoch": 0.13, "learning_rate": 9.751613521362996e-06, "loss": 1.0923, "step": 5508 }, { "epoch": 0.13, "learning_rate": 9.751496607520858e-06, "loss": 0.9088, "step": 5509 }, { "epoch": 0.13, "learning_rate": 9.7513796668711e-06, "loss": 1.1056, "step": 5510 }, { "epoch": 0.13, "learning_rate": 9.75126269941438e-06, "loss": 1.104, "step": 5511 }, { "epoch": 0.13, "learning_rate": 9.75114570515136e-06, "loss": 0.9028, "step": 5512 }, { "epoch": 0.13, "learning_rate": 9.751028684082697e-06, "loss": 1.332, "step": 5513 }, { "epoch": 0.13, "learning_rate": 9.750911636209056e-06, "loss": 1.1736, "step": 5514 }, { "epoch": 0.13, "learning_rate": 9.750794561531092e-06, "loss": 0.805, "step": 5515 }, { "epoch": 0.13, "learning_rate": 9.75067746004947e-06, "loss": 1.1406, "step": 5516 }, { "epoch": 0.13, "learning_rate": 9.750560331764848e-06, "loss": 1.1442, "step": 5517 }, { "epoch": 0.13, "learning_rate": 9.75044317667789e-06, "loss": 0.9906, "step": 5518 }, { "epoch": 0.13, "learning_rate": 9.750325994789253e-06, "loss": 0.8112, "step": 5519 }, { "epoch": 0.13, "learning_rate": 9.7502087860996e-06, "loss": 1.1394, "step": 5520 }, { "epoch": 0.13, "learning_rate": 9.750091550609592e-06, "loss": 1.2402, "step": 5521 }, { "epoch": 0.13, "learning_rate": 9.74997428831989e-06, "loss": 1.5202, "step": 5522 }, { "epoch": 0.13, "learning_rate": 9.749856999231157e-06, "loss": 1.0536, "step": 5523 }, { "epoch": 0.13, "learning_rate": 9.749739683344055e-06, "loss": 1.0771, "step": 5524 }, { "epoch": 0.13, "learning_rate": 9.749622340659242e-06, "loss": 1.1889, "step": 5525 }, { "epoch": 0.13, "learning_rate": 9.749504971177386e-06, "loss": 1.079, "step": 5526 }, { "epoch": 0.13, "learning_rate": 9.749387574899143e-06, "loss": 1.3204, "step": 5527 }, { "epoch": 0.13, "learning_rate": 9.74927015182518e-06, "loss": 1.0474, "step": 5528 }, { "epoch": 0.13, "learning_rate": 9.749152701956158e-06, "loss": 1.0564, "step": 5529 }, { "epoch": 0.13, "learning_rate": 9.749035225292737e-06, "loss": 0.9696, "step": 5530 }, { "epoch": 0.13, "learning_rate": 9.748917721835586e-06, "loss": 0.7721, "step": 5531 }, { "epoch": 0.13, "learning_rate": 9.748800191585362e-06, "loss": 0.7576, "step": 5532 }, { "epoch": 0.13, "learning_rate": 9.748682634542731e-06, "loss": 1.2254, "step": 5533 }, { "epoch": 0.13, "learning_rate": 9.748565050708355e-06, "loss": 0.9334, "step": 5534 }, { "epoch": 0.13, "learning_rate": 9.748447440082898e-06, "loss": 1.2189, "step": 5535 }, { "epoch": 0.13, "learning_rate": 9.748329802667026e-06, "loss": 1.4435, "step": 5536 }, { "epoch": 0.13, "learning_rate": 9.748212138461397e-06, "loss": 0.9635, "step": 5537 }, { "epoch": 0.13, "learning_rate": 9.74809444746668e-06, "loss": 0.6983, "step": 5538 }, { "epoch": 0.13, "learning_rate": 9.747976729683536e-06, "loss": 1.1974, "step": 5539 }, { "epoch": 0.13, "learning_rate": 9.74785898511263e-06, "loss": 1.0172, "step": 5540 }, { "epoch": 0.13, "learning_rate": 9.747741213754626e-06, "loss": 1.1785, "step": 5541 }, { "epoch": 0.13, "learning_rate": 9.747623415610193e-06, "loss": 1.0309, "step": 5542 }, { "epoch": 0.13, "learning_rate": 9.747505590679987e-06, "loss": 0.9153, "step": 5543 }, { "epoch": 0.13, "learning_rate": 9.74738773896468e-06, "loss": 0.9899, "step": 5544 }, { "epoch": 0.13, "learning_rate": 9.747269860464934e-06, "loss": 0.881, "step": 5545 }, { "epoch": 0.13, "learning_rate": 9.747151955181412e-06, "loss": 0.8642, "step": 5546 }, { "epoch": 0.13, "learning_rate": 9.747034023114785e-06, "loss": 1.0788, "step": 5547 }, { "epoch": 0.13, "learning_rate": 9.746916064265713e-06, "loss": 1.1947, "step": 5548 }, { "epoch": 0.13, "learning_rate": 9.746798078634863e-06, "loss": 1.1482, "step": 5549 }, { "epoch": 0.13, "learning_rate": 9.746680066222902e-06, "loss": 0.9423, "step": 5550 }, { "epoch": 0.13, "learning_rate": 9.746562027030495e-06, "loss": 1.2024, "step": 5551 }, { "epoch": 0.13, "learning_rate": 9.746443961058308e-06, "loss": 1.217, "step": 5552 }, { "epoch": 0.13, "learning_rate": 9.746325868307007e-06, "loss": 0.7727, "step": 5553 }, { "epoch": 0.13, "learning_rate": 9.746207748777258e-06, "loss": 1.0641, "step": 5554 }, { "epoch": 0.13, "learning_rate": 9.746089602469729e-06, "loss": 0.9794, "step": 5555 }, { "epoch": 0.13, "learning_rate": 9.745971429385084e-06, "loss": 1.0461, "step": 5556 }, { "epoch": 0.13, "learning_rate": 9.745853229523991e-06, "loss": 0.9478, "step": 5557 }, { "epoch": 0.13, "learning_rate": 9.745735002887117e-06, "loss": 0.9989, "step": 5558 }, { "epoch": 0.13, "learning_rate": 9.745616749475129e-06, "loss": 1.0258, "step": 5559 }, { "epoch": 0.13, "learning_rate": 9.745498469288694e-06, "loss": 0.9634, "step": 5560 }, { "epoch": 0.13, "learning_rate": 9.745380162328479e-06, "loss": 0.9203, "step": 5561 }, { "epoch": 0.13, "learning_rate": 9.745261828595152e-06, "loss": 1.1571, "step": 5562 }, { "epoch": 0.13, "learning_rate": 9.745143468089382e-06, "loss": 1.1659, "step": 5563 }, { "epoch": 0.13, "learning_rate": 9.745025080811835e-06, "loss": 1.15, "step": 5564 }, { "epoch": 0.13, "learning_rate": 9.744906666763177e-06, "loss": 0.9889, "step": 5565 }, { "epoch": 0.13, "learning_rate": 9.74478822594408e-06, "loss": 1.0977, "step": 5566 }, { "epoch": 0.13, "learning_rate": 9.744669758355212e-06, "loss": 1.1852, "step": 5567 }, { "epoch": 0.13, "learning_rate": 9.744551263997238e-06, "loss": 0.9419, "step": 5568 }, { "epoch": 0.13, "learning_rate": 9.74443274287083e-06, "loss": 1.1752, "step": 5569 }, { "epoch": 0.13, "learning_rate": 9.744314194976651e-06, "loss": 1.1608, "step": 5570 }, { "epoch": 0.13, "learning_rate": 9.744195620315377e-06, "loss": 0.9467, "step": 5571 }, { "epoch": 0.13, "learning_rate": 9.744077018887675e-06, "loss": 1.0373, "step": 5572 }, { "epoch": 0.13, "learning_rate": 9.743958390694213e-06, "loss": 1.0816, "step": 5573 }, { "epoch": 0.13, "learning_rate": 9.743839735735659e-06, "loss": 0.9896, "step": 5574 }, { "epoch": 0.13, "learning_rate": 9.743721054012684e-06, "loss": 1.0662, "step": 5575 }, { "epoch": 0.13, "learning_rate": 9.743602345525959e-06, "loss": 0.9203, "step": 5576 }, { "epoch": 0.13, "learning_rate": 9.743483610276152e-06, "loss": 1.0647, "step": 5577 }, { "epoch": 0.13, "learning_rate": 9.74336484826393e-06, "loss": 0.9909, "step": 5578 }, { "epoch": 0.13, "learning_rate": 9.743246059489971e-06, "loss": 0.9053, "step": 5579 }, { "epoch": 0.13, "learning_rate": 9.743127243954937e-06, "loss": 0.9978, "step": 5580 }, { "epoch": 0.13, "learning_rate": 9.743008401659502e-06, "loss": 1.1282, "step": 5581 }, { "epoch": 0.13, "learning_rate": 9.742889532604337e-06, "loss": 0.8704, "step": 5582 }, { "epoch": 0.13, "learning_rate": 9.742770636790112e-06, "loss": 0.8719, "step": 5583 }, { "epoch": 0.13, "learning_rate": 9.742651714217497e-06, "loss": 1.2615, "step": 5584 }, { "epoch": 0.13, "learning_rate": 9.742532764887165e-06, "loss": 1.2128, "step": 5585 }, { "epoch": 0.13, "learning_rate": 9.742413788799783e-06, "loss": 0.9808, "step": 5586 }, { "epoch": 0.13, "learning_rate": 9.742294785956027e-06, "loss": 1.1349, "step": 5587 }, { "epoch": 0.13, "learning_rate": 9.742175756356567e-06, "loss": 0.8782, "step": 5588 }, { "epoch": 0.13, "learning_rate": 9.742056700002074e-06, "loss": 1.4084, "step": 5589 }, { "epoch": 0.13, "learning_rate": 9.741937616893218e-06, "loss": 1.0276, "step": 5590 }, { "epoch": 0.13, "learning_rate": 9.741818507030674e-06, "loss": 0.9794, "step": 5591 }, { "epoch": 0.13, "learning_rate": 9.741699370415112e-06, "loss": 1.1266, "step": 5592 }, { "epoch": 0.13, "learning_rate": 9.741580207047203e-06, "loss": 0.92, "step": 5593 }, { "epoch": 0.13, "learning_rate": 9.741461016927623e-06, "loss": 0.981, "step": 5594 }, { "epoch": 0.13, "learning_rate": 9.741341800057042e-06, "loss": 1.0406, "step": 5595 }, { "epoch": 0.13, "learning_rate": 9.741222556436132e-06, "loss": 0.9646, "step": 5596 }, { "epoch": 0.13, "learning_rate": 9.741103286065568e-06, "loss": 0.9523, "step": 5597 }, { "epoch": 0.13, "learning_rate": 9.740983988946022e-06, "loss": 1.2261, "step": 5598 }, { "epoch": 0.13, "learning_rate": 9.740864665078166e-06, "loss": 1.0691, "step": 5599 }, { "epoch": 0.13, "learning_rate": 9.740745314462674e-06, "loss": 0.8547, "step": 5600 }, { "epoch": 0.13, "learning_rate": 9.740625937100222e-06, "loss": 1.013, "step": 5601 }, { "epoch": 0.13, "learning_rate": 9.740506532991476e-06, "loss": 1.0055, "step": 5602 }, { "epoch": 0.13, "learning_rate": 9.740387102137119e-06, "loss": 0.9175, "step": 5603 }, { "epoch": 0.13, "learning_rate": 9.740267644537817e-06, "loss": 1.2002, "step": 5604 }, { "epoch": 0.13, "learning_rate": 9.74014816019425e-06, "loss": 0.9351, "step": 5605 }, { "epoch": 0.13, "learning_rate": 9.740028649107089e-06, "loss": 1.1823, "step": 5606 }, { "epoch": 0.13, "learning_rate": 9.739909111277008e-06, "loss": 1.0452, "step": 5607 }, { "epoch": 0.13, "learning_rate": 9.739789546704683e-06, "loss": 0.9374, "step": 5608 }, { "epoch": 0.13, "learning_rate": 9.739669955390787e-06, "loss": 0.8496, "step": 5609 }, { "epoch": 0.13, "learning_rate": 9.739550337335996e-06, "loss": 1.2706, "step": 5610 }, { "epoch": 0.13, "learning_rate": 9.739430692540986e-06, "loss": 1.063, "step": 5611 }, { "epoch": 0.13, "learning_rate": 9.739311021006427e-06, "loss": 1.0005, "step": 5612 }, { "epoch": 0.13, "learning_rate": 9.739191322732999e-06, "loss": 1.169, "step": 5613 }, { "epoch": 0.13, "learning_rate": 9.739071597721376e-06, "loss": 1.0787, "step": 5614 }, { "epoch": 0.13, "learning_rate": 9.738951845972234e-06, "loss": 0.9986, "step": 5615 }, { "epoch": 0.13, "learning_rate": 9.738832067486249e-06, "loss": 0.8609, "step": 5616 }, { "epoch": 0.13, "learning_rate": 9.738712262264094e-06, "loss": 1.0484, "step": 5617 }, { "epoch": 0.13, "learning_rate": 9.738592430306446e-06, "loss": 0.914, "step": 5618 }, { "epoch": 0.13, "learning_rate": 9.738472571613984e-06, "loss": 0.9058, "step": 5619 }, { "epoch": 0.13, "learning_rate": 9.73835268618738e-06, "loss": 0.9561, "step": 5620 }, { "epoch": 0.13, "learning_rate": 9.738232774027315e-06, "loss": 1.0945, "step": 5621 }, { "epoch": 0.13, "learning_rate": 9.73811283513446e-06, "loss": 0.9777, "step": 5622 }, { "epoch": 0.13, "learning_rate": 9.737992869509497e-06, "loss": 0.6759, "step": 5623 }, { "epoch": 0.13, "learning_rate": 9.737872877153099e-06, "loss": 0.88, "step": 5624 }, { "epoch": 0.13, "learning_rate": 9.737752858065945e-06, "loss": 0.9003, "step": 5625 }, { "epoch": 0.13, "learning_rate": 9.737632812248711e-06, "loss": 1.0407, "step": 5626 }, { "epoch": 0.13, "learning_rate": 9.737512739702078e-06, "loss": 0.8589, "step": 5627 }, { "epoch": 0.13, "learning_rate": 9.737392640426718e-06, "loss": 0.9976, "step": 5628 }, { "epoch": 0.13, "learning_rate": 9.73727251442331e-06, "loss": 0.9345, "step": 5629 }, { "epoch": 0.13, "learning_rate": 9.737152361692534e-06, "loss": 1.2138, "step": 5630 }, { "epoch": 0.13, "learning_rate": 9.737032182235067e-06, "loss": 1.2667, "step": 5631 }, { "epoch": 0.13, "learning_rate": 9.736911976051586e-06, "loss": 1.1503, "step": 5632 }, { "epoch": 0.13, "learning_rate": 9.736791743142769e-06, "loss": 0.987, "step": 5633 }, { "epoch": 0.13, "learning_rate": 9.736671483509297e-06, "loss": 1.3222, "step": 5634 }, { "epoch": 0.13, "learning_rate": 9.736551197151845e-06, "loss": 1.3624, "step": 5635 }, { "epoch": 0.13, "learning_rate": 9.736430884071093e-06, "loss": 0.9438, "step": 5636 }, { "epoch": 0.13, "learning_rate": 9.736310544267721e-06, "loss": 1.1385, "step": 5637 }, { "epoch": 0.13, "learning_rate": 9.736190177742408e-06, "loss": 0.9518, "step": 5638 }, { "epoch": 0.13, "learning_rate": 9.736069784495832e-06, "loss": 1.0127, "step": 5639 }, { "epoch": 0.13, "learning_rate": 9.735949364528672e-06, "loss": 1.0573, "step": 5640 }, { "epoch": 0.13, "learning_rate": 9.735828917841607e-06, "loss": 1.399, "step": 5641 }, { "epoch": 0.13, "learning_rate": 9.735708444435319e-06, "loss": 1.02, "step": 5642 }, { "epoch": 0.13, "learning_rate": 9.735587944310485e-06, "loss": 0.8851, "step": 5643 }, { "epoch": 0.13, "learning_rate": 9.735467417467786e-06, "loss": 1.0406, "step": 5644 }, { "epoch": 0.13, "learning_rate": 9.735346863907902e-06, "loss": 1.0295, "step": 5645 }, { "epoch": 0.13, "learning_rate": 9.735226283631514e-06, "loss": 1.238, "step": 5646 }, { "epoch": 0.13, "learning_rate": 9.7351056766393e-06, "loss": 1.1671, "step": 5647 }, { "epoch": 0.13, "learning_rate": 9.734985042931941e-06, "loss": 0.8592, "step": 5648 }, { "epoch": 0.13, "learning_rate": 9.73486438251012e-06, "loss": 0.9305, "step": 5649 }, { "epoch": 0.13, "learning_rate": 9.734743695374516e-06, "loss": 1.107, "step": 5650 }, { "epoch": 0.13, "learning_rate": 9.734622981525811e-06, "loss": 1.2086, "step": 5651 }, { "epoch": 0.13, "learning_rate": 9.734502240964684e-06, "loss": 0.8988, "step": 5652 }, { "epoch": 0.13, "learning_rate": 9.734381473691818e-06, "loss": 1.3773, "step": 5653 }, { "epoch": 0.13, "learning_rate": 9.734260679707894e-06, "loss": 1.3102, "step": 5654 }, { "epoch": 0.13, "learning_rate": 9.734139859013592e-06, "loss": 0.889, "step": 5655 }, { "epoch": 0.13, "learning_rate": 9.734019011609597e-06, "loss": 0.9946, "step": 5656 }, { "epoch": 0.13, "learning_rate": 9.733898137496586e-06, "loss": 1.3074, "step": 5657 }, { "epoch": 0.13, "learning_rate": 9.733777236675246e-06, "loss": 1.0416, "step": 5658 }, { "epoch": 0.13, "learning_rate": 9.733656309146256e-06, "loss": 1.102, "step": 5659 }, { "epoch": 0.13, "learning_rate": 9.733535354910298e-06, "loss": 1.0838, "step": 5660 }, { "epoch": 0.13, "learning_rate": 9.733414373968057e-06, "loss": 1.033, "step": 5661 }, { "epoch": 0.13, "learning_rate": 9.733293366320213e-06, "loss": 0.9388, "step": 5662 }, { "epoch": 0.13, "learning_rate": 9.73317233196745e-06, "loss": 1.1913, "step": 5663 }, { "epoch": 0.13, "learning_rate": 9.733051270910452e-06, "loss": 1.2959, "step": 5664 }, { "epoch": 0.13, "learning_rate": 9.7329301831499e-06, "loss": 0.9955, "step": 5665 }, { "epoch": 0.13, "learning_rate": 9.732809068686477e-06, "loss": 0.8277, "step": 5666 }, { "epoch": 0.13, "learning_rate": 9.732687927520868e-06, "loss": 0.8951, "step": 5667 }, { "epoch": 0.13, "learning_rate": 9.732566759653756e-06, "loss": 0.9427, "step": 5668 }, { "epoch": 0.13, "learning_rate": 9.732445565085823e-06, "loss": 1.1053, "step": 5669 }, { "epoch": 0.13, "learning_rate": 9.732324343817755e-06, "loss": 0.9476, "step": 5670 }, { "epoch": 0.13, "learning_rate": 9.732203095850234e-06, "loss": 0.9422, "step": 5671 }, { "epoch": 0.13, "learning_rate": 9.732081821183945e-06, "loss": 1.1377, "step": 5672 }, { "epoch": 0.13, "learning_rate": 9.731960519819574e-06, "loss": 0.8576, "step": 5673 }, { "epoch": 0.13, "learning_rate": 9.731839191757802e-06, "loss": 1.0807, "step": 5674 }, { "epoch": 0.13, "learning_rate": 9.731717836999315e-06, "loss": 1.0789, "step": 5675 }, { "epoch": 0.13, "learning_rate": 9.7315964555448e-06, "loss": 1.1779, "step": 5676 }, { "epoch": 0.13, "learning_rate": 9.731475047394939e-06, "loss": 1.0613, "step": 5677 }, { "epoch": 0.13, "learning_rate": 9.731353612550417e-06, "loss": 1.0038, "step": 5678 }, { "epoch": 0.13, "learning_rate": 9.731232151011917e-06, "loss": 1.0272, "step": 5679 }, { "epoch": 0.13, "learning_rate": 9.73111066278013e-06, "loss": 1.0186, "step": 5680 }, { "epoch": 0.13, "learning_rate": 9.730989147855739e-06, "loss": 0.7606, "step": 5681 }, { "epoch": 0.13, "learning_rate": 9.730867606239427e-06, "loss": 0.9811, "step": 5682 }, { "epoch": 0.13, "learning_rate": 9.730746037931883e-06, "loss": 1.1917, "step": 5683 }, { "epoch": 0.13, "learning_rate": 9.730624442933791e-06, "loss": 1.0234, "step": 5684 }, { "epoch": 0.13, "learning_rate": 9.730502821245839e-06, "loss": 0.9118, "step": 5685 }, { "epoch": 0.13, "learning_rate": 9.73038117286871e-06, "loss": 1.131, "step": 5686 }, { "epoch": 0.13, "learning_rate": 9.730259497803095e-06, "loss": 1.1182, "step": 5687 }, { "epoch": 0.13, "learning_rate": 9.730137796049675e-06, "loss": 0.9517, "step": 5688 }, { "epoch": 0.13, "learning_rate": 9.730016067609139e-06, "loss": 0.5807, "step": 5689 }, { "epoch": 0.13, "learning_rate": 9.729894312482176e-06, "loss": 1.1703, "step": 5690 }, { "epoch": 0.13, "learning_rate": 9.729772530669468e-06, "loss": 0.9812, "step": 5691 }, { "epoch": 0.13, "learning_rate": 9.729650722171708e-06, "loss": 1.239, "step": 5692 }, { "epoch": 0.13, "learning_rate": 9.72952888698958e-06, "loss": 1.3523, "step": 5693 }, { "epoch": 0.13, "learning_rate": 9.729407025123771e-06, "loss": 1.2194, "step": 5694 }, { "epoch": 0.13, "learning_rate": 9.72928513657497e-06, "loss": 0.9001, "step": 5695 }, { "epoch": 0.13, "learning_rate": 9.729163221343863e-06, "loss": 1.0158, "step": 5696 }, { "epoch": 0.13, "learning_rate": 9.72904127943114e-06, "loss": 1.2025, "step": 5697 }, { "epoch": 0.13, "learning_rate": 9.728919310837486e-06, "loss": 0.9323, "step": 5698 }, { "epoch": 0.13, "learning_rate": 9.728797315563592e-06, "loss": 0.8138, "step": 5699 }, { "epoch": 0.13, "learning_rate": 9.728675293610146e-06, "loss": 1.1856, "step": 5700 }, { "epoch": 0.13, "learning_rate": 9.728553244977834e-06, "loss": 1.2074, "step": 5701 }, { "epoch": 0.13, "learning_rate": 9.728431169667347e-06, "loss": 1.1268, "step": 5702 }, { "epoch": 0.13, "learning_rate": 9.728309067679373e-06, "loss": 1.1188, "step": 5703 }, { "epoch": 0.13, "learning_rate": 9.7281869390146e-06, "loss": 1.0834, "step": 5704 }, { "epoch": 0.13, "learning_rate": 9.728064783673721e-06, "loss": 0.8502, "step": 5705 }, { "epoch": 0.13, "learning_rate": 9.727942601657418e-06, "loss": 0.9262, "step": 5706 }, { "epoch": 0.13, "learning_rate": 9.727820392966387e-06, "loss": 1.1354, "step": 5707 }, { "epoch": 0.13, "learning_rate": 9.727698157601315e-06, "loss": 1.0516, "step": 5708 }, { "epoch": 0.13, "learning_rate": 9.72757589556289e-06, "loss": 1.2421, "step": 5709 }, { "epoch": 0.13, "learning_rate": 9.727453606851804e-06, "loss": 1.303, "step": 5710 }, { "epoch": 0.13, "learning_rate": 9.727331291468747e-06, "loss": 1.2143, "step": 5711 }, { "epoch": 0.13, "learning_rate": 9.727208949414408e-06, "loss": 1.0169, "step": 5712 }, { "epoch": 0.13, "learning_rate": 9.727086580689477e-06, "loss": 1.092, "step": 5713 }, { "epoch": 0.13, "learning_rate": 9.726964185294646e-06, "loss": 1.1764, "step": 5714 }, { "epoch": 0.13, "learning_rate": 9.726841763230604e-06, "loss": 1.1148, "step": 5715 }, { "epoch": 0.13, "learning_rate": 9.726719314498043e-06, "loss": 0.9527, "step": 5716 }, { "epoch": 0.13, "learning_rate": 9.726596839097653e-06, "loss": 0.9117, "step": 5717 }, { "epoch": 0.13, "learning_rate": 9.726474337030123e-06, "loss": 0.9648, "step": 5718 }, { "epoch": 0.13, "learning_rate": 9.726351808296148e-06, "loss": 1.1023, "step": 5719 }, { "epoch": 0.13, "learning_rate": 9.72622925289642e-06, "loss": 1.2311, "step": 5720 }, { "epoch": 0.13, "learning_rate": 9.726106670831624e-06, "loss": 1.0425, "step": 5721 }, { "epoch": 0.13, "learning_rate": 9.725984062102458e-06, "loss": 1.0491, "step": 5722 }, { "epoch": 0.13, "learning_rate": 9.725861426709611e-06, "loss": 0.9862, "step": 5723 }, { "epoch": 0.13, "learning_rate": 9.725738764653773e-06, "loss": 1.0443, "step": 5724 }, { "epoch": 0.13, "learning_rate": 9.725616075935642e-06, "loss": 1.1558, "step": 5725 }, { "epoch": 0.13, "learning_rate": 9.725493360555904e-06, "loss": 1.1981, "step": 5726 }, { "epoch": 0.13, "learning_rate": 9.725370618515255e-06, "loss": 1.01, "step": 5727 }, { "epoch": 0.13, "learning_rate": 9.725247849814387e-06, "loss": 1.0274, "step": 5728 }, { "epoch": 0.13, "learning_rate": 9.72512505445399e-06, "loss": 1.0984, "step": 5729 }, { "epoch": 0.13, "learning_rate": 9.72500223243476e-06, "loss": 1.2458, "step": 5730 }, { "epoch": 0.13, "learning_rate": 9.724879383757389e-06, "loss": 0.9367, "step": 5731 }, { "epoch": 0.13, "learning_rate": 9.72475650842257e-06, "loss": 1.1687, "step": 5732 }, { "epoch": 0.13, "learning_rate": 9.724633606430996e-06, "loss": 1.2343, "step": 5733 }, { "epoch": 0.13, "learning_rate": 9.724510677783361e-06, "loss": 1.0309, "step": 5734 }, { "epoch": 0.13, "learning_rate": 9.724387722480358e-06, "loss": 0.854, "step": 5735 }, { "epoch": 0.13, "learning_rate": 9.72426474052268e-06, "loss": 1.0152, "step": 5736 }, { "epoch": 0.13, "learning_rate": 9.724141731911022e-06, "loss": 1.2483, "step": 5737 }, { "epoch": 0.13, "learning_rate": 9.724018696646077e-06, "loss": 1.0173, "step": 5738 }, { "epoch": 0.13, "learning_rate": 9.72389563472854e-06, "loss": 1.1335, "step": 5739 }, { "epoch": 0.13, "learning_rate": 9.723772546159108e-06, "loss": 0.9113, "step": 5740 }, { "epoch": 0.13, "learning_rate": 9.72364943093847e-06, "loss": 0.715, "step": 5741 }, { "epoch": 0.13, "learning_rate": 9.723526289067322e-06, "loss": 1.1702, "step": 5742 }, { "epoch": 0.13, "learning_rate": 9.723403120546362e-06, "loss": 1.3655, "step": 5743 }, { "epoch": 0.13, "learning_rate": 9.723279925376283e-06, "loss": 1.0511, "step": 5744 }, { "epoch": 0.13, "learning_rate": 9.723156703557778e-06, "loss": 1.1022, "step": 5745 }, { "epoch": 0.13, "learning_rate": 9.723033455091546e-06, "loss": 0.9528, "step": 5746 }, { "epoch": 0.13, "learning_rate": 9.72291017997828e-06, "loss": 0.9427, "step": 5747 }, { "epoch": 0.13, "learning_rate": 9.722786878218675e-06, "loss": 1.2186, "step": 5748 }, { "epoch": 0.13, "learning_rate": 9.72266354981343e-06, "loss": 1.0595, "step": 5749 }, { "epoch": 0.13, "learning_rate": 9.722540194763237e-06, "loss": 1.2855, "step": 5750 }, { "epoch": 0.13, "learning_rate": 9.722416813068794e-06, "loss": 1.2384, "step": 5751 }, { "epoch": 0.13, "learning_rate": 9.722293404730797e-06, "loss": 1.0706, "step": 5752 }, { "epoch": 0.13, "learning_rate": 9.722169969749939e-06, "loss": 0.8825, "step": 5753 }, { "epoch": 0.13, "learning_rate": 9.722046508126922e-06, "loss": 1.1106, "step": 5754 }, { "epoch": 0.13, "learning_rate": 9.721923019862439e-06, "loss": 1.107, "step": 5755 }, { "epoch": 0.13, "learning_rate": 9.721799504957188e-06, "loss": 1.0324, "step": 5756 }, { "epoch": 0.13, "learning_rate": 9.721675963411864e-06, "loss": 0.9329, "step": 5757 }, { "epoch": 0.13, "learning_rate": 9.721552395227168e-06, "loss": 1.502, "step": 5758 }, { "epoch": 0.13, "learning_rate": 9.721428800403792e-06, "loss": 0.9986, "step": 5759 }, { "epoch": 0.13, "learning_rate": 9.721305178942435e-06, "loss": 1.2988, "step": 5760 }, { "epoch": 0.13, "learning_rate": 9.721181530843799e-06, "loss": 1.0386, "step": 5761 }, { "epoch": 0.13, "learning_rate": 9.721057856108575e-06, "loss": 1.0502, "step": 5762 }, { "epoch": 0.13, "learning_rate": 9.720934154737465e-06, "loss": 0.8081, "step": 5763 }, { "epoch": 0.13, "learning_rate": 9.720810426731166e-06, "loss": 0.894, "step": 5764 }, { "epoch": 0.13, "learning_rate": 9.720686672090374e-06, "loss": 1.0424, "step": 5765 }, { "epoch": 0.13, "learning_rate": 9.72056289081579e-06, "loss": 0.9574, "step": 5766 }, { "epoch": 0.13, "learning_rate": 9.720439082908111e-06, "loss": 1.0051, "step": 5767 }, { "epoch": 0.13, "learning_rate": 9.720315248368036e-06, "loss": 1.1426, "step": 5768 }, { "epoch": 0.13, "learning_rate": 9.720191387196263e-06, "loss": 1.0004, "step": 5769 }, { "epoch": 0.13, "learning_rate": 9.720067499393494e-06, "loss": 1.2909, "step": 5770 }, { "epoch": 0.13, "learning_rate": 9.71994358496042e-06, "loss": 0.9542, "step": 5771 }, { "epoch": 0.13, "learning_rate": 9.71981964389775e-06, "loss": 0.8761, "step": 5772 }, { "epoch": 0.13, "learning_rate": 9.719695676206176e-06, "loss": 1.1493, "step": 5773 }, { "epoch": 0.13, "learning_rate": 9.719571681886402e-06, "loss": 1.1083, "step": 5774 }, { "epoch": 0.13, "learning_rate": 9.719447660939123e-06, "loss": 1.1331, "step": 5775 }, { "epoch": 0.13, "learning_rate": 9.719323613365044e-06, "loss": 1.108, "step": 5776 }, { "epoch": 0.13, "learning_rate": 9.719199539164859e-06, "loss": 0.9493, "step": 5777 }, { "epoch": 0.13, "learning_rate": 9.719075438339274e-06, "loss": 0.9829, "step": 5778 }, { "epoch": 0.13, "learning_rate": 9.718951310888985e-06, "loss": 1.0337, "step": 5779 }, { "epoch": 0.13, "learning_rate": 9.718827156814694e-06, "loss": 0.9023, "step": 5780 }, { "epoch": 0.13, "learning_rate": 9.718702976117102e-06, "loss": 1.3945, "step": 5781 }, { "epoch": 0.13, "learning_rate": 9.718578768796909e-06, "loss": 1.1888, "step": 5782 }, { "epoch": 0.13, "learning_rate": 9.718454534854814e-06, "loss": 1.1309, "step": 5783 }, { "epoch": 0.13, "learning_rate": 9.71833027429152e-06, "loss": 1.2705, "step": 5784 }, { "epoch": 0.13, "learning_rate": 9.718205987107728e-06, "loss": 1.1256, "step": 5785 }, { "epoch": 0.13, "learning_rate": 9.718081673304139e-06, "loss": 1.1596, "step": 5786 }, { "epoch": 0.13, "learning_rate": 9.717957332881454e-06, "loss": 0.8656, "step": 5787 }, { "epoch": 0.13, "learning_rate": 9.717832965840373e-06, "loss": 1.0268, "step": 5788 }, { "epoch": 0.13, "learning_rate": 9.717708572181602e-06, "loss": 0.93, "step": 5789 }, { "epoch": 0.13, "learning_rate": 9.717584151905836e-06, "loss": 1.0006, "step": 5790 }, { "epoch": 0.13, "learning_rate": 9.717459705013785e-06, "loss": 1.1507, "step": 5791 }, { "epoch": 0.13, "learning_rate": 9.717335231506146e-06, "loss": 0.7514, "step": 5792 }, { "epoch": 0.13, "learning_rate": 9.717210731383622e-06, "loss": 1.1305, "step": 5793 }, { "epoch": 0.13, "learning_rate": 9.717086204646916e-06, "loss": 1.0819, "step": 5794 }, { "epoch": 0.13, "learning_rate": 9.716961651296732e-06, "loss": 1.1087, "step": 5795 }, { "epoch": 0.13, "learning_rate": 9.716837071333768e-06, "loss": 0.8559, "step": 5796 }, { "epoch": 0.13, "learning_rate": 9.716712464758732e-06, "loss": 1.157, "step": 5797 }, { "epoch": 0.13, "learning_rate": 9.716587831572326e-06, "loss": 1.169, "step": 5798 }, { "epoch": 0.13, "learning_rate": 9.716463171775252e-06, "loss": 0.8899, "step": 5799 }, { "epoch": 0.13, "learning_rate": 9.716338485368213e-06, "loss": 1.2088, "step": 5800 }, { "epoch": 0.13, "learning_rate": 9.716213772351915e-06, "loss": 1.1304, "step": 5801 }, { "epoch": 0.13, "learning_rate": 9.716089032727056e-06, "loss": 0.9438, "step": 5802 }, { "epoch": 0.13, "learning_rate": 9.715964266494346e-06, "loss": 0.9115, "step": 5803 }, { "epoch": 0.13, "learning_rate": 9.715839473654486e-06, "loss": 1.0551, "step": 5804 }, { "epoch": 0.13, "learning_rate": 9.715714654208181e-06, "loss": 0.988, "step": 5805 }, { "epoch": 0.13, "learning_rate": 9.715589808156135e-06, "loss": 1.1951, "step": 5806 }, { "epoch": 0.13, "learning_rate": 9.715464935499049e-06, "loss": 1.1331, "step": 5807 }, { "epoch": 0.13, "learning_rate": 9.715340036237632e-06, "loss": 1.2687, "step": 5808 }, { "epoch": 0.13, "learning_rate": 9.715215110372588e-06, "loss": 1.1312, "step": 5809 }, { "epoch": 0.13, "learning_rate": 9.715090157904621e-06, "loss": 1.0308, "step": 5810 }, { "epoch": 0.13, "learning_rate": 9.714965178834437e-06, "loss": 1.1968, "step": 5811 }, { "epoch": 0.13, "learning_rate": 9.714840173162738e-06, "loss": 0.9782, "step": 5812 }, { "epoch": 0.13, "learning_rate": 9.714715140890232e-06, "loss": 1.3123, "step": 5813 }, { "epoch": 0.13, "learning_rate": 9.714590082017625e-06, "loss": 0.9937, "step": 5814 }, { "epoch": 0.13, "learning_rate": 9.714464996545621e-06, "loss": 1.1631, "step": 5815 }, { "epoch": 0.13, "learning_rate": 9.714339884474925e-06, "loss": 0.939, "step": 5816 }, { "epoch": 0.13, "learning_rate": 9.714214745806248e-06, "loss": 1.1069, "step": 5817 }, { "epoch": 0.13, "learning_rate": 9.714089580540287e-06, "loss": 1.248, "step": 5818 }, { "epoch": 0.13, "learning_rate": 9.713964388677756e-06, "loss": 0.9304, "step": 5819 }, { "epoch": 0.13, "learning_rate": 9.713839170219358e-06, "loss": 1.1968, "step": 5820 }, { "epoch": 0.13, "learning_rate": 9.7137139251658e-06, "loss": 0.9092, "step": 5821 }, { "epoch": 0.14, "learning_rate": 9.71358865351779e-06, "loss": 1.0686, "step": 5822 }, { "epoch": 0.14, "learning_rate": 9.713463355276032e-06, "loss": 0.9954, "step": 5823 }, { "epoch": 0.14, "learning_rate": 9.713338030441232e-06, "loss": 1.0812, "step": 5824 }, { "epoch": 0.14, "learning_rate": 9.713212679014103e-06, "loss": 0.9733, "step": 5825 }, { "epoch": 0.14, "learning_rate": 9.713087300995348e-06, "loss": 1.0302, "step": 5826 }, { "epoch": 0.14, "learning_rate": 9.712961896385674e-06, "loss": 1.1613, "step": 5827 }, { "epoch": 0.14, "learning_rate": 9.712836465185792e-06, "loss": 1.1284, "step": 5828 }, { "epoch": 0.14, "learning_rate": 9.712711007396403e-06, "loss": 0.9137, "step": 5829 }, { "epoch": 0.14, "learning_rate": 9.712585523018223e-06, "loss": 0.9749, "step": 5830 }, { "epoch": 0.14, "learning_rate": 9.712460012051954e-06, "loss": 0.9992, "step": 5831 }, { "epoch": 0.14, "learning_rate": 9.712334474498306e-06, "loss": 0.6692, "step": 5832 }, { "epoch": 0.14, "learning_rate": 9.71220891035799e-06, "loss": 1.09, "step": 5833 }, { "epoch": 0.14, "learning_rate": 9.71208331963171e-06, "loss": 1.0398, "step": 5834 }, { "epoch": 0.14, "learning_rate": 9.711957702320176e-06, "loss": 1.243, "step": 5835 }, { "epoch": 0.14, "learning_rate": 9.711832058424096e-06, "loss": 0.9655, "step": 5836 }, { "epoch": 0.14, "learning_rate": 9.711706387944182e-06, "loss": 0.9559, "step": 5837 }, { "epoch": 0.14, "learning_rate": 9.71158069088114e-06, "loss": 1.1423, "step": 5838 }, { "epoch": 0.14, "learning_rate": 9.71145496723568e-06, "loss": 1.0994, "step": 5839 }, { "epoch": 0.14, "learning_rate": 9.711329217008514e-06, "loss": 0.894, "step": 5840 }, { "epoch": 0.14, "learning_rate": 9.711203440200347e-06, "loss": 1.0547, "step": 5841 }, { "epoch": 0.14, "learning_rate": 9.71107763681189e-06, "loss": 1.1291, "step": 5842 }, { "epoch": 0.14, "learning_rate": 9.710951806843856e-06, "loss": 0.8537, "step": 5843 }, { "epoch": 0.14, "learning_rate": 9.71082595029695e-06, "loss": 0.6732, "step": 5844 }, { "epoch": 0.14, "learning_rate": 9.710700067171885e-06, "loss": 1.1514, "step": 5845 }, { "epoch": 0.14, "learning_rate": 9.71057415746937e-06, "loss": 0.825, "step": 5846 }, { "epoch": 0.14, "learning_rate": 9.710448221190117e-06, "loss": 1.007, "step": 5847 }, { "epoch": 0.14, "learning_rate": 9.710322258334836e-06, "loss": 0.8138, "step": 5848 }, { "epoch": 0.14, "learning_rate": 9.710196268904238e-06, "loss": 1.1131, "step": 5849 }, { "epoch": 0.14, "learning_rate": 9.71007025289903e-06, "loss": 1.2163, "step": 5850 }, { "epoch": 0.14, "learning_rate": 9.709944210319928e-06, "loss": 1.4588, "step": 5851 }, { "epoch": 0.14, "learning_rate": 9.70981814116764e-06, "loss": 0.7943, "step": 5852 }, { "epoch": 0.14, "learning_rate": 9.70969204544288e-06, "loss": 1.002, "step": 5853 }, { "epoch": 0.14, "learning_rate": 9.709565923146357e-06, "loss": 0.8993, "step": 5854 }, { "epoch": 0.14, "learning_rate": 9.709439774278784e-06, "loss": 1.3012, "step": 5855 }, { "epoch": 0.14, "learning_rate": 9.70931359884087e-06, "loss": 0.8592, "step": 5856 }, { "epoch": 0.14, "learning_rate": 9.709187396833331e-06, "loss": 1.0929, "step": 5857 }, { "epoch": 0.14, "learning_rate": 9.709061168256878e-06, "loss": 0.9083, "step": 5858 }, { "epoch": 0.14, "learning_rate": 9.70893491311222e-06, "loss": 1.024, "step": 5859 }, { "epoch": 0.14, "learning_rate": 9.708808631400073e-06, "loss": 1.0478, "step": 5860 }, { "epoch": 0.14, "learning_rate": 9.708682323121146e-06, "loss": 0.9191, "step": 5861 }, { "epoch": 0.14, "learning_rate": 9.708555988276156e-06, "loss": 1.2379, "step": 5862 }, { "epoch": 0.14, "learning_rate": 9.708429626865812e-06, "loss": 0.8092, "step": 5863 }, { "epoch": 0.14, "learning_rate": 9.708303238890828e-06, "loss": 1.2849, "step": 5864 }, { "epoch": 0.14, "learning_rate": 9.708176824351918e-06, "loss": 1.0576, "step": 5865 }, { "epoch": 0.14, "learning_rate": 9.708050383249795e-06, "loss": 1.1653, "step": 5866 }, { "epoch": 0.14, "learning_rate": 9.70792391558517e-06, "loss": 1.0569, "step": 5867 }, { "epoch": 0.14, "learning_rate": 9.707797421358763e-06, "loss": 1.0125, "step": 5868 }, { "epoch": 0.14, "learning_rate": 9.70767090057128e-06, "loss": 0.759, "step": 5869 }, { "epoch": 0.14, "learning_rate": 9.707544353223437e-06, "loss": 1.2091, "step": 5870 }, { "epoch": 0.14, "learning_rate": 9.70741777931595e-06, "loss": 1.0522, "step": 5871 }, { "epoch": 0.14, "learning_rate": 9.707291178849534e-06, "loss": 1.1022, "step": 5872 }, { "epoch": 0.14, "learning_rate": 9.7071645518249e-06, "loss": 0.9524, "step": 5873 }, { "epoch": 0.14, "learning_rate": 9.707037898242763e-06, "loss": 1.2309, "step": 5874 }, { "epoch": 0.14, "learning_rate": 9.706911218103839e-06, "loss": 0.9733, "step": 5875 }, { "epoch": 0.14, "learning_rate": 9.706784511408842e-06, "loss": 0.9969, "step": 5876 }, { "epoch": 0.14, "learning_rate": 9.706657778158486e-06, "loss": 1.2893, "step": 5877 }, { "epoch": 0.14, "learning_rate": 9.706531018353487e-06, "loss": 0.8737, "step": 5878 }, { "epoch": 0.14, "learning_rate": 9.706404231994562e-06, "loss": 1.0234, "step": 5879 }, { "epoch": 0.14, "learning_rate": 9.706277419082423e-06, "loss": 1.0792, "step": 5880 }, { "epoch": 0.14, "learning_rate": 9.706150579617788e-06, "loss": 1.0652, "step": 5881 }, { "epoch": 0.14, "learning_rate": 9.70602371360137e-06, "loss": 1.1231, "step": 5882 }, { "epoch": 0.14, "learning_rate": 9.705896821033888e-06, "loss": 1.0492, "step": 5883 }, { "epoch": 0.14, "learning_rate": 9.705769901916055e-06, "loss": 1.1685, "step": 5884 }, { "epoch": 0.14, "learning_rate": 9.705642956248588e-06, "loss": 1.3859, "step": 5885 }, { "epoch": 0.14, "learning_rate": 9.705515984032205e-06, "loss": 1.1524, "step": 5886 }, { "epoch": 0.14, "learning_rate": 9.70538898526762e-06, "loss": 0.957, "step": 5887 }, { "epoch": 0.14, "learning_rate": 9.705261959955551e-06, "loss": 1.3481, "step": 5888 }, { "epoch": 0.14, "learning_rate": 9.705134908096714e-06, "loss": 1.0365, "step": 5889 }, { "epoch": 0.14, "learning_rate": 9.705007829691825e-06, "loss": 1.1142, "step": 5890 }, { "epoch": 0.14, "learning_rate": 9.704880724741603e-06, "loss": 0.9774, "step": 5891 }, { "epoch": 0.14, "learning_rate": 9.704753593246762e-06, "loss": 0.9541, "step": 5892 }, { "epoch": 0.14, "learning_rate": 9.704626435208022e-06, "loss": 1.0801, "step": 5893 }, { "epoch": 0.14, "learning_rate": 9.704499250626101e-06, "loss": 1.2574, "step": 5894 }, { "epoch": 0.14, "learning_rate": 9.704372039501715e-06, "loss": 0.9418, "step": 5895 }, { "epoch": 0.14, "learning_rate": 9.70424480183558e-06, "loss": 1.0401, "step": 5896 }, { "epoch": 0.14, "learning_rate": 9.70411753762842e-06, "loss": 1.0227, "step": 5897 }, { "epoch": 0.14, "learning_rate": 9.703990246880944e-06, "loss": 1.0713, "step": 5898 }, { "epoch": 0.14, "learning_rate": 9.703862929593877e-06, "loss": 1.1796, "step": 5899 }, { "epoch": 0.14, "learning_rate": 9.703735585767936e-06, "loss": 0.9144, "step": 5900 }, { "epoch": 0.14, "learning_rate": 9.703608215403838e-06, "loss": 1.3089, "step": 5901 }, { "epoch": 0.14, "learning_rate": 9.703480818502302e-06, "loss": 1.1674, "step": 5902 }, { "epoch": 0.14, "learning_rate": 9.703353395064048e-06, "loss": 0.9773, "step": 5903 }, { "epoch": 0.14, "learning_rate": 9.703225945089793e-06, "loss": 1.0062, "step": 5904 }, { "epoch": 0.14, "learning_rate": 9.70309846858026e-06, "loss": 0.7902, "step": 5905 }, { "epoch": 0.14, "learning_rate": 9.702970965536163e-06, "loss": 1.0594, "step": 5906 }, { "epoch": 0.14, "learning_rate": 9.702843435958223e-06, "loss": 1.0576, "step": 5907 }, { "epoch": 0.14, "learning_rate": 9.702715879847162e-06, "loss": 1.1369, "step": 5908 }, { "epoch": 0.14, "learning_rate": 9.702588297203696e-06, "loss": 1.051, "step": 5909 }, { "epoch": 0.14, "learning_rate": 9.702460688028547e-06, "loss": 1.1072, "step": 5910 }, { "epoch": 0.14, "learning_rate": 9.702333052322437e-06, "loss": 1.093, "step": 5911 }, { "epoch": 0.14, "learning_rate": 9.702205390086081e-06, "loss": 1.2921, "step": 5912 }, { "epoch": 0.14, "learning_rate": 9.702077701320204e-06, "loss": 0.9931, "step": 5913 }, { "epoch": 0.14, "learning_rate": 9.701949986025523e-06, "loss": 1.0343, "step": 5914 }, { "epoch": 0.14, "learning_rate": 9.701822244202761e-06, "loss": 1.219, "step": 5915 }, { "epoch": 0.14, "learning_rate": 9.701694475852636e-06, "loss": 1.0225, "step": 5916 }, { "epoch": 0.14, "learning_rate": 9.701566680975874e-06, "loss": 1.1515, "step": 5917 }, { "epoch": 0.14, "learning_rate": 9.70143885957319e-06, "loss": 0.9644, "step": 5918 }, { "epoch": 0.14, "learning_rate": 9.701311011645309e-06, "loss": 0.9548, "step": 5919 }, { "epoch": 0.14, "learning_rate": 9.701183137192949e-06, "loss": 1.06, "step": 5920 }, { "epoch": 0.14, "learning_rate": 9.701055236216835e-06, "loss": 1.3081, "step": 5921 }, { "epoch": 0.14, "learning_rate": 9.700927308717688e-06, "loss": 1.2602, "step": 5922 }, { "epoch": 0.14, "learning_rate": 9.700799354696227e-06, "loss": 0.7633, "step": 5923 }, { "epoch": 0.14, "learning_rate": 9.700671374153176e-06, "loss": 0.9159, "step": 5924 }, { "epoch": 0.14, "learning_rate": 9.700543367089259e-06, "loss": 1.0415, "step": 5925 }, { "epoch": 0.14, "learning_rate": 9.700415333505193e-06, "loss": 1.2533, "step": 5926 }, { "epoch": 0.14, "learning_rate": 9.700287273401705e-06, "loss": 1.0945, "step": 5927 }, { "epoch": 0.14, "learning_rate": 9.700159186779517e-06, "loss": 0.9181, "step": 5928 }, { "epoch": 0.14, "learning_rate": 9.700031073639349e-06, "loss": 0.9745, "step": 5929 }, { "epoch": 0.14, "learning_rate": 9.699902933981927e-06, "loss": 1.0767, "step": 5930 }, { "epoch": 0.14, "learning_rate": 9.69977476780797e-06, "loss": 0.9466, "step": 5931 }, { "epoch": 0.14, "learning_rate": 9.699646575118204e-06, "loss": 0.9143, "step": 5932 }, { "epoch": 0.14, "learning_rate": 9.699518355913353e-06, "loss": 1.0755, "step": 5933 }, { "epoch": 0.14, "learning_rate": 9.699390110194138e-06, "loss": 1.0667, "step": 5934 }, { "epoch": 0.14, "learning_rate": 9.699261837961284e-06, "loss": 0.7622, "step": 5935 }, { "epoch": 0.14, "learning_rate": 9.699133539215515e-06, "loss": 0.9839, "step": 5936 }, { "epoch": 0.14, "learning_rate": 9.699005213957553e-06, "loss": 1.0145, "step": 5937 }, { "epoch": 0.14, "learning_rate": 9.698876862188124e-06, "loss": 1.0617, "step": 5938 }, { "epoch": 0.14, "learning_rate": 9.698748483907951e-06, "loss": 0.9126, "step": 5939 }, { "epoch": 0.14, "learning_rate": 9.69862007911776e-06, "loss": 1.1062, "step": 5940 }, { "epoch": 0.14, "learning_rate": 9.698491647818273e-06, "loss": 0.9806, "step": 5941 }, { "epoch": 0.14, "learning_rate": 9.698363190010214e-06, "loss": 1.1317, "step": 5942 }, { "epoch": 0.14, "learning_rate": 9.698234705694312e-06, "loss": 1.3705, "step": 5943 }, { "epoch": 0.14, "learning_rate": 9.69810619487129e-06, "loss": 0.9988, "step": 5944 }, { "epoch": 0.14, "learning_rate": 9.69797765754187e-06, "loss": 0.9698, "step": 5945 }, { "epoch": 0.14, "learning_rate": 9.69784909370678e-06, "loss": 1.3363, "step": 5946 }, { "epoch": 0.14, "learning_rate": 9.697720503366746e-06, "loss": 0.9826, "step": 5947 }, { "epoch": 0.14, "learning_rate": 9.697591886522491e-06, "loss": 0.8769, "step": 5948 }, { "epoch": 0.14, "learning_rate": 9.697463243174743e-06, "loss": 0.9087, "step": 5949 }, { "epoch": 0.14, "learning_rate": 9.69733457332423e-06, "loss": 1.1942, "step": 5950 }, { "epoch": 0.14, "learning_rate": 9.697205876971669e-06, "loss": 0.8521, "step": 5951 }, { "epoch": 0.14, "learning_rate": 9.697077154117795e-06, "loss": 1.078, "step": 5952 }, { "epoch": 0.14, "learning_rate": 9.696948404763332e-06, "loss": 1.0859, "step": 5953 }, { "epoch": 0.14, "learning_rate": 9.696819628909004e-06, "loss": 1.0594, "step": 5954 }, { "epoch": 0.14, "learning_rate": 9.696690826555539e-06, "loss": 0.9521, "step": 5955 }, { "epoch": 0.14, "learning_rate": 9.696561997703666e-06, "loss": 1.005, "step": 5956 }, { "epoch": 0.14, "learning_rate": 9.696433142354107e-06, "loss": 1.1018, "step": 5957 }, { "epoch": 0.14, "learning_rate": 9.696304260507593e-06, "loss": 0.9014, "step": 5958 }, { "epoch": 0.14, "learning_rate": 9.69617535216485e-06, "loss": 0.9939, "step": 5959 }, { "epoch": 0.14, "learning_rate": 9.696046417326605e-06, "loss": 1.102, "step": 5960 }, { "epoch": 0.14, "learning_rate": 9.695917455993585e-06, "loss": 1.1179, "step": 5961 }, { "epoch": 0.14, "learning_rate": 9.695788468166518e-06, "loss": 0.9659, "step": 5962 }, { "epoch": 0.14, "learning_rate": 9.695659453846132e-06, "loss": 1.0433, "step": 5963 }, { "epoch": 0.14, "learning_rate": 9.695530413033156e-06, "loss": 1.0488, "step": 5964 }, { "epoch": 0.14, "learning_rate": 9.695401345728315e-06, "loss": 1.2096, "step": 5965 }, { "epoch": 0.14, "learning_rate": 9.69527225193234e-06, "loss": 0.9863, "step": 5966 }, { "epoch": 0.14, "learning_rate": 9.69514313164596e-06, "loss": 1.0318, "step": 5967 }, { "epoch": 0.14, "learning_rate": 9.695013984869899e-06, "loss": 0.9617, "step": 5968 }, { "epoch": 0.14, "learning_rate": 9.694884811604888e-06, "loss": 0.9799, "step": 5969 }, { "epoch": 0.14, "learning_rate": 9.694755611851659e-06, "loss": 1.0366, "step": 5970 }, { "epoch": 0.14, "learning_rate": 9.694626385610938e-06, "loss": 1.0796, "step": 5971 }, { "epoch": 0.14, "learning_rate": 9.69449713288345e-06, "loss": 0.995, "step": 5972 }, { "epoch": 0.14, "learning_rate": 9.694367853669933e-06, "loss": 1.1504, "step": 5973 }, { "epoch": 0.14, "learning_rate": 9.694238547971111e-06, "loss": 0.9877, "step": 5974 }, { "epoch": 0.14, "learning_rate": 9.694109215787714e-06, "loss": 0.9994, "step": 5975 }, { "epoch": 0.14, "learning_rate": 9.693979857120471e-06, "loss": 1.4388, "step": 5976 }, { "epoch": 0.14, "learning_rate": 9.693850471970115e-06, "loss": 1.2844, "step": 5977 }, { "epoch": 0.14, "learning_rate": 9.693721060337371e-06, "loss": 1.1656, "step": 5978 }, { "epoch": 0.14, "learning_rate": 9.693591622222975e-06, "loss": 1.041, "step": 5979 }, { "epoch": 0.14, "learning_rate": 9.693462157627653e-06, "loss": 0.77, "step": 5980 }, { "epoch": 0.14, "learning_rate": 9.693332666552137e-06, "loss": 1.1578, "step": 5981 }, { "epoch": 0.14, "learning_rate": 9.693203148997158e-06, "loss": 1.1165, "step": 5982 }, { "epoch": 0.14, "learning_rate": 9.693073604963445e-06, "loss": 1.219, "step": 5983 }, { "epoch": 0.14, "learning_rate": 9.69294403445173e-06, "loss": 0.969, "step": 5984 }, { "epoch": 0.14, "learning_rate": 9.692814437462745e-06, "loss": 1.1563, "step": 5985 }, { "epoch": 0.14, "learning_rate": 9.69268481399722e-06, "loss": 0.9421, "step": 5986 }, { "epoch": 0.14, "learning_rate": 9.692555164055885e-06, "loss": 1.1369, "step": 5987 }, { "epoch": 0.14, "learning_rate": 9.692425487639474e-06, "loss": 1.0514, "step": 5988 }, { "epoch": 0.14, "learning_rate": 9.692295784748717e-06, "loss": 1.0636, "step": 5989 }, { "epoch": 0.14, "learning_rate": 9.692166055384346e-06, "loss": 0.6067, "step": 5990 }, { "epoch": 0.14, "learning_rate": 9.692036299547096e-06, "loss": 1.0546, "step": 5991 }, { "epoch": 0.14, "learning_rate": 9.691906517237694e-06, "loss": 1.0171, "step": 5992 }, { "epoch": 0.14, "learning_rate": 9.691776708456875e-06, "loss": 1.0705, "step": 5993 }, { "epoch": 0.14, "learning_rate": 9.691646873205372e-06, "loss": 1.0435, "step": 5994 }, { "epoch": 0.14, "learning_rate": 9.691517011483914e-06, "loss": 1.1081, "step": 5995 }, { "epoch": 0.14, "learning_rate": 9.691387123293238e-06, "loss": 0.8296, "step": 5996 }, { "epoch": 0.14, "learning_rate": 9.691257208634075e-06, "loss": 1.1143, "step": 5997 }, { "epoch": 0.14, "learning_rate": 9.691127267507157e-06, "loss": 1.043, "step": 5998 }, { "epoch": 0.14, "learning_rate": 9.690997299913219e-06, "loss": 0.9018, "step": 5999 }, { "epoch": 0.14, "learning_rate": 9.690867305852993e-06, "loss": 0.8046, "step": 6000 }, { "epoch": 0.14, "learning_rate": 9.690737285327212e-06, "loss": 0.5867, "step": 6001 }, { "epoch": 0.14, "learning_rate": 9.690607238336612e-06, "loss": 1.2334, "step": 6002 }, { "epoch": 0.14, "learning_rate": 9.690477164881923e-06, "loss": 0.8947, "step": 6003 }, { "epoch": 0.14, "learning_rate": 9.690347064963881e-06, "loss": 0.9134, "step": 6004 }, { "epoch": 0.14, "learning_rate": 9.69021693858322e-06, "loss": 0.832, "step": 6005 }, { "epoch": 0.14, "learning_rate": 9.690086785740675e-06, "loss": 1.3276, "step": 6006 }, { "epoch": 0.14, "learning_rate": 9.689956606436979e-06, "loss": 1.1703, "step": 6007 }, { "epoch": 0.14, "learning_rate": 9.689826400672869e-06, "loss": 1.2914, "step": 6008 }, { "epoch": 0.14, "learning_rate": 9.689696168449073e-06, "loss": 0.8911, "step": 6009 }, { "epoch": 0.14, "learning_rate": 9.689565909766334e-06, "loss": 0.8188, "step": 6010 }, { "epoch": 0.14, "learning_rate": 9.68943562462538e-06, "loss": 1.0853, "step": 6011 }, { "epoch": 0.14, "learning_rate": 9.689305313026952e-06, "loss": 1.177, "step": 6012 }, { "epoch": 0.14, "learning_rate": 9.689174974971783e-06, "loss": 1.0333, "step": 6013 }, { "epoch": 0.14, "learning_rate": 9.689044610460604e-06, "loss": 0.8971, "step": 6014 }, { "epoch": 0.14, "learning_rate": 9.688914219494156e-06, "loss": 1.251, "step": 6015 }, { "epoch": 0.14, "learning_rate": 9.688783802073173e-06, "loss": 0.9951, "step": 6016 }, { "epoch": 0.14, "learning_rate": 9.688653358198393e-06, "loss": 1.0686, "step": 6017 }, { "epoch": 0.14, "learning_rate": 9.688522887870546e-06, "loss": 0.929, "step": 6018 }, { "epoch": 0.14, "learning_rate": 9.688392391090374e-06, "loss": 0.8997, "step": 6019 }, { "epoch": 0.14, "learning_rate": 9.688261867858611e-06, "loss": 1.1198, "step": 6020 }, { "epoch": 0.14, "learning_rate": 9.688131318175993e-06, "loss": 1.2113, "step": 6021 }, { "epoch": 0.14, "learning_rate": 9.688000742043255e-06, "loss": 1.1132, "step": 6022 }, { "epoch": 0.14, "learning_rate": 9.68787013946114e-06, "loss": 1.0092, "step": 6023 }, { "epoch": 0.14, "learning_rate": 9.687739510430376e-06, "loss": 0.7064, "step": 6024 }, { "epoch": 0.14, "learning_rate": 9.687608854951706e-06, "loss": 1.1433, "step": 6025 }, { "epoch": 0.14, "learning_rate": 9.687478173025868e-06, "loss": 1.0862, "step": 6026 }, { "epoch": 0.14, "learning_rate": 9.687347464653594e-06, "loss": 1.1746, "step": 6027 }, { "epoch": 0.14, "learning_rate": 9.687216729835627e-06, "loss": 1.2147, "step": 6028 }, { "epoch": 0.14, "learning_rate": 9.6870859685727e-06, "loss": 1.0373, "step": 6029 }, { "epoch": 0.14, "learning_rate": 9.686955180865554e-06, "loss": 1.1652, "step": 6030 }, { "epoch": 0.14, "learning_rate": 9.686824366714926e-06, "loss": 0.9271, "step": 6031 }, { "epoch": 0.14, "learning_rate": 9.686693526121553e-06, "loss": 1.1114, "step": 6032 }, { "epoch": 0.14, "learning_rate": 9.686562659086174e-06, "loss": 0.9665, "step": 6033 }, { "epoch": 0.14, "learning_rate": 9.686431765609526e-06, "loss": 1.2254, "step": 6034 }, { "epoch": 0.14, "learning_rate": 9.68630084569235e-06, "loss": 0.8496, "step": 6035 }, { "epoch": 0.14, "learning_rate": 9.686169899335384e-06, "loss": 1.2898, "step": 6036 }, { "epoch": 0.14, "learning_rate": 9.686038926539365e-06, "loss": 1.0931, "step": 6037 }, { "epoch": 0.14, "learning_rate": 9.685907927305034e-06, "loss": 1.1044, "step": 6038 }, { "epoch": 0.14, "learning_rate": 9.685776901633129e-06, "loss": 1.0904, "step": 6039 }, { "epoch": 0.14, "learning_rate": 9.685645849524389e-06, "loss": 1.0017, "step": 6040 }, { "epoch": 0.14, "learning_rate": 9.685514770979554e-06, "loss": 0.8198, "step": 6041 }, { "epoch": 0.14, "learning_rate": 9.685383665999364e-06, "loss": 1.013, "step": 6042 }, { "epoch": 0.14, "learning_rate": 9.685252534584557e-06, "loss": 0.8657, "step": 6043 }, { "epoch": 0.14, "learning_rate": 9.685121376735875e-06, "loss": 1.2534, "step": 6044 }, { "epoch": 0.14, "learning_rate": 9.684990192454055e-06, "loss": 1.2152, "step": 6045 }, { "epoch": 0.14, "learning_rate": 9.68485898173984e-06, "loss": 1.0832, "step": 6046 }, { "epoch": 0.14, "learning_rate": 9.68472774459397e-06, "loss": 1.1684, "step": 6047 }, { "epoch": 0.14, "learning_rate": 9.684596481017184e-06, "loss": 1.1205, "step": 6048 }, { "epoch": 0.14, "learning_rate": 9.684465191010224e-06, "loss": 0.8824, "step": 6049 }, { "epoch": 0.14, "learning_rate": 9.68433387457383e-06, "loss": 0.9813, "step": 6050 }, { "epoch": 0.14, "learning_rate": 9.684202531708742e-06, "loss": 0.9783, "step": 6051 }, { "epoch": 0.14, "learning_rate": 9.684071162415703e-06, "loss": 1.0518, "step": 6052 }, { "epoch": 0.14, "learning_rate": 9.683939766695452e-06, "loss": 1.0867, "step": 6053 }, { "epoch": 0.14, "learning_rate": 9.683808344548733e-06, "loss": 0.8052, "step": 6054 }, { "epoch": 0.14, "learning_rate": 9.683676895976284e-06, "loss": 1.2877, "step": 6055 }, { "epoch": 0.14, "learning_rate": 9.68354542097885e-06, "loss": 0.9414, "step": 6056 }, { "epoch": 0.14, "learning_rate": 9.68341391955717e-06, "loss": 0.851, "step": 6057 }, { "epoch": 0.14, "learning_rate": 9.683282391711989e-06, "loss": 0.9007, "step": 6058 }, { "epoch": 0.14, "learning_rate": 9.683150837444047e-06, "loss": 0.8676, "step": 6059 }, { "epoch": 0.14, "learning_rate": 9.683019256754084e-06, "loss": 1.0908, "step": 6060 }, { "epoch": 0.14, "learning_rate": 9.682887649642847e-06, "loss": 0.8372, "step": 6061 }, { "epoch": 0.14, "learning_rate": 9.682756016111076e-06, "loss": 1.1569, "step": 6062 }, { "epoch": 0.14, "learning_rate": 9.682624356159516e-06, "loss": 0.957, "step": 6063 }, { "epoch": 0.14, "learning_rate": 9.682492669788905e-06, "loss": 1.0806, "step": 6064 }, { "epoch": 0.14, "learning_rate": 9.68236095699999e-06, "loss": 1.174, "step": 6065 }, { "epoch": 0.14, "learning_rate": 9.682229217793512e-06, "loss": 0.9788, "step": 6066 }, { "epoch": 0.14, "learning_rate": 9.682097452170218e-06, "loss": 1.1524, "step": 6067 }, { "epoch": 0.14, "learning_rate": 9.681965660130846e-06, "loss": 1.131, "step": 6068 }, { "epoch": 0.14, "learning_rate": 9.681833841676143e-06, "loss": 0.9243, "step": 6069 }, { "epoch": 0.14, "learning_rate": 9.681701996806851e-06, "loss": 0.867, "step": 6070 }, { "epoch": 0.14, "learning_rate": 9.681570125523717e-06, "loss": 1.0903, "step": 6071 }, { "epoch": 0.14, "learning_rate": 9.681438227827483e-06, "loss": 1.3573, "step": 6072 }, { "epoch": 0.14, "learning_rate": 9.68130630371889e-06, "loss": 0.9066, "step": 6073 }, { "epoch": 0.14, "learning_rate": 9.681174353198687e-06, "loss": 0.8584, "step": 6074 }, { "epoch": 0.14, "learning_rate": 9.681042376267616e-06, "loss": 1.3224, "step": 6075 }, { "epoch": 0.14, "learning_rate": 9.680910372926423e-06, "loss": 0.9768, "step": 6076 }, { "epoch": 0.14, "learning_rate": 9.680778343175851e-06, "loss": 0.7489, "step": 6077 }, { "epoch": 0.14, "learning_rate": 9.68064628701665e-06, "loss": 0.9711, "step": 6078 }, { "epoch": 0.14, "learning_rate": 9.680514204449555e-06, "loss": 1.2832, "step": 6079 }, { "epoch": 0.14, "learning_rate": 9.68038209547532e-06, "loss": 0.774, "step": 6080 }, { "epoch": 0.14, "learning_rate": 9.680249960094688e-06, "loss": 1.2139, "step": 6081 }, { "epoch": 0.14, "learning_rate": 9.680117798308404e-06, "loss": 0.945, "step": 6082 }, { "epoch": 0.14, "learning_rate": 9.679985610117215e-06, "loss": 0.9331, "step": 6083 }, { "epoch": 0.14, "learning_rate": 9.679853395521864e-06, "loss": 1.0318, "step": 6084 }, { "epoch": 0.14, "learning_rate": 9.679721154523098e-06, "loss": 0.9925, "step": 6085 }, { "epoch": 0.14, "learning_rate": 9.679588887121663e-06, "loss": 1.1612, "step": 6086 }, { "epoch": 0.14, "learning_rate": 9.679456593318306e-06, "loss": 1.291, "step": 6087 }, { "epoch": 0.14, "learning_rate": 9.679324273113774e-06, "loss": 1.0522, "step": 6088 }, { "epoch": 0.14, "learning_rate": 9.679191926508815e-06, "loss": 0.9906, "step": 6089 }, { "epoch": 0.14, "learning_rate": 9.67905955350417e-06, "loss": 0.9726, "step": 6090 }, { "epoch": 0.14, "learning_rate": 9.678927154100591e-06, "loss": 0.9821, "step": 6091 }, { "epoch": 0.14, "learning_rate": 9.678794728298823e-06, "loss": 0.8118, "step": 6092 }, { "epoch": 0.14, "learning_rate": 9.678662276099614e-06, "loss": 0.8781, "step": 6093 }, { "epoch": 0.14, "learning_rate": 9.678529797503709e-06, "loss": 0.9261, "step": 6094 }, { "epoch": 0.14, "learning_rate": 9.678397292511858e-06, "loss": 1.0775, "step": 6095 }, { "epoch": 0.14, "learning_rate": 9.678264761124807e-06, "loss": 1.0678, "step": 6096 }, { "epoch": 0.14, "learning_rate": 9.678132203343304e-06, "loss": 1.1496, "step": 6097 }, { "epoch": 0.14, "learning_rate": 9.6779996191681e-06, "loss": 1.1704, "step": 6098 }, { "epoch": 0.14, "learning_rate": 9.677867008599938e-06, "loss": 1.1971, "step": 6099 }, { "epoch": 0.14, "learning_rate": 9.677734371639568e-06, "loss": 0.9095, "step": 6100 }, { "epoch": 0.14, "learning_rate": 9.677601708287742e-06, "loss": 1.0516, "step": 6101 }, { "epoch": 0.14, "learning_rate": 9.677469018545202e-06, "loss": 0.8702, "step": 6102 }, { "epoch": 0.14, "learning_rate": 9.677336302412704e-06, "loss": 1.1102, "step": 6103 }, { "epoch": 0.14, "learning_rate": 9.677203559890988e-06, "loss": 0.9207, "step": 6104 }, { "epoch": 0.14, "learning_rate": 9.67707079098081e-06, "loss": 1.2577, "step": 6105 }, { "epoch": 0.14, "learning_rate": 9.676937995682916e-06, "loss": 0.8236, "step": 6106 }, { "epoch": 0.14, "learning_rate": 9.676805173998058e-06, "loss": 1.0298, "step": 6107 }, { "epoch": 0.14, "learning_rate": 9.67667232592698e-06, "loss": 1.0084, "step": 6108 }, { "epoch": 0.14, "learning_rate": 9.676539451470438e-06, "loss": 1.0312, "step": 6109 }, { "epoch": 0.14, "learning_rate": 9.676406550629177e-06, "loss": 1.0294, "step": 6110 }, { "epoch": 0.14, "learning_rate": 9.676273623403949e-06, "loss": 1.1013, "step": 6111 }, { "epoch": 0.14, "learning_rate": 9.676140669795502e-06, "loss": 0.9775, "step": 6112 }, { "epoch": 0.14, "learning_rate": 9.67600768980459e-06, "loss": 1.4166, "step": 6113 }, { "epoch": 0.14, "learning_rate": 9.675874683431958e-06, "loss": 0.9184, "step": 6114 }, { "epoch": 0.14, "learning_rate": 9.67574165067836e-06, "loss": 0.8818, "step": 6115 }, { "epoch": 0.14, "learning_rate": 9.675608591544545e-06, "loss": 1.1469, "step": 6116 }, { "epoch": 0.14, "learning_rate": 9.675475506031266e-06, "loss": 0.9228, "step": 6117 }, { "epoch": 0.14, "learning_rate": 9.67534239413927e-06, "loss": 0.8339, "step": 6118 }, { "epoch": 0.14, "learning_rate": 9.675209255869312e-06, "loss": 1.1997, "step": 6119 }, { "epoch": 0.14, "learning_rate": 9.675076091222141e-06, "loss": 1.0899, "step": 6120 }, { "epoch": 0.14, "learning_rate": 9.674942900198508e-06, "loss": 1.1261, "step": 6121 }, { "epoch": 0.14, "learning_rate": 9.674809682799167e-06, "loss": 1.1254, "step": 6122 }, { "epoch": 0.14, "learning_rate": 9.674676439024866e-06, "loss": 0.9586, "step": 6123 }, { "epoch": 0.14, "learning_rate": 9.674543168876358e-06, "loss": 0.8901, "step": 6124 }, { "epoch": 0.14, "learning_rate": 9.674409872354397e-06, "loss": 0.786, "step": 6125 }, { "epoch": 0.14, "learning_rate": 9.674276549459732e-06, "loss": 1.1259, "step": 6126 }, { "epoch": 0.14, "learning_rate": 9.674143200193119e-06, "loss": 0.8808, "step": 6127 }, { "epoch": 0.14, "learning_rate": 9.674009824555306e-06, "loss": 1.1795, "step": 6128 }, { "epoch": 0.14, "learning_rate": 9.673876422547048e-06, "loss": 0.8979, "step": 6129 }, { "epoch": 0.14, "learning_rate": 9.673742994169096e-06, "loss": 0.9638, "step": 6130 }, { "epoch": 0.14, "learning_rate": 9.673609539422207e-06, "loss": 1.1244, "step": 6131 }, { "epoch": 0.14, "learning_rate": 9.673476058307128e-06, "loss": 1.1669, "step": 6132 }, { "epoch": 0.14, "learning_rate": 9.673342550824615e-06, "loss": 1.1782, "step": 6133 }, { "epoch": 0.14, "learning_rate": 9.673209016975422e-06, "loss": 0.6707, "step": 6134 }, { "epoch": 0.14, "learning_rate": 9.673075456760302e-06, "loss": 0.8669, "step": 6135 }, { "epoch": 0.14, "learning_rate": 9.672941870180009e-06, "loss": 1.0594, "step": 6136 }, { "epoch": 0.14, "learning_rate": 9.672808257235294e-06, "loss": 0.981, "step": 6137 }, { "epoch": 0.14, "learning_rate": 9.672674617926912e-06, "loss": 0.9843, "step": 6138 }, { "epoch": 0.14, "learning_rate": 9.67254095225562e-06, "loss": 1.0467, "step": 6139 }, { "epoch": 0.14, "learning_rate": 9.672407260222169e-06, "loss": 1.0127, "step": 6140 }, { "epoch": 0.14, "learning_rate": 9.672273541827313e-06, "loss": 0.8967, "step": 6141 }, { "epoch": 0.14, "learning_rate": 9.672139797071808e-06, "loss": 0.8728, "step": 6142 }, { "epoch": 0.14, "learning_rate": 9.672006025956408e-06, "loss": 1.3278, "step": 6143 }, { "epoch": 0.14, "learning_rate": 9.671872228481869e-06, "loss": 0.9393, "step": 6144 }, { "epoch": 0.14, "learning_rate": 9.671738404648943e-06, "loss": 0.9199, "step": 6145 }, { "epoch": 0.14, "learning_rate": 9.671604554458389e-06, "loss": 1.1916, "step": 6146 }, { "epoch": 0.14, "learning_rate": 9.671470677910958e-06, "loss": 1.1643, "step": 6147 }, { "epoch": 0.14, "learning_rate": 9.671336775007407e-06, "loss": 0.9577, "step": 6148 }, { "epoch": 0.14, "learning_rate": 9.671202845748493e-06, "loss": 0.9871, "step": 6149 }, { "epoch": 0.14, "learning_rate": 9.67106889013497e-06, "loss": 1.0499, "step": 6150 }, { "epoch": 0.14, "learning_rate": 9.670934908167593e-06, "loss": 0.626, "step": 6151 }, { "epoch": 0.14, "learning_rate": 9.670800899847119e-06, "loss": 1.0599, "step": 6152 }, { "epoch": 0.14, "learning_rate": 9.670666865174303e-06, "loss": 1.1593, "step": 6153 }, { "epoch": 0.14, "learning_rate": 9.670532804149906e-06, "loss": 1.2425, "step": 6154 }, { "epoch": 0.14, "learning_rate": 9.670398716774677e-06, "loss": 0.9553, "step": 6155 }, { "epoch": 0.14, "learning_rate": 9.670264603049377e-06, "loss": 1.1006, "step": 6156 }, { "epoch": 0.14, "learning_rate": 9.670130462974763e-06, "loss": 1.087, "step": 6157 }, { "epoch": 0.14, "learning_rate": 9.66999629655159e-06, "loss": 0.8083, "step": 6158 }, { "epoch": 0.14, "learning_rate": 9.669862103780616e-06, "loss": 1.3918, "step": 6159 }, { "epoch": 0.14, "learning_rate": 9.669727884662596e-06, "loss": 1.1577, "step": 6160 }, { "epoch": 0.14, "learning_rate": 9.66959363919829e-06, "loss": 1.2271, "step": 6161 }, { "epoch": 0.14, "learning_rate": 9.669459367388454e-06, "loss": 1.1317, "step": 6162 }, { "epoch": 0.14, "learning_rate": 9.669325069233846e-06, "loss": 1.0626, "step": 6163 }, { "epoch": 0.14, "learning_rate": 9.669190744735225e-06, "loss": 0.85, "step": 6164 }, { "epoch": 0.14, "learning_rate": 9.669056393893346e-06, "loss": 1.1539, "step": 6165 }, { "epoch": 0.14, "learning_rate": 9.668922016708968e-06, "loss": 1.0277, "step": 6166 }, { "epoch": 0.14, "learning_rate": 9.66878761318285e-06, "loss": 0.7831, "step": 6167 }, { "epoch": 0.14, "learning_rate": 9.66865318331575e-06, "loss": 0.8769, "step": 6168 }, { "epoch": 0.14, "learning_rate": 9.668518727108427e-06, "loss": 0.9236, "step": 6169 }, { "epoch": 0.14, "learning_rate": 9.668384244561638e-06, "loss": 1.1737, "step": 6170 }, { "epoch": 0.14, "learning_rate": 9.668249735676142e-06, "loss": 1.095, "step": 6171 }, { "epoch": 0.14, "learning_rate": 9.668115200452701e-06, "loss": 0.9196, "step": 6172 }, { "epoch": 0.14, "learning_rate": 9.66798063889207e-06, "loss": 0.9511, "step": 6173 }, { "epoch": 0.14, "learning_rate": 9.667846050995009e-06, "loss": 1.1747, "step": 6174 }, { "epoch": 0.14, "learning_rate": 9.667711436762279e-06, "loss": 0.981, "step": 6175 }, { "epoch": 0.14, "learning_rate": 9.667576796194638e-06, "loss": 1.059, "step": 6176 }, { "epoch": 0.14, "learning_rate": 9.667442129292845e-06, "loss": 1.0261, "step": 6177 }, { "epoch": 0.14, "learning_rate": 9.667307436057664e-06, "loss": 0.9938, "step": 6178 }, { "epoch": 0.14, "learning_rate": 9.66717271648985e-06, "loss": 1.143, "step": 6179 }, { "epoch": 0.14, "learning_rate": 9.667037970590165e-06, "loss": 1.1425, "step": 6180 }, { "epoch": 0.14, "learning_rate": 9.66690319835937e-06, "loss": 1.1616, "step": 6181 }, { "epoch": 0.14, "learning_rate": 9.666768399798226e-06, "loss": 0.879, "step": 6182 }, { "epoch": 0.14, "learning_rate": 9.666633574907489e-06, "loss": 1.1385, "step": 6183 }, { "epoch": 0.14, "learning_rate": 9.666498723687926e-06, "loss": 1.398, "step": 6184 }, { "epoch": 0.14, "learning_rate": 9.666363846140291e-06, "loss": 1.0612, "step": 6185 }, { "epoch": 0.14, "learning_rate": 9.66622894226535e-06, "loss": 0.7974, "step": 6186 }, { "epoch": 0.14, "learning_rate": 9.666094012063864e-06, "loss": 1.1395, "step": 6187 }, { "epoch": 0.14, "learning_rate": 9.66595905553659e-06, "loss": 1.3169, "step": 6188 }, { "epoch": 0.14, "learning_rate": 9.665824072684296e-06, "loss": 0.9688, "step": 6189 }, { "epoch": 0.14, "learning_rate": 9.665689063507738e-06, "loss": 1.0793, "step": 6190 }, { "epoch": 0.14, "learning_rate": 9.66555402800768e-06, "loss": 0.9051, "step": 6191 }, { "epoch": 0.14, "learning_rate": 9.665418966184884e-06, "loss": 0.9314, "step": 6192 }, { "epoch": 0.14, "learning_rate": 9.66528387804011e-06, "loss": 0.8149, "step": 6193 }, { "epoch": 0.14, "learning_rate": 9.665148763574123e-06, "loss": 0.8788, "step": 6194 }, { "epoch": 0.14, "learning_rate": 9.665013622787685e-06, "loss": 1.1646, "step": 6195 }, { "epoch": 0.14, "learning_rate": 9.664878455681556e-06, "loss": 0.9886, "step": 6196 }, { "epoch": 0.14, "learning_rate": 9.6647432622565e-06, "loss": 0.8842, "step": 6197 }, { "epoch": 0.14, "learning_rate": 9.66460804251328e-06, "loss": 0.866, "step": 6198 }, { "epoch": 0.14, "learning_rate": 9.66447279645266e-06, "loss": 1.1046, "step": 6199 }, { "epoch": 0.14, "learning_rate": 9.6643375240754e-06, "loss": 0.7813, "step": 6200 }, { "epoch": 0.14, "learning_rate": 9.664202225382266e-06, "loss": 0.88, "step": 6201 }, { "epoch": 0.14, "learning_rate": 9.66406690037402e-06, "loss": 0.81, "step": 6202 }, { "epoch": 0.14, "learning_rate": 9.663931549051426e-06, "loss": 1.2131, "step": 6203 }, { "epoch": 0.14, "learning_rate": 9.663796171415246e-06, "loss": 1.0639, "step": 6204 }, { "epoch": 0.14, "learning_rate": 9.663660767466246e-06, "loss": 1.1297, "step": 6205 }, { "epoch": 0.14, "learning_rate": 9.66352533720519e-06, "loss": 1.3202, "step": 6206 }, { "epoch": 0.14, "learning_rate": 9.663389880632841e-06, "loss": 0.8757, "step": 6207 }, { "epoch": 0.14, "learning_rate": 9.663254397749964e-06, "loss": 1.1838, "step": 6208 }, { "epoch": 0.14, "learning_rate": 9.663118888557321e-06, "loss": 0.8782, "step": 6209 }, { "epoch": 0.14, "learning_rate": 9.66298335305568e-06, "loss": 0.9656, "step": 6210 }, { "epoch": 0.14, "learning_rate": 9.662847791245804e-06, "loss": 0.9369, "step": 6211 }, { "epoch": 0.14, "learning_rate": 9.662712203128458e-06, "loss": 1.0358, "step": 6212 }, { "epoch": 0.14, "learning_rate": 9.662576588704406e-06, "loss": 0.8826, "step": 6213 }, { "epoch": 0.14, "learning_rate": 9.662440947974414e-06, "loss": 1.0568, "step": 6214 }, { "epoch": 0.14, "learning_rate": 9.662305280939249e-06, "loss": 1.0154, "step": 6215 }, { "epoch": 0.14, "learning_rate": 9.662169587599672e-06, "loss": 0.9012, "step": 6216 }, { "epoch": 0.14, "learning_rate": 9.662033867956454e-06, "loss": 1.1705, "step": 6217 }, { "epoch": 0.14, "learning_rate": 9.661898122010355e-06, "loss": 1.2837, "step": 6218 }, { "epoch": 0.14, "learning_rate": 9.661762349762148e-06, "loss": 0.7937, "step": 6219 }, { "epoch": 0.14, "learning_rate": 9.661626551212591e-06, "loss": 1.1305, "step": 6220 }, { "epoch": 0.14, "learning_rate": 9.661490726362457e-06, "loss": 1.1043, "step": 6221 }, { "epoch": 0.14, "learning_rate": 9.661354875212508e-06, "loss": 1.2819, "step": 6222 }, { "epoch": 0.14, "learning_rate": 9.661218997763513e-06, "loss": 0.9591, "step": 6223 }, { "epoch": 0.14, "learning_rate": 9.661083094016236e-06, "loss": 1.0392, "step": 6224 }, { "epoch": 0.14, "learning_rate": 9.660947163971446e-06, "loss": 1.1813, "step": 6225 }, { "epoch": 0.14, "learning_rate": 9.66081120762991e-06, "loss": 0.6873, "step": 6226 }, { "epoch": 0.14, "learning_rate": 9.660675224992392e-06, "loss": 1.1356, "step": 6227 }, { "epoch": 0.14, "learning_rate": 9.660539216059662e-06, "loss": 1.0817, "step": 6228 }, { "epoch": 0.14, "learning_rate": 9.660403180832488e-06, "loss": 1.0957, "step": 6229 }, { "epoch": 0.14, "learning_rate": 9.660267119311636e-06, "loss": 1.1082, "step": 6230 }, { "epoch": 0.14, "learning_rate": 9.660131031497873e-06, "loss": 0.8941, "step": 6231 }, { "epoch": 0.14, "learning_rate": 9.659994917391969e-06, "loss": 0.9349, "step": 6232 }, { "epoch": 0.14, "learning_rate": 9.659858776994689e-06, "loss": 1.3677, "step": 6233 }, { "epoch": 0.14, "learning_rate": 9.659722610306803e-06, "loss": 1.1328, "step": 6234 }, { "epoch": 0.14, "learning_rate": 9.659586417329079e-06, "loss": 1.0146, "step": 6235 }, { "epoch": 0.14, "learning_rate": 9.659450198062286e-06, "loss": 0.9784, "step": 6236 }, { "epoch": 0.14, "learning_rate": 9.659313952507192e-06, "loss": 1.0496, "step": 6237 }, { "epoch": 0.14, "learning_rate": 9.659177680664566e-06, "loss": 1.1672, "step": 6238 }, { "epoch": 0.14, "learning_rate": 9.659041382535175e-06, "loss": 1.3217, "step": 6239 }, { "epoch": 0.14, "learning_rate": 9.658905058119791e-06, "loss": 0.8856, "step": 6240 }, { "epoch": 0.14, "learning_rate": 9.65876870741918e-06, "loss": 1.1358, "step": 6241 }, { "epoch": 0.14, "learning_rate": 9.658632330434114e-06, "loss": 0.9634, "step": 6242 }, { "epoch": 0.14, "learning_rate": 9.658495927165361e-06, "loss": 1.1084, "step": 6243 }, { "epoch": 0.14, "learning_rate": 9.658359497613691e-06, "loss": 1.2657, "step": 6244 }, { "epoch": 0.14, "learning_rate": 9.658223041779874e-06, "loss": 1.1723, "step": 6245 }, { "epoch": 0.14, "learning_rate": 9.658086559664679e-06, "loss": 0.9994, "step": 6246 }, { "epoch": 0.14, "learning_rate": 9.657950051268876e-06, "loss": 0.7346, "step": 6247 }, { "epoch": 0.14, "learning_rate": 9.657813516593234e-06, "loss": 1.1868, "step": 6248 }, { "epoch": 0.14, "learning_rate": 9.65767695563853e-06, "loss": 1.0609, "step": 6249 }, { "epoch": 0.14, "learning_rate": 9.657540368405525e-06, "loss": 0.8772, "step": 6250 }, { "epoch": 0.14, "learning_rate": 9.657403754894997e-06, "loss": 1.1941, "step": 6251 }, { "epoch": 0.14, "learning_rate": 9.657267115107711e-06, "loss": 0.8999, "step": 6252 }, { "epoch": 0.15, "learning_rate": 9.657130449044442e-06, "loss": 1.0624, "step": 6253 }, { "epoch": 0.15, "learning_rate": 9.656993756705959e-06, "loss": 1.1274, "step": 6254 }, { "epoch": 0.15, "learning_rate": 9.656857038093035e-06, "loss": 1.3732, "step": 6255 }, { "epoch": 0.15, "learning_rate": 9.656720293206441e-06, "loss": 0.8185, "step": 6256 }, { "epoch": 0.15, "learning_rate": 9.656583522046946e-06, "loss": 0.8649, "step": 6257 }, { "epoch": 0.15, "learning_rate": 9.656446724615325e-06, "loss": 1.1118, "step": 6258 }, { "epoch": 0.15, "learning_rate": 9.656309900912348e-06, "loss": 0.8602, "step": 6259 }, { "epoch": 0.15, "learning_rate": 9.656173050938786e-06, "loss": 1.1143, "step": 6260 }, { "epoch": 0.15, "learning_rate": 9.656036174695413e-06, "loss": 1.3609, "step": 6261 }, { "epoch": 0.15, "learning_rate": 9.655899272183003e-06, "loss": 1.0822, "step": 6262 }, { "epoch": 0.15, "learning_rate": 9.655762343402323e-06, "loss": 1.303, "step": 6263 }, { "epoch": 0.15, "learning_rate": 9.65562538835415e-06, "loss": 1.0289, "step": 6264 }, { "epoch": 0.15, "learning_rate": 9.655488407039255e-06, "loss": 1.3135, "step": 6265 }, { "epoch": 0.15, "learning_rate": 9.65535139945841e-06, "loss": 1.0444, "step": 6266 }, { "epoch": 0.15, "learning_rate": 9.65521436561239e-06, "loss": 1.1523, "step": 6267 }, { "epoch": 0.15, "learning_rate": 9.655077305501967e-06, "loss": 0.9535, "step": 6268 }, { "epoch": 0.15, "learning_rate": 9.654940219127916e-06, "loss": 1.1609, "step": 6269 }, { "epoch": 0.15, "learning_rate": 9.654803106491006e-06, "loss": 1.2271, "step": 6270 }, { "epoch": 0.15, "learning_rate": 9.654665967592016e-06, "loss": 0.8981, "step": 6271 }, { "epoch": 0.15, "learning_rate": 9.654528802431715e-06, "loss": 0.854, "step": 6272 }, { "epoch": 0.15, "learning_rate": 9.65439161101088e-06, "loss": 0.9165, "step": 6273 }, { "epoch": 0.15, "learning_rate": 9.654254393330285e-06, "loss": 0.9178, "step": 6274 }, { "epoch": 0.15, "learning_rate": 9.654117149390702e-06, "loss": 1.1864, "step": 6275 }, { "epoch": 0.15, "learning_rate": 9.653979879192908e-06, "loss": 0.9855, "step": 6276 }, { "epoch": 0.15, "learning_rate": 9.653842582737675e-06, "loss": 1.2466, "step": 6277 }, { "epoch": 0.15, "learning_rate": 9.653705260025782e-06, "loss": 1.1968, "step": 6278 }, { "epoch": 0.15, "learning_rate": 9.653567911057996e-06, "loss": 1.0045, "step": 6279 }, { "epoch": 0.15, "learning_rate": 9.653430535835098e-06, "loss": 1.243, "step": 6280 }, { "epoch": 0.15, "learning_rate": 9.653293134357862e-06, "loss": 1.2044, "step": 6281 }, { "epoch": 0.15, "learning_rate": 9.653155706627061e-06, "loss": 1.2626, "step": 6282 }, { "epoch": 0.15, "learning_rate": 9.653018252643473e-06, "loss": 0.8658, "step": 6283 }, { "epoch": 0.15, "learning_rate": 9.652880772407873e-06, "loss": 0.8667, "step": 6284 }, { "epoch": 0.15, "learning_rate": 9.652743265921036e-06, "loss": 1.132, "step": 6285 }, { "epoch": 0.15, "learning_rate": 9.652605733183737e-06, "loss": 1.0577, "step": 6286 }, { "epoch": 0.15, "learning_rate": 9.652468174196754e-06, "loss": 0.8038, "step": 6287 }, { "epoch": 0.15, "learning_rate": 9.652330588960863e-06, "loss": 1.1277, "step": 6288 }, { "epoch": 0.15, "learning_rate": 9.652192977476838e-06, "loss": 0.8441, "step": 6289 }, { "epoch": 0.15, "learning_rate": 9.652055339745456e-06, "loss": 0.9317, "step": 6290 }, { "epoch": 0.15, "learning_rate": 9.651917675767495e-06, "loss": 1.029, "step": 6291 }, { "epoch": 0.15, "learning_rate": 9.65177998554373e-06, "loss": 1.0562, "step": 6292 }, { "epoch": 0.15, "learning_rate": 9.65164226907494e-06, "loss": 0.9622, "step": 6293 }, { "epoch": 0.15, "learning_rate": 9.651504526361901e-06, "loss": 0.9606, "step": 6294 }, { "epoch": 0.15, "learning_rate": 9.651366757405388e-06, "loss": 0.8746, "step": 6295 }, { "epoch": 0.15, "learning_rate": 9.651228962206182e-06, "loss": 0.8656, "step": 6296 }, { "epoch": 0.15, "learning_rate": 9.651091140765058e-06, "loss": 1.3106, "step": 6297 }, { "epoch": 0.15, "learning_rate": 9.650953293082793e-06, "loss": 1.0303, "step": 6298 }, { "epoch": 0.15, "learning_rate": 9.650815419160166e-06, "loss": 1.2193, "step": 6299 }, { "epoch": 0.15, "learning_rate": 9.650677518997957e-06, "loss": 0.9798, "step": 6300 }, { "epoch": 0.15, "learning_rate": 9.65053959259694e-06, "loss": 1.1698, "step": 6301 }, { "epoch": 0.15, "learning_rate": 9.650401639957896e-06, "loss": 1.087, "step": 6302 }, { "epoch": 0.15, "learning_rate": 9.6502636610816e-06, "loss": 0.9185, "step": 6303 }, { "epoch": 0.15, "learning_rate": 9.650125655968836e-06, "loss": 1.0102, "step": 6304 }, { "epoch": 0.15, "learning_rate": 9.649987624620378e-06, "loss": 1.5689, "step": 6305 }, { "epoch": 0.15, "learning_rate": 9.649849567037005e-06, "loss": 0.9783, "step": 6306 }, { "epoch": 0.15, "learning_rate": 9.649711483219498e-06, "loss": 0.9817, "step": 6307 }, { "epoch": 0.15, "learning_rate": 9.649573373168635e-06, "loss": 1.0904, "step": 6308 }, { "epoch": 0.15, "learning_rate": 9.649435236885193e-06, "loss": 0.9976, "step": 6309 }, { "epoch": 0.15, "learning_rate": 9.649297074369958e-06, "loss": 1.0774, "step": 6310 }, { "epoch": 0.15, "learning_rate": 9.649158885623703e-06, "loss": 1.0541, "step": 6311 }, { "epoch": 0.15, "learning_rate": 9.64902067064721e-06, "loss": 0.9509, "step": 6312 }, { "epoch": 0.15, "learning_rate": 9.648882429441258e-06, "loss": 1.117, "step": 6313 }, { "epoch": 0.15, "learning_rate": 9.648744162006628e-06, "loss": 1.194, "step": 6314 }, { "epoch": 0.15, "learning_rate": 9.6486058683441e-06, "loss": 1.1169, "step": 6315 }, { "epoch": 0.15, "learning_rate": 9.648467548454452e-06, "loss": 1.137, "step": 6316 }, { "epoch": 0.15, "learning_rate": 9.64832920233847e-06, "loss": 1.372, "step": 6317 }, { "epoch": 0.15, "learning_rate": 9.648190829996927e-06, "loss": 0.7226, "step": 6318 }, { "epoch": 0.15, "learning_rate": 9.64805243143061e-06, "loss": 1.1271, "step": 6319 }, { "epoch": 0.15, "learning_rate": 9.647914006640296e-06, "loss": 0.9632, "step": 6320 }, { "epoch": 0.15, "learning_rate": 9.647775555626769e-06, "loss": 1.1456, "step": 6321 }, { "epoch": 0.15, "learning_rate": 9.647637078390806e-06, "loss": 1.0964, "step": 6322 }, { "epoch": 0.15, "learning_rate": 9.647498574933191e-06, "loss": 0.8442, "step": 6323 }, { "epoch": 0.15, "learning_rate": 9.647360045254706e-06, "loss": 1.0037, "step": 6324 }, { "epoch": 0.15, "learning_rate": 9.647221489356133e-06, "loss": 1.0942, "step": 6325 }, { "epoch": 0.15, "learning_rate": 9.64708290723825e-06, "loss": 1.0856, "step": 6326 }, { "epoch": 0.15, "learning_rate": 9.646944298901843e-06, "loss": 1.2961, "step": 6327 }, { "epoch": 0.15, "learning_rate": 9.646805664347693e-06, "loss": 0.9804, "step": 6328 }, { "epoch": 0.15, "learning_rate": 9.64666700357658e-06, "loss": 0.8775, "step": 6329 }, { "epoch": 0.15, "learning_rate": 9.646528316589289e-06, "loss": 1.0032, "step": 6330 }, { "epoch": 0.15, "learning_rate": 9.6463896033866e-06, "loss": 1.3743, "step": 6331 }, { "epoch": 0.15, "learning_rate": 9.646250863969298e-06, "loss": 1.0305, "step": 6332 }, { "epoch": 0.15, "learning_rate": 9.646112098338164e-06, "loss": 0.9811, "step": 6333 }, { "epoch": 0.15, "learning_rate": 9.645973306493983e-06, "loss": 1.1697, "step": 6334 }, { "epoch": 0.15, "learning_rate": 9.645834488437534e-06, "loss": 1.1421, "step": 6335 }, { "epoch": 0.15, "learning_rate": 9.645695644169604e-06, "loss": 1.0182, "step": 6336 }, { "epoch": 0.15, "learning_rate": 9.645556773690976e-06, "loss": 1.0156, "step": 6337 }, { "epoch": 0.15, "learning_rate": 9.645417877002432e-06, "loss": 1.136, "step": 6338 }, { "epoch": 0.15, "learning_rate": 9.645278954104756e-06, "loss": 0.9952, "step": 6339 }, { "epoch": 0.15, "learning_rate": 9.645140004998732e-06, "loss": 0.875, "step": 6340 }, { "epoch": 0.15, "learning_rate": 9.645001029685147e-06, "loss": 0.8882, "step": 6341 }, { "epoch": 0.15, "learning_rate": 9.644862028164778e-06, "loss": 1.1852, "step": 6342 }, { "epoch": 0.15, "learning_rate": 9.644723000438416e-06, "loss": 1.1208, "step": 6343 }, { "epoch": 0.15, "learning_rate": 9.64458394650684e-06, "loss": 1.1271, "step": 6344 }, { "epoch": 0.15, "learning_rate": 9.64444486637084e-06, "loss": 0.8653, "step": 6345 }, { "epoch": 0.15, "learning_rate": 9.644305760031199e-06, "loss": 0.9249, "step": 6346 }, { "epoch": 0.15, "learning_rate": 9.644166627488697e-06, "loss": 0.9514, "step": 6347 }, { "epoch": 0.15, "learning_rate": 9.644027468744127e-06, "loss": 1.2306, "step": 6348 }, { "epoch": 0.15, "learning_rate": 9.643888283798267e-06, "loss": 0.9605, "step": 6349 }, { "epoch": 0.15, "learning_rate": 9.643749072651904e-06, "loss": 1.2182, "step": 6350 }, { "epoch": 0.15, "learning_rate": 9.643609835305827e-06, "loss": 1.2858, "step": 6351 }, { "epoch": 0.15, "learning_rate": 9.643470571760819e-06, "loss": 1.054, "step": 6352 }, { "epoch": 0.15, "learning_rate": 9.643331282017664e-06, "loss": 0.9176, "step": 6353 }, { "epoch": 0.15, "learning_rate": 9.643191966077153e-06, "loss": 1.0672, "step": 6354 }, { "epoch": 0.15, "learning_rate": 9.643052623940067e-06, "loss": 1.1443, "step": 6355 }, { "epoch": 0.15, "learning_rate": 9.642913255607194e-06, "loss": 1.0367, "step": 6356 }, { "epoch": 0.15, "learning_rate": 9.64277386107932e-06, "loss": 1.2669, "step": 6357 }, { "epoch": 0.15, "learning_rate": 9.642634440357233e-06, "loss": 1.0028, "step": 6358 }, { "epoch": 0.15, "learning_rate": 9.642494993441716e-06, "loss": 0.9609, "step": 6359 }, { "epoch": 0.15, "learning_rate": 9.642355520333559e-06, "loss": 0.8401, "step": 6360 }, { "epoch": 0.15, "learning_rate": 9.642216021033549e-06, "loss": 0.8598, "step": 6361 }, { "epoch": 0.15, "learning_rate": 9.64207649554247e-06, "loss": 1.1295, "step": 6362 }, { "epoch": 0.15, "learning_rate": 9.641936943861112e-06, "loss": 0.9163, "step": 6363 }, { "epoch": 0.15, "learning_rate": 9.641797365990261e-06, "loss": 1.3468, "step": 6364 }, { "epoch": 0.15, "learning_rate": 9.641657761930707e-06, "loss": 1.4789, "step": 6365 }, { "epoch": 0.15, "learning_rate": 9.641518131683233e-06, "loss": 1.0947, "step": 6366 }, { "epoch": 0.15, "learning_rate": 9.641378475248632e-06, "loss": 1.1898, "step": 6367 }, { "epoch": 0.15, "learning_rate": 9.641238792627688e-06, "loss": 1.0945, "step": 6368 }, { "epoch": 0.15, "learning_rate": 9.64109908382119e-06, "loss": 1.0346, "step": 6369 }, { "epoch": 0.15, "learning_rate": 9.640959348829929e-06, "loss": 1.603, "step": 6370 }, { "epoch": 0.15, "learning_rate": 9.640819587654689e-06, "loss": 1.1069, "step": 6371 }, { "epoch": 0.15, "learning_rate": 9.64067980029626e-06, "loss": 1.0126, "step": 6372 }, { "epoch": 0.15, "learning_rate": 9.640539986755432e-06, "loss": 1.0299, "step": 6373 }, { "epoch": 0.15, "learning_rate": 9.640400147032993e-06, "loss": 0.8591, "step": 6374 }, { "epoch": 0.15, "learning_rate": 9.640260281129732e-06, "loss": 1.115, "step": 6375 }, { "epoch": 0.15, "learning_rate": 9.640120389046438e-06, "loss": 1.2025, "step": 6376 }, { "epoch": 0.15, "learning_rate": 9.6399804707839e-06, "loss": 1.0895, "step": 6377 }, { "epoch": 0.15, "learning_rate": 9.639840526342909e-06, "loss": 0.9894, "step": 6378 }, { "epoch": 0.15, "learning_rate": 9.639700555724253e-06, "loss": 1.0497, "step": 6379 }, { "epoch": 0.15, "learning_rate": 9.639560558928723e-06, "loss": 1.0996, "step": 6380 }, { "epoch": 0.15, "learning_rate": 9.639420535957105e-06, "loss": 0.7929, "step": 6381 }, { "epoch": 0.15, "learning_rate": 9.639280486810194e-06, "loss": 0.7978, "step": 6382 }, { "epoch": 0.15, "learning_rate": 9.639140411488777e-06, "loss": 1.1247, "step": 6383 }, { "epoch": 0.15, "learning_rate": 9.639000309993647e-06, "loss": 1.2165, "step": 6384 }, { "epoch": 0.15, "learning_rate": 9.638860182325591e-06, "loss": 1.0273, "step": 6385 }, { "epoch": 0.15, "learning_rate": 9.638720028485402e-06, "loss": 1.0264, "step": 6386 }, { "epoch": 0.15, "learning_rate": 9.638579848473871e-06, "loss": 1.1156, "step": 6387 }, { "epoch": 0.15, "learning_rate": 9.638439642291786e-06, "loss": 0.9954, "step": 6388 }, { "epoch": 0.15, "learning_rate": 9.638299409939941e-06, "loss": 1.1889, "step": 6389 }, { "epoch": 0.15, "learning_rate": 9.638159151419128e-06, "loss": 1.2228, "step": 6390 }, { "epoch": 0.15, "learning_rate": 9.638018866730135e-06, "loss": 1.1783, "step": 6391 }, { "epoch": 0.15, "learning_rate": 9.637878555873755e-06, "loss": 1.046, "step": 6392 }, { "epoch": 0.15, "learning_rate": 9.63773821885078e-06, "loss": 0.9375, "step": 6393 }, { "epoch": 0.15, "learning_rate": 9.637597855662001e-06, "loss": 1.3919, "step": 6394 }, { "epoch": 0.15, "learning_rate": 9.637457466308212e-06, "loss": 0.8192, "step": 6395 }, { "epoch": 0.15, "learning_rate": 9.637317050790201e-06, "loss": 1.0804, "step": 6396 }, { "epoch": 0.15, "learning_rate": 9.637176609108764e-06, "loss": 0.8877, "step": 6397 }, { "epoch": 0.15, "learning_rate": 9.637036141264692e-06, "loss": 0.8431, "step": 6398 }, { "epoch": 0.15, "learning_rate": 9.636895647258777e-06, "loss": 1.2131, "step": 6399 }, { "epoch": 0.15, "learning_rate": 9.636755127091813e-06, "loss": 1.0489, "step": 6400 }, { "epoch": 0.15, "learning_rate": 9.636614580764591e-06, "loss": 0.8189, "step": 6401 }, { "epoch": 0.15, "learning_rate": 9.636474008277904e-06, "loss": 1.0317, "step": 6402 }, { "epoch": 0.15, "learning_rate": 9.636333409632548e-06, "loss": 1.1383, "step": 6403 }, { "epoch": 0.15, "learning_rate": 9.636192784829313e-06, "loss": 1.1379, "step": 6404 }, { "epoch": 0.15, "learning_rate": 9.636052133868995e-06, "loss": 1.0944, "step": 6405 }, { "epoch": 0.15, "learning_rate": 9.635911456752385e-06, "loss": 1.0005, "step": 6406 }, { "epoch": 0.15, "learning_rate": 9.635770753480277e-06, "loss": 0.9742, "step": 6407 }, { "epoch": 0.15, "learning_rate": 9.635630024053469e-06, "loss": 1.1013, "step": 6408 }, { "epoch": 0.15, "learning_rate": 9.635489268472749e-06, "loss": 1.1287, "step": 6409 }, { "epoch": 0.15, "learning_rate": 9.635348486738915e-06, "loss": 1.2622, "step": 6410 }, { "epoch": 0.15, "learning_rate": 9.63520767885276e-06, "loss": 0.8446, "step": 6411 }, { "epoch": 0.15, "learning_rate": 9.635066844815077e-06, "loss": 1.1511, "step": 6412 }, { "epoch": 0.15, "learning_rate": 9.634925984626665e-06, "loss": 1.1625, "step": 6413 }, { "epoch": 0.15, "learning_rate": 9.634785098288313e-06, "loss": 0.9856, "step": 6414 }, { "epoch": 0.15, "learning_rate": 9.63464418580082e-06, "loss": 0.9621, "step": 6415 }, { "epoch": 0.15, "learning_rate": 9.63450324716498e-06, "loss": 0.9699, "step": 6416 }, { "epoch": 0.15, "learning_rate": 9.634362282381589e-06, "loss": 1.0834, "step": 6417 }, { "epoch": 0.15, "learning_rate": 9.63422129145144e-06, "loss": 1.3216, "step": 6418 }, { "epoch": 0.15, "learning_rate": 9.634080274375329e-06, "loss": 0.8923, "step": 6419 }, { "epoch": 0.15, "learning_rate": 9.633939231154052e-06, "loss": 0.9093, "step": 6420 }, { "epoch": 0.15, "learning_rate": 9.633798161788406e-06, "loss": 1.0143, "step": 6421 }, { "epoch": 0.15, "learning_rate": 9.633657066279186e-06, "loss": 0.9296, "step": 6422 }, { "epoch": 0.15, "learning_rate": 9.633515944627189e-06, "loss": 0.8256, "step": 6423 }, { "epoch": 0.15, "learning_rate": 9.633374796833208e-06, "loss": 1.1242, "step": 6424 }, { "epoch": 0.15, "learning_rate": 9.633233622898044e-06, "loss": 0.8267, "step": 6425 }, { "epoch": 0.15, "learning_rate": 9.63309242282249e-06, "loss": 0.9544, "step": 6426 }, { "epoch": 0.15, "learning_rate": 9.632951196607343e-06, "loss": 1.0243, "step": 6427 }, { "epoch": 0.15, "learning_rate": 9.6328099442534e-06, "loss": 1.0354, "step": 6428 }, { "epoch": 0.15, "learning_rate": 9.63266866576146e-06, "loss": 1.0966, "step": 6429 }, { "epoch": 0.15, "learning_rate": 9.632527361132318e-06, "loss": 0.7584, "step": 6430 }, { "epoch": 0.15, "learning_rate": 9.632386030366771e-06, "loss": 0.9413, "step": 6431 }, { "epoch": 0.15, "learning_rate": 9.632244673465618e-06, "loss": 1.1093, "step": 6432 }, { "epoch": 0.15, "learning_rate": 9.632103290429654e-06, "loss": 0.8762, "step": 6433 }, { "epoch": 0.15, "learning_rate": 9.631961881259682e-06, "loss": 1.0129, "step": 6434 }, { "epoch": 0.15, "learning_rate": 9.631820445956492e-06, "loss": 1.1902, "step": 6435 }, { "epoch": 0.15, "learning_rate": 9.631678984520888e-06, "loss": 0.9136, "step": 6436 }, { "epoch": 0.15, "learning_rate": 9.631537496953666e-06, "loss": 1.1147, "step": 6437 }, { "epoch": 0.15, "learning_rate": 9.631395983255625e-06, "loss": 1.1043, "step": 6438 }, { "epoch": 0.15, "learning_rate": 9.631254443427563e-06, "loss": 1.1124, "step": 6439 }, { "epoch": 0.15, "learning_rate": 9.63111287747028e-06, "loss": 0.9099, "step": 6440 }, { "epoch": 0.15, "learning_rate": 9.630971285384569e-06, "loss": 1.089, "step": 6441 }, { "epoch": 0.15, "learning_rate": 9.630829667171236e-06, "loss": 0.8217, "step": 6442 }, { "epoch": 0.15, "learning_rate": 9.630688022831076e-06, "loss": 0.9675, "step": 6443 }, { "epoch": 0.15, "learning_rate": 9.630546352364889e-06, "loss": 0.8833, "step": 6444 }, { "epoch": 0.15, "learning_rate": 9.630404655773475e-06, "loss": 1.0945, "step": 6445 }, { "epoch": 0.15, "learning_rate": 9.630262933057633e-06, "loss": 0.948, "step": 6446 }, { "epoch": 0.15, "learning_rate": 9.630121184218162e-06, "loss": 1.1647, "step": 6447 }, { "epoch": 0.15, "learning_rate": 9.629979409255861e-06, "loss": 1.0432, "step": 6448 }, { "epoch": 0.15, "learning_rate": 9.629837608171533e-06, "loss": 1.0501, "step": 6449 }, { "epoch": 0.15, "learning_rate": 9.629695780965975e-06, "loss": 0.8818, "step": 6450 }, { "epoch": 0.15, "learning_rate": 9.629553927639989e-06, "loss": 1.2146, "step": 6451 }, { "epoch": 0.15, "learning_rate": 9.629412048194375e-06, "loss": 0.9261, "step": 6452 }, { "epoch": 0.15, "learning_rate": 9.629270142629932e-06, "loss": 1.108, "step": 6453 }, { "epoch": 0.15, "learning_rate": 9.629128210947463e-06, "loss": 0.9789, "step": 6454 }, { "epoch": 0.15, "learning_rate": 9.628986253147767e-06, "loss": 1.0777, "step": 6455 }, { "epoch": 0.15, "learning_rate": 9.628844269231645e-06, "loss": 0.9475, "step": 6456 }, { "epoch": 0.15, "learning_rate": 9.628702259199899e-06, "loss": 0.9358, "step": 6457 }, { "epoch": 0.15, "learning_rate": 9.62856022305333e-06, "loss": 1.0383, "step": 6458 }, { "epoch": 0.15, "learning_rate": 9.628418160792739e-06, "loss": 1.0046, "step": 6459 }, { "epoch": 0.15, "learning_rate": 9.628276072418927e-06, "loss": 1.2254, "step": 6460 }, { "epoch": 0.15, "learning_rate": 9.628133957932695e-06, "loss": 1.1322, "step": 6461 }, { "epoch": 0.15, "learning_rate": 9.627991817334848e-06, "loss": 1.0082, "step": 6462 }, { "epoch": 0.15, "learning_rate": 9.627849650626185e-06, "loss": 1.0309, "step": 6463 }, { "epoch": 0.15, "learning_rate": 9.62770745780751e-06, "loss": 1.0297, "step": 6464 }, { "epoch": 0.15, "learning_rate": 9.627565238879624e-06, "loss": 1.1379, "step": 6465 }, { "epoch": 0.15, "learning_rate": 9.627422993843329e-06, "loss": 1.1473, "step": 6466 }, { "epoch": 0.15, "learning_rate": 9.627280722699428e-06, "loss": 0.9546, "step": 6467 }, { "epoch": 0.15, "learning_rate": 9.627138425448726e-06, "loss": 0.7869, "step": 6468 }, { "epoch": 0.15, "learning_rate": 9.62699610209202e-06, "loss": 0.7542, "step": 6469 }, { "epoch": 0.15, "learning_rate": 9.626853752630121e-06, "loss": 1.0651, "step": 6470 }, { "epoch": 0.15, "learning_rate": 9.626711377063824e-06, "loss": 1.1188, "step": 6471 }, { "epoch": 0.15, "learning_rate": 9.626568975393939e-06, "loss": 1.0683, "step": 6472 }, { "epoch": 0.15, "learning_rate": 9.626426547621265e-06, "loss": 1.0699, "step": 6473 }, { "epoch": 0.15, "learning_rate": 9.626284093746607e-06, "loss": 1.1511, "step": 6474 }, { "epoch": 0.15, "learning_rate": 9.62614161377077e-06, "loss": 1.1793, "step": 6475 }, { "epoch": 0.15, "learning_rate": 9.625999107694557e-06, "loss": 0.8822, "step": 6476 }, { "epoch": 0.15, "learning_rate": 9.62585657551877e-06, "loss": 0.9253, "step": 6477 }, { "epoch": 0.15, "learning_rate": 9.625714017244217e-06, "loss": 1.1104, "step": 6478 }, { "epoch": 0.15, "learning_rate": 9.625571432871697e-06, "loss": 0.9168, "step": 6479 }, { "epoch": 0.15, "learning_rate": 9.62542882240202e-06, "loss": 0.9781, "step": 6480 }, { "epoch": 0.15, "learning_rate": 9.625286185835987e-06, "loss": 0.8111, "step": 6481 }, { "epoch": 0.15, "learning_rate": 9.625143523174406e-06, "loss": 0.9931, "step": 6482 }, { "epoch": 0.15, "learning_rate": 9.625000834418077e-06, "loss": 1.0328, "step": 6483 }, { "epoch": 0.15, "learning_rate": 9.62485811956781e-06, "loss": 1.1773, "step": 6484 }, { "epoch": 0.15, "learning_rate": 9.624715378624407e-06, "loss": 0.9969, "step": 6485 }, { "epoch": 0.15, "learning_rate": 9.624572611588675e-06, "loss": 0.9886, "step": 6486 }, { "epoch": 0.15, "learning_rate": 9.624429818461418e-06, "loss": 0.8557, "step": 6487 }, { "epoch": 0.15, "learning_rate": 9.624286999243443e-06, "loss": 0.8078, "step": 6488 }, { "epoch": 0.15, "learning_rate": 9.624144153935557e-06, "loss": 1.0258, "step": 6489 }, { "epoch": 0.15, "learning_rate": 9.624001282538562e-06, "loss": 0.9852, "step": 6490 }, { "epoch": 0.15, "learning_rate": 9.623858385053268e-06, "loss": 1.2272, "step": 6491 }, { "epoch": 0.15, "learning_rate": 9.623715461480479e-06, "loss": 1.224, "step": 6492 }, { "epoch": 0.15, "learning_rate": 9.623572511821e-06, "loss": 1.2205, "step": 6493 }, { "epoch": 0.15, "learning_rate": 9.62342953607564e-06, "loss": 1.0161, "step": 6494 }, { "epoch": 0.15, "learning_rate": 9.623286534245206e-06, "loss": 1.0579, "step": 6495 }, { "epoch": 0.15, "learning_rate": 9.623143506330504e-06, "loss": 1.0463, "step": 6496 }, { "epoch": 0.15, "learning_rate": 9.62300045233234e-06, "loss": 1.0234, "step": 6497 }, { "epoch": 0.15, "learning_rate": 9.622857372251524e-06, "loss": 1.2144, "step": 6498 }, { "epoch": 0.15, "learning_rate": 9.622714266088858e-06, "loss": 0.7974, "step": 6499 }, { "epoch": 0.15, "learning_rate": 9.622571133845155e-06, "loss": 0.8614, "step": 6500 }, { "epoch": 0.15, "learning_rate": 9.622427975521218e-06, "loss": 1.0512, "step": 6501 }, { "epoch": 0.15, "learning_rate": 9.62228479111786e-06, "loss": 0.9569, "step": 6502 }, { "epoch": 0.15, "learning_rate": 9.622141580635882e-06, "loss": 1.0575, "step": 6503 }, { "epoch": 0.15, "learning_rate": 9.621998344076098e-06, "loss": 1.1012, "step": 6504 }, { "epoch": 0.15, "learning_rate": 9.621855081439313e-06, "loss": 1.1434, "step": 6505 }, { "epoch": 0.15, "learning_rate": 9.621711792726336e-06, "loss": 1.2295, "step": 6506 }, { "epoch": 0.15, "learning_rate": 9.621568477937975e-06, "loss": 1.0163, "step": 6507 }, { "epoch": 0.15, "learning_rate": 9.62142513707504e-06, "loss": 0.9669, "step": 6508 }, { "epoch": 0.15, "learning_rate": 9.621281770138338e-06, "loss": 0.8359, "step": 6509 }, { "epoch": 0.15, "learning_rate": 9.621138377128678e-06, "loss": 1.2358, "step": 6510 }, { "epoch": 0.15, "learning_rate": 9.62099495804687e-06, "loss": 1.1655, "step": 6511 }, { "epoch": 0.15, "learning_rate": 9.620851512893722e-06, "loss": 1.0562, "step": 6512 }, { "epoch": 0.15, "learning_rate": 9.620708041670046e-06, "loss": 0.9266, "step": 6513 }, { "epoch": 0.15, "learning_rate": 9.62056454437665e-06, "loss": 0.9871, "step": 6514 }, { "epoch": 0.15, "learning_rate": 9.620421021014341e-06, "loss": 1.0103, "step": 6515 }, { "epoch": 0.15, "learning_rate": 9.620277471583932e-06, "loss": 0.8539, "step": 6516 }, { "epoch": 0.15, "learning_rate": 9.62013389608623e-06, "loss": 1.0711, "step": 6517 }, { "epoch": 0.15, "learning_rate": 9.619990294522048e-06, "loss": 1.3098, "step": 6518 }, { "epoch": 0.15, "learning_rate": 9.619846666892197e-06, "loss": 0.765, "step": 6519 }, { "epoch": 0.15, "learning_rate": 9.619703013197483e-06, "loss": 0.9225, "step": 6520 }, { "epoch": 0.15, "learning_rate": 9.619559333438719e-06, "loss": 1.2468, "step": 6521 }, { "epoch": 0.15, "learning_rate": 9.619415627616717e-06, "loss": 0.9359, "step": 6522 }, { "epoch": 0.15, "learning_rate": 9.619271895732285e-06, "loss": 1.0505, "step": 6523 }, { "epoch": 0.15, "learning_rate": 9.619128137786234e-06, "loss": 0.9913, "step": 6524 }, { "epoch": 0.15, "learning_rate": 9.618984353779379e-06, "loss": 1.0214, "step": 6525 }, { "epoch": 0.15, "learning_rate": 9.618840543712527e-06, "loss": 1.0732, "step": 6526 }, { "epoch": 0.15, "learning_rate": 9.61869670758649e-06, "loss": 1.1142, "step": 6527 }, { "epoch": 0.15, "learning_rate": 9.61855284540208e-06, "loss": 0.8052, "step": 6528 }, { "epoch": 0.15, "learning_rate": 9.618408957160112e-06, "loss": 1.0835, "step": 6529 }, { "epoch": 0.15, "learning_rate": 9.618265042861392e-06, "loss": 0.9397, "step": 6530 }, { "epoch": 0.15, "learning_rate": 9.618121102506737e-06, "loss": 1.0038, "step": 6531 }, { "epoch": 0.15, "learning_rate": 9.617977136096955e-06, "loss": 1.2247, "step": 6532 }, { "epoch": 0.15, "learning_rate": 9.617833143632859e-06, "loss": 1.0614, "step": 6533 }, { "epoch": 0.15, "learning_rate": 9.617689125115266e-06, "loss": 0.9551, "step": 6534 }, { "epoch": 0.15, "learning_rate": 9.617545080544983e-06, "loss": 0.8058, "step": 6535 }, { "epoch": 0.15, "learning_rate": 9.617401009922825e-06, "loss": 1.1505, "step": 6536 }, { "epoch": 0.15, "learning_rate": 9.617256913249604e-06, "loss": 1.2376, "step": 6537 }, { "epoch": 0.15, "learning_rate": 9.617112790526135e-06, "loss": 0.9595, "step": 6538 }, { "epoch": 0.15, "learning_rate": 9.616968641753229e-06, "loss": 1.0643, "step": 6539 }, { "epoch": 0.15, "learning_rate": 9.6168244669317e-06, "loss": 1.3561, "step": 6540 }, { "epoch": 0.15, "learning_rate": 9.616680266062362e-06, "loss": 1.0921, "step": 6541 }, { "epoch": 0.15, "learning_rate": 9.616536039146026e-06, "loss": 0.9576, "step": 6542 }, { "epoch": 0.15, "learning_rate": 9.616391786183508e-06, "loss": 0.8359, "step": 6543 }, { "epoch": 0.15, "learning_rate": 9.616247507175624e-06, "loss": 1.1329, "step": 6544 }, { "epoch": 0.15, "learning_rate": 9.616103202123184e-06, "loss": 0.9874, "step": 6545 }, { "epoch": 0.15, "learning_rate": 9.615958871027003e-06, "loss": 1.1511, "step": 6546 }, { "epoch": 0.15, "learning_rate": 9.615814513887896e-06, "loss": 1.1338, "step": 6547 }, { "epoch": 0.15, "learning_rate": 9.615670130706679e-06, "loss": 1.1167, "step": 6548 }, { "epoch": 0.15, "learning_rate": 9.615525721484165e-06, "loss": 0.9721, "step": 6549 }, { "epoch": 0.15, "learning_rate": 9.615381286221168e-06, "loss": 1.1163, "step": 6550 }, { "epoch": 0.15, "learning_rate": 9.615236824918504e-06, "loss": 1.0178, "step": 6551 }, { "epoch": 0.15, "learning_rate": 9.615092337576987e-06, "loss": 1.0774, "step": 6552 }, { "epoch": 0.15, "learning_rate": 9.614947824197434e-06, "loss": 0.9718, "step": 6553 }, { "epoch": 0.15, "learning_rate": 9.614803284780659e-06, "loss": 1.1369, "step": 6554 }, { "epoch": 0.15, "learning_rate": 9.614658719327477e-06, "loss": 1.1679, "step": 6555 }, { "epoch": 0.15, "learning_rate": 9.614514127838706e-06, "loss": 0.7825, "step": 6556 }, { "epoch": 0.15, "learning_rate": 9.614369510315158e-06, "loss": 0.9548, "step": 6557 }, { "epoch": 0.15, "learning_rate": 9.614224866757654e-06, "loss": 1.065, "step": 6558 }, { "epoch": 0.15, "learning_rate": 9.614080197167004e-06, "loss": 0.7359, "step": 6559 }, { "epoch": 0.15, "learning_rate": 9.61393550154403e-06, "loss": 1.184, "step": 6560 }, { "epoch": 0.15, "learning_rate": 9.613790779889544e-06, "loss": 0.9847, "step": 6561 }, { "epoch": 0.15, "learning_rate": 9.613646032204365e-06, "loss": 0.8721, "step": 6562 }, { "epoch": 0.15, "learning_rate": 9.613501258489309e-06, "loss": 1.0943, "step": 6563 }, { "epoch": 0.15, "learning_rate": 9.61335645874519e-06, "loss": 0.8707, "step": 6564 }, { "epoch": 0.15, "learning_rate": 9.613211632972832e-06, "loss": 0.9903, "step": 6565 }, { "epoch": 0.15, "learning_rate": 9.613066781173045e-06, "loss": 0.9596, "step": 6566 }, { "epoch": 0.15, "learning_rate": 9.61292190334665e-06, "loss": 0.8817, "step": 6567 }, { "epoch": 0.15, "learning_rate": 9.612776999494465e-06, "loss": 0.7967, "step": 6568 }, { "epoch": 0.15, "learning_rate": 9.612632069617302e-06, "loss": 1.2052, "step": 6569 }, { "epoch": 0.15, "learning_rate": 9.612487113715985e-06, "loss": 1.0592, "step": 6570 }, { "epoch": 0.15, "learning_rate": 9.61234213179133e-06, "loss": 1.11, "step": 6571 }, { "epoch": 0.15, "learning_rate": 9.612197123844153e-06, "loss": 1.024, "step": 6572 }, { "epoch": 0.15, "learning_rate": 9.612052089875274e-06, "loss": 1.0979, "step": 6573 }, { "epoch": 0.15, "learning_rate": 9.611907029885512e-06, "loss": 1.0404, "step": 6574 }, { "epoch": 0.15, "learning_rate": 9.611761943875684e-06, "loss": 1.0561, "step": 6575 }, { "epoch": 0.15, "learning_rate": 9.611616831846607e-06, "loss": 1.1561, "step": 6576 }, { "epoch": 0.15, "learning_rate": 9.611471693799104e-06, "loss": 1.062, "step": 6577 }, { "epoch": 0.15, "learning_rate": 9.611326529733989e-06, "loss": 0.8375, "step": 6578 }, { "epoch": 0.15, "learning_rate": 9.611181339652086e-06, "loss": 0.9795, "step": 6579 }, { "epoch": 0.15, "learning_rate": 9.611036123554208e-06, "loss": 0.8738, "step": 6580 }, { "epoch": 0.15, "learning_rate": 9.61089088144118e-06, "loss": 1.2977, "step": 6581 }, { "epoch": 0.15, "learning_rate": 9.610745613313818e-06, "loss": 1.0275, "step": 6582 }, { "epoch": 0.15, "learning_rate": 9.610600319172945e-06, "loss": 0.9396, "step": 6583 }, { "epoch": 0.15, "learning_rate": 9.610454999019377e-06, "loss": 1.1485, "step": 6584 }, { "epoch": 0.15, "learning_rate": 9.610309652853937e-06, "loss": 0.8443, "step": 6585 }, { "epoch": 0.15, "learning_rate": 9.610164280677442e-06, "loss": 1.081, "step": 6586 }, { "epoch": 0.15, "learning_rate": 9.610018882490714e-06, "loss": 1.1936, "step": 6587 }, { "epoch": 0.15, "learning_rate": 9.609873458294575e-06, "loss": 1.2594, "step": 6588 }, { "epoch": 0.15, "learning_rate": 9.609728008089841e-06, "loss": 1.0643, "step": 6589 }, { "epoch": 0.15, "learning_rate": 9.609582531877335e-06, "loss": 0.9561, "step": 6590 }, { "epoch": 0.15, "learning_rate": 9.609437029657879e-06, "loss": 1.0824, "step": 6591 }, { "epoch": 0.15, "learning_rate": 9.609291501432293e-06, "loss": 0.9075, "step": 6592 }, { "epoch": 0.15, "learning_rate": 9.609145947201397e-06, "loss": 0.948, "step": 6593 }, { "epoch": 0.15, "learning_rate": 9.609000366966014e-06, "loss": 0.8247, "step": 6594 }, { "epoch": 0.15, "learning_rate": 9.608854760726964e-06, "loss": 0.9708, "step": 6595 }, { "epoch": 0.15, "learning_rate": 9.608709128485069e-06, "loss": 1.0422, "step": 6596 }, { "epoch": 0.15, "learning_rate": 9.60856347024115e-06, "loss": 0.7913, "step": 6597 }, { "epoch": 0.15, "learning_rate": 9.60841778599603e-06, "loss": 1.5257, "step": 6598 }, { "epoch": 0.15, "learning_rate": 9.608272075750532e-06, "loss": 0.9462, "step": 6599 }, { "epoch": 0.15, "learning_rate": 9.608126339505472e-06, "loss": 1.0845, "step": 6600 }, { "epoch": 0.15, "learning_rate": 9.60798057726168e-06, "loss": 0.8509, "step": 6601 }, { "epoch": 0.15, "learning_rate": 9.607834789019973e-06, "loss": 0.8375, "step": 6602 }, { "epoch": 0.15, "learning_rate": 9.607688974781179e-06, "loss": 0.8997, "step": 6603 }, { "epoch": 0.15, "learning_rate": 9.607543134546115e-06, "loss": 1.0972, "step": 6604 }, { "epoch": 0.15, "learning_rate": 9.607397268315607e-06, "loss": 0.9777, "step": 6605 }, { "epoch": 0.15, "learning_rate": 9.607251376090475e-06, "loss": 0.9073, "step": 6606 }, { "epoch": 0.15, "learning_rate": 9.607105457871546e-06, "loss": 1.1494, "step": 6607 }, { "epoch": 0.15, "learning_rate": 9.60695951365964e-06, "loss": 1.0748, "step": 6608 }, { "epoch": 0.15, "learning_rate": 9.606813543455582e-06, "loss": 1.2045, "step": 6609 }, { "epoch": 0.15, "learning_rate": 9.606667547260195e-06, "loss": 1.0873, "step": 6610 }, { "epoch": 0.15, "learning_rate": 9.606521525074305e-06, "loss": 0.9716, "step": 6611 }, { "epoch": 0.15, "learning_rate": 9.606375476898733e-06, "loss": 1.0838, "step": 6612 }, { "epoch": 0.15, "learning_rate": 9.606229402734304e-06, "loss": 1.1021, "step": 6613 }, { "epoch": 0.15, "learning_rate": 9.60608330258184e-06, "loss": 0.9207, "step": 6614 }, { "epoch": 0.15, "learning_rate": 9.60593717644217e-06, "loss": 1.104, "step": 6615 }, { "epoch": 0.15, "learning_rate": 9.605791024316114e-06, "loss": 1.0753, "step": 6616 }, { "epoch": 0.15, "learning_rate": 9.605644846204499e-06, "loss": 0.9268, "step": 6617 }, { "epoch": 0.15, "learning_rate": 9.60549864210815e-06, "loss": 0.7937, "step": 6618 }, { "epoch": 0.15, "learning_rate": 9.60535241202789e-06, "loss": 1.1435, "step": 6619 }, { "epoch": 0.15, "learning_rate": 9.605206155964543e-06, "loss": 0.8443, "step": 6620 }, { "epoch": 0.15, "learning_rate": 9.605059873918939e-06, "loss": 1.0823, "step": 6621 }, { "epoch": 0.15, "learning_rate": 9.6049135658919e-06, "loss": 1.0392, "step": 6622 }, { "epoch": 0.15, "learning_rate": 9.604767231884251e-06, "loss": 0.9347, "step": 6623 }, { "epoch": 0.15, "learning_rate": 9.60462087189682e-06, "loss": 1.0019, "step": 6624 }, { "epoch": 0.15, "learning_rate": 9.60447448593043e-06, "loss": 1.1974, "step": 6625 }, { "epoch": 0.15, "learning_rate": 9.604328073985908e-06, "loss": 1.174, "step": 6626 }, { "epoch": 0.15, "learning_rate": 9.60418163606408e-06, "loss": 0.8599, "step": 6627 }, { "epoch": 0.15, "learning_rate": 9.604035172165773e-06, "loss": 1.0713, "step": 6628 }, { "epoch": 0.15, "learning_rate": 9.603888682291814e-06, "loss": 1.0316, "step": 6629 }, { "epoch": 0.15, "learning_rate": 9.603742166443025e-06, "loss": 1.2838, "step": 6630 }, { "epoch": 0.15, "learning_rate": 9.603595624620237e-06, "loss": 1.1471, "step": 6631 }, { "epoch": 0.15, "learning_rate": 9.603449056824277e-06, "loss": 1.0872, "step": 6632 }, { "epoch": 0.15, "learning_rate": 9.60330246305597e-06, "loss": 0.9778, "step": 6633 }, { "epoch": 0.15, "learning_rate": 9.603155843316143e-06, "loss": 0.8178, "step": 6634 }, { "epoch": 0.15, "learning_rate": 9.603009197605623e-06, "loss": 1.1251, "step": 6635 }, { "epoch": 0.15, "learning_rate": 9.60286252592524e-06, "loss": 0.9113, "step": 6636 }, { "epoch": 0.15, "learning_rate": 9.602715828275819e-06, "loss": 0.9937, "step": 6637 }, { "epoch": 0.15, "learning_rate": 9.60256910465819e-06, "loss": 1.1623, "step": 6638 }, { "epoch": 0.15, "learning_rate": 9.602422355073177e-06, "loss": 0.9757, "step": 6639 }, { "epoch": 0.15, "learning_rate": 9.602275579521612e-06, "loss": 1.1133, "step": 6640 }, { "epoch": 0.15, "learning_rate": 9.60212877800432e-06, "loss": 0.8882, "step": 6641 }, { "epoch": 0.15, "learning_rate": 9.60198195052213e-06, "loss": 1.0935, "step": 6642 }, { "epoch": 0.15, "learning_rate": 9.601835097075872e-06, "loss": 0.8919, "step": 6643 }, { "epoch": 0.15, "learning_rate": 9.601688217666372e-06, "loss": 0.9129, "step": 6644 }, { "epoch": 0.15, "learning_rate": 9.601541312294461e-06, "loss": 1.3487, "step": 6645 }, { "epoch": 0.15, "learning_rate": 9.601394380960967e-06, "loss": 1.1782, "step": 6646 }, { "epoch": 0.15, "learning_rate": 9.60124742366672e-06, "loss": 0.9698, "step": 6647 }, { "epoch": 0.15, "learning_rate": 9.601100440412545e-06, "loss": 1.0104, "step": 6648 }, { "epoch": 0.15, "learning_rate": 9.600953431199276e-06, "loss": 0.9909, "step": 6649 }, { "epoch": 0.15, "learning_rate": 9.600806396027742e-06, "loss": 0.9457, "step": 6650 }, { "epoch": 0.15, "learning_rate": 9.60065933489877e-06, "loss": 0.869, "step": 6651 }, { "epoch": 0.15, "learning_rate": 9.600512247813189e-06, "loss": 0.901, "step": 6652 }, { "epoch": 0.15, "learning_rate": 9.600365134771834e-06, "loss": 0.9513, "step": 6653 }, { "epoch": 0.15, "learning_rate": 9.60021799577553e-06, "loss": 0.917, "step": 6654 }, { "epoch": 0.15, "learning_rate": 9.60007083082511e-06, "loss": 1.0395, "step": 6655 }, { "epoch": 0.15, "learning_rate": 9.599923639921402e-06, "loss": 1.1509, "step": 6656 }, { "epoch": 0.15, "learning_rate": 9.599776423065239e-06, "loss": 1.0164, "step": 6657 }, { "epoch": 0.15, "learning_rate": 9.59962918025745e-06, "loss": 0.9016, "step": 6658 }, { "epoch": 0.15, "learning_rate": 9.599481911498866e-06, "loss": 1.1936, "step": 6659 }, { "epoch": 0.15, "learning_rate": 9.599334616790318e-06, "loss": 1.2762, "step": 6660 }, { "epoch": 0.15, "learning_rate": 9.599187296132638e-06, "loss": 1.0901, "step": 6661 }, { "epoch": 0.15, "learning_rate": 9.599039949526654e-06, "loss": 1.246, "step": 6662 }, { "epoch": 0.15, "learning_rate": 9.5988925769732e-06, "loss": 1.1956, "step": 6663 }, { "epoch": 0.15, "learning_rate": 9.598745178473106e-06, "loss": 0.9222, "step": 6664 }, { "epoch": 0.15, "learning_rate": 9.598597754027205e-06, "loss": 1.0273, "step": 6665 }, { "epoch": 0.15, "learning_rate": 9.59845030363633e-06, "loss": 1.1561, "step": 6666 }, { "epoch": 0.15, "learning_rate": 9.598302827301311e-06, "loss": 1.1716, "step": 6667 }, { "epoch": 0.15, "learning_rate": 9.598155325022979e-06, "loss": 1.1793, "step": 6668 }, { "epoch": 0.15, "learning_rate": 9.598007796802168e-06, "loss": 0.943, "step": 6669 }, { "epoch": 0.15, "learning_rate": 9.59786024263971e-06, "loss": 0.8709, "step": 6670 }, { "epoch": 0.15, "learning_rate": 9.597712662536436e-06, "loss": 1.1933, "step": 6671 }, { "epoch": 0.15, "learning_rate": 9.597565056493181e-06, "loss": 1.4086, "step": 6672 }, { "epoch": 0.15, "learning_rate": 9.597417424510776e-06, "loss": 1.0636, "step": 6673 }, { "epoch": 0.15, "learning_rate": 9.597269766590054e-06, "loss": 1.0889, "step": 6674 }, { "epoch": 0.15, "learning_rate": 9.597122082731851e-06, "loss": 0.8221, "step": 6675 }, { "epoch": 0.15, "learning_rate": 9.596974372936996e-06, "loss": 1.0958, "step": 6676 }, { "epoch": 0.15, "learning_rate": 9.596826637206324e-06, "loss": 1.4035, "step": 6677 }, { "epoch": 0.15, "learning_rate": 9.59667887554067e-06, "loss": 1.0927, "step": 6678 }, { "epoch": 0.15, "learning_rate": 9.596531087940867e-06, "loss": 0.974, "step": 6679 }, { "epoch": 0.15, "learning_rate": 9.596383274407748e-06, "loss": 0.792, "step": 6680 }, { "epoch": 0.15, "learning_rate": 9.596235434942146e-06, "loss": 0.8616, "step": 6681 }, { "epoch": 0.15, "learning_rate": 9.596087569544897e-06, "loss": 0.8528, "step": 6682 }, { "epoch": 0.15, "learning_rate": 9.595939678216835e-06, "loss": 1.0398, "step": 6683 }, { "epoch": 0.16, "learning_rate": 9.595791760958793e-06, "loss": 1.0927, "step": 6684 }, { "epoch": 0.16, "learning_rate": 9.595643817771607e-06, "loss": 1.2018, "step": 6685 }, { "epoch": 0.16, "learning_rate": 9.59549584865611e-06, "loss": 0.8181, "step": 6686 }, { "epoch": 0.16, "learning_rate": 9.59534785361314e-06, "loss": 1.1506, "step": 6687 }, { "epoch": 0.16, "learning_rate": 9.59519983264353e-06, "loss": 1.1281, "step": 6688 }, { "epoch": 0.16, "learning_rate": 9.595051785748113e-06, "loss": 0.8725, "step": 6689 }, { "epoch": 0.16, "learning_rate": 9.594903712927728e-06, "loss": 0.9267, "step": 6690 }, { "epoch": 0.16, "learning_rate": 9.594755614183207e-06, "loss": 1.067, "step": 6691 }, { "epoch": 0.16, "learning_rate": 9.594607489515389e-06, "loss": 0.8928, "step": 6692 }, { "epoch": 0.16, "learning_rate": 9.594459338925108e-06, "loss": 1.0674, "step": 6693 }, { "epoch": 0.16, "learning_rate": 9.5943111624132e-06, "loss": 0.8282, "step": 6694 }, { "epoch": 0.16, "learning_rate": 9.5941629599805e-06, "loss": 0.9498, "step": 6695 }, { "epoch": 0.16, "learning_rate": 9.594014731627846e-06, "loss": 1.106, "step": 6696 }, { "epoch": 0.16, "learning_rate": 9.593866477356073e-06, "loss": 1.0516, "step": 6697 }, { "epoch": 0.16, "learning_rate": 9.593718197166018e-06, "loss": 0.7997, "step": 6698 }, { "epoch": 0.16, "learning_rate": 9.593569891058517e-06, "loss": 1.0037, "step": 6699 }, { "epoch": 0.16, "learning_rate": 9.593421559034408e-06, "loss": 0.8606, "step": 6700 }, { "epoch": 0.16, "learning_rate": 9.593273201094527e-06, "loss": 1.2094, "step": 6701 }, { "epoch": 0.16, "learning_rate": 9.593124817239709e-06, "loss": 0.9521, "step": 6702 }, { "epoch": 0.16, "learning_rate": 9.592976407470795e-06, "loss": 1.1865, "step": 6703 }, { "epoch": 0.16, "learning_rate": 9.592827971788621e-06, "loss": 1.3275, "step": 6704 }, { "epoch": 0.16, "learning_rate": 9.592679510194022e-06, "loss": 1.2607, "step": 6705 }, { "epoch": 0.16, "learning_rate": 9.592531022687838e-06, "loss": 1.0445, "step": 6706 }, { "epoch": 0.16, "learning_rate": 9.592382509270908e-06, "loss": 1.2616, "step": 6707 }, { "epoch": 0.16, "learning_rate": 9.592233969944067e-06, "loss": 0.9621, "step": 6708 }, { "epoch": 0.16, "learning_rate": 9.592085404708156e-06, "loss": 0.8651, "step": 6709 }, { "epoch": 0.16, "learning_rate": 9.59193681356401e-06, "loss": 0.8423, "step": 6710 }, { "epoch": 0.16, "learning_rate": 9.591788196512468e-06, "loss": 1.0977, "step": 6711 }, { "epoch": 0.16, "learning_rate": 9.59163955355437e-06, "loss": 0.9258, "step": 6712 }, { "epoch": 0.16, "learning_rate": 9.591490884690555e-06, "loss": 0.9628, "step": 6713 }, { "epoch": 0.16, "learning_rate": 9.59134218992186e-06, "loss": 1.1394, "step": 6714 }, { "epoch": 0.16, "learning_rate": 9.591193469249126e-06, "loss": 0.9064, "step": 6715 }, { "epoch": 0.16, "learning_rate": 9.591044722673188e-06, "loss": 1.2723, "step": 6716 }, { "epoch": 0.16, "learning_rate": 9.59089595019489e-06, "loss": 1.1296, "step": 6717 }, { "epoch": 0.16, "learning_rate": 9.590747151815068e-06, "loss": 0.9067, "step": 6718 }, { "epoch": 0.16, "learning_rate": 9.590598327534563e-06, "loss": 0.9432, "step": 6719 }, { "epoch": 0.16, "learning_rate": 9.590449477354216e-06, "loss": 1.1487, "step": 6720 }, { "epoch": 0.16, "learning_rate": 9.590300601274864e-06, "loss": 0.7562, "step": 6721 }, { "epoch": 0.16, "learning_rate": 9.59015169929735e-06, "loss": 0.8728, "step": 6722 }, { "epoch": 0.16, "learning_rate": 9.59000277142251e-06, "loss": 0.7373, "step": 6723 }, { "epoch": 0.16, "learning_rate": 9.589853817651188e-06, "loss": 0.7231, "step": 6724 }, { "epoch": 0.16, "learning_rate": 9.589704837984221e-06, "loss": 1.1612, "step": 6725 }, { "epoch": 0.16, "learning_rate": 9.589555832422455e-06, "loss": 0.7192, "step": 6726 }, { "epoch": 0.16, "learning_rate": 9.589406800966725e-06, "loss": 1.1919, "step": 6727 }, { "epoch": 0.16, "learning_rate": 9.589257743617874e-06, "loss": 0.9, "step": 6728 }, { "epoch": 0.16, "learning_rate": 9.589108660376743e-06, "loss": 0.7786, "step": 6729 }, { "epoch": 0.16, "learning_rate": 9.588959551244172e-06, "loss": 1.2624, "step": 6730 }, { "epoch": 0.16, "learning_rate": 9.588810416221005e-06, "loss": 1.0435, "step": 6731 }, { "epoch": 0.16, "learning_rate": 9.588661255308082e-06, "loss": 1.0777, "step": 6732 }, { "epoch": 0.16, "learning_rate": 9.588512068506244e-06, "loss": 1.1243, "step": 6733 }, { "epoch": 0.16, "learning_rate": 9.588362855816332e-06, "loss": 1.2188, "step": 6734 }, { "epoch": 0.16, "learning_rate": 9.58821361723919e-06, "loss": 0.9977, "step": 6735 }, { "epoch": 0.16, "learning_rate": 9.588064352775659e-06, "loss": 1.338, "step": 6736 }, { "epoch": 0.16, "learning_rate": 9.58791506242658e-06, "loss": 1.1848, "step": 6737 }, { "epoch": 0.16, "learning_rate": 9.587765746192797e-06, "loss": 0.8612, "step": 6738 }, { "epoch": 0.16, "learning_rate": 9.587616404075151e-06, "loss": 0.8423, "step": 6739 }, { "epoch": 0.16, "learning_rate": 9.587467036074485e-06, "loss": 1.0633, "step": 6740 }, { "epoch": 0.16, "learning_rate": 9.587317642191643e-06, "loss": 1.2141, "step": 6741 }, { "epoch": 0.16, "learning_rate": 9.587168222427468e-06, "loss": 0.9849, "step": 6742 }, { "epoch": 0.16, "learning_rate": 9.5870187767828e-06, "loss": 1.1319, "step": 6743 }, { "epoch": 0.16, "learning_rate": 9.586869305258484e-06, "loss": 1.1062, "step": 6744 }, { "epoch": 0.16, "learning_rate": 9.586719807855364e-06, "loss": 0.9287, "step": 6745 }, { "epoch": 0.16, "learning_rate": 9.586570284574283e-06, "loss": 1.1309, "step": 6746 }, { "epoch": 0.16, "learning_rate": 9.586420735416084e-06, "loss": 1.0769, "step": 6747 }, { "epoch": 0.16, "learning_rate": 9.586271160381612e-06, "loss": 0.9505, "step": 6748 }, { "epoch": 0.16, "learning_rate": 9.58612155947171e-06, "loss": 1.1677, "step": 6749 }, { "epoch": 0.16, "learning_rate": 9.585971932687221e-06, "loss": 0.7908, "step": 6750 }, { "epoch": 0.16, "learning_rate": 9.585822280028992e-06, "loss": 1.1081, "step": 6751 }, { "epoch": 0.16, "learning_rate": 9.585672601497864e-06, "loss": 1.0333, "step": 6752 }, { "epoch": 0.16, "learning_rate": 9.585522897094683e-06, "loss": 1.3207, "step": 6753 }, { "epoch": 0.16, "learning_rate": 9.585373166820294e-06, "loss": 1.2908, "step": 6754 }, { "epoch": 0.16, "learning_rate": 9.585223410675541e-06, "loss": 1.2105, "step": 6755 }, { "epoch": 0.16, "learning_rate": 9.58507362866127e-06, "loss": 0.8849, "step": 6756 }, { "epoch": 0.16, "learning_rate": 9.584923820778327e-06, "loss": 1.3573, "step": 6757 }, { "epoch": 0.16, "learning_rate": 9.584773987027554e-06, "loss": 0.8969, "step": 6758 }, { "epoch": 0.16, "learning_rate": 9.584624127409798e-06, "loss": 1.0842, "step": 6759 }, { "epoch": 0.16, "learning_rate": 9.584474241925905e-06, "loss": 1.1243, "step": 6760 }, { "epoch": 0.16, "learning_rate": 9.584324330576722e-06, "loss": 0.852, "step": 6761 }, { "epoch": 0.16, "learning_rate": 9.584174393363091e-06, "loss": 0.9594, "step": 6762 }, { "epoch": 0.16, "learning_rate": 9.584024430285858e-06, "loss": 1.0983, "step": 6763 }, { "epoch": 0.16, "learning_rate": 9.583874441345874e-06, "loss": 1.033, "step": 6764 }, { "epoch": 0.16, "learning_rate": 9.583724426543981e-06, "loss": 0.9198, "step": 6765 }, { "epoch": 0.16, "learning_rate": 9.583574385881028e-06, "loss": 1.1352, "step": 6766 }, { "epoch": 0.16, "learning_rate": 9.583424319357856e-06, "loss": 1.2191, "step": 6767 }, { "epoch": 0.16, "learning_rate": 9.58327422697532e-06, "loss": 1.2261, "step": 6768 }, { "epoch": 0.16, "learning_rate": 9.58312410873426e-06, "loss": 1.1745, "step": 6769 }, { "epoch": 0.16, "learning_rate": 9.582973964635528e-06, "loss": 0.9584, "step": 6770 }, { "epoch": 0.16, "learning_rate": 9.582823794679967e-06, "loss": 0.8626, "step": 6771 }, { "epoch": 0.16, "learning_rate": 9.582673598868426e-06, "loss": 1.28, "step": 6772 }, { "epoch": 0.16, "learning_rate": 9.582523377201752e-06, "loss": 1.1238, "step": 6773 }, { "epoch": 0.16, "learning_rate": 9.582373129680793e-06, "loss": 1.0202, "step": 6774 }, { "epoch": 0.16, "learning_rate": 9.582222856306397e-06, "loss": 1.3924, "step": 6775 }, { "epoch": 0.16, "learning_rate": 9.582072557079411e-06, "loss": 1.0224, "step": 6776 }, { "epoch": 0.16, "learning_rate": 9.581922232000685e-06, "loss": 0.8777, "step": 6777 }, { "epoch": 0.16, "learning_rate": 9.581771881071062e-06, "loss": 1.3902, "step": 6778 }, { "epoch": 0.16, "learning_rate": 9.581621504291396e-06, "loss": 0.9579, "step": 6779 }, { "epoch": 0.16, "learning_rate": 9.581471101662533e-06, "loss": 1.0943, "step": 6780 }, { "epoch": 0.16, "learning_rate": 9.58132067318532e-06, "loss": 0.8874, "step": 6781 }, { "epoch": 0.16, "learning_rate": 9.58117021886061e-06, "loss": 1.0258, "step": 6782 }, { "epoch": 0.16, "learning_rate": 9.581019738689248e-06, "loss": 0.9527, "step": 6783 }, { "epoch": 0.16, "learning_rate": 9.580869232672084e-06, "loss": 1.2041, "step": 6784 }, { "epoch": 0.16, "learning_rate": 9.580718700809969e-06, "loss": 0.81, "step": 6785 }, { "epoch": 0.16, "learning_rate": 9.580568143103748e-06, "loss": 1.3452, "step": 6786 }, { "epoch": 0.16, "learning_rate": 9.580417559554273e-06, "loss": 1.034, "step": 6787 }, { "epoch": 0.16, "learning_rate": 9.580266950162396e-06, "loss": 1.3241, "step": 6788 }, { "epoch": 0.16, "learning_rate": 9.580116314928963e-06, "loss": 0.951, "step": 6789 }, { "epoch": 0.16, "learning_rate": 9.579965653854826e-06, "loss": 1.0281, "step": 6790 }, { "epoch": 0.16, "learning_rate": 9.579814966940833e-06, "loss": 1.0065, "step": 6791 }, { "epoch": 0.16, "learning_rate": 9.579664254187837e-06, "loss": 0.9515, "step": 6792 }, { "epoch": 0.16, "learning_rate": 9.579513515596686e-06, "loss": 1.0734, "step": 6793 }, { "epoch": 0.16, "learning_rate": 9.579362751168231e-06, "loss": 1.0186, "step": 6794 }, { "epoch": 0.16, "learning_rate": 9.579211960903323e-06, "loss": 1.0563, "step": 6795 }, { "epoch": 0.16, "learning_rate": 9.579061144802814e-06, "loss": 0.8665, "step": 6796 }, { "epoch": 0.16, "learning_rate": 9.578910302867552e-06, "loss": 0.9029, "step": 6797 }, { "epoch": 0.16, "learning_rate": 9.57875943509839e-06, "loss": 1.173, "step": 6798 }, { "epoch": 0.16, "learning_rate": 9.57860854149618e-06, "loss": 0.7931, "step": 6799 }, { "epoch": 0.16, "learning_rate": 9.57845762206177e-06, "loss": 0.9756, "step": 6800 }, { "epoch": 0.16, "learning_rate": 9.578306676796014e-06, "loss": 1.0606, "step": 6801 }, { "epoch": 0.16, "learning_rate": 9.578155705699763e-06, "loss": 1.0224, "step": 6802 }, { "epoch": 0.16, "learning_rate": 9.57800470877387e-06, "loss": 0.9645, "step": 6803 }, { "epoch": 0.16, "learning_rate": 9.577853686019185e-06, "loss": 1.3162, "step": 6804 }, { "epoch": 0.16, "learning_rate": 9.57770263743656e-06, "loss": 1.1631, "step": 6805 }, { "epoch": 0.16, "learning_rate": 9.57755156302685e-06, "loss": 1.2131, "step": 6806 }, { "epoch": 0.16, "learning_rate": 9.577400462790905e-06, "loss": 1.1351, "step": 6807 }, { "epoch": 0.16, "learning_rate": 9.577249336729577e-06, "loss": 0.855, "step": 6808 }, { "epoch": 0.16, "learning_rate": 9.57709818484372e-06, "loss": 0.745, "step": 6809 }, { "epoch": 0.16, "learning_rate": 9.576947007134187e-06, "loss": 0.993, "step": 6810 }, { "epoch": 0.16, "learning_rate": 9.57679580360183e-06, "loss": 1.1209, "step": 6811 }, { "epoch": 0.16, "learning_rate": 9.576644574247502e-06, "loss": 1.1238, "step": 6812 }, { "epoch": 0.16, "learning_rate": 9.576493319072056e-06, "loss": 0.9177, "step": 6813 }, { "epoch": 0.16, "learning_rate": 9.576342038076347e-06, "loss": 1.3169, "step": 6814 }, { "epoch": 0.16, "learning_rate": 9.576190731261229e-06, "loss": 1.3968, "step": 6815 }, { "epoch": 0.16, "learning_rate": 9.57603939862755e-06, "loss": 0.7769, "step": 6816 }, { "epoch": 0.16, "learning_rate": 9.575888040176172e-06, "loss": 0.9575, "step": 6817 }, { "epoch": 0.16, "learning_rate": 9.575736655907944e-06, "loss": 0.7039, "step": 6818 }, { "epoch": 0.16, "learning_rate": 9.57558524582372e-06, "loss": 0.964, "step": 6819 }, { "epoch": 0.16, "learning_rate": 9.575433809924354e-06, "loss": 0.9309, "step": 6820 }, { "epoch": 0.16, "learning_rate": 9.575282348210703e-06, "loss": 0.8092, "step": 6821 }, { "epoch": 0.16, "learning_rate": 9.575130860683621e-06, "loss": 0.8159, "step": 6822 }, { "epoch": 0.16, "learning_rate": 9.574979347343963e-06, "loss": 0.9639, "step": 6823 }, { "epoch": 0.16, "learning_rate": 9.574827808192581e-06, "loss": 1.1972, "step": 6824 }, { "epoch": 0.16, "learning_rate": 9.574676243230331e-06, "loss": 0.9664, "step": 6825 }, { "epoch": 0.16, "learning_rate": 9.57452465245807e-06, "loss": 1.0518, "step": 6826 }, { "epoch": 0.16, "learning_rate": 9.574373035876652e-06, "loss": 1.1024, "step": 6827 }, { "epoch": 0.16, "learning_rate": 9.574221393486931e-06, "loss": 1.1337, "step": 6828 }, { "epoch": 0.16, "learning_rate": 9.574069725289765e-06, "loss": 0.9869, "step": 6829 }, { "epoch": 0.16, "learning_rate": 9.57391803128601e-06, "loss": 1.4134, "step": 6830 }, { "epoch": 0.16, "learning_rate": 9.57376631147652e-06, "loss": 1.0191, "step": 6831 }, { "epoch": 0.16, "learning_rate": 9.57361456586215e-06, "loss": 1.1441, "step": 6832 }, { "epoch": 0.16, "learning_rate": 9.57346279444376e-06, "loss": 1.1568, "step": 6833 }, { "epoch": 0.16, "learning_rate": 9.573310997222203e-06, "loss": 1.2635, "step": 6834 }, { "epoch": 0.16, "learning_rate": 9.573159174198336e-06, "loss": 0.7875, "step": 6835 }, { "epoch": 0.16, "learning_rate": 9.573007325373016e-06, "loss": 1.3486, "step": 6836 }, { "epoch": 0.16, "learning_rate": 9.5728554507471e-06, "loss": 1.0355, "step": 6837 }, { "epoch": 0.16, "learning_rate": 9.572703550321445e-06, "loss": 1.0967, "step": 6838 }, { "epoch": 0.16, "learning_rate": 9.572551624096906e-06, "loss": 0.9913, "step": 6839 }, { "epoch": 0.16, "learning_rate": 9.572399672074344e-06, "loss": 0.9382, "step": 6840 }, { "epoch": 0.16, "learning_rate": 9.572247694254612e-06, "loss": 0.8218, "step": 6841 }, { "epoch": 0.16, "learning_rate": 9.57209569063857e-06, "loss": 1.0299, "step": 6842 }, { "epoch": 0.16, "learning_rate": 9.571943661227076e-06, "loss": 1.0959, "step": 6843 }, { "epoch": 0.16, "learning_rate": 9.571791606020987e-06, "loss": 1.0296, "step": 6844 }, { "epoch": 0.16, "learning_rate": 9.57163952502116e-06, "loss": 0.9051, "step": 6845 }, { "epoch": 0.16, "learning_rate": 9.571487418228455e-06, "loss": 1.0499, "step": 6846 }, { "epoch": 0.16, "learning_rate": 9.571335285643728e-06, "loss": 0.9312, "step": 6847 }, { "epoch": 0.16, "learning_rate": 9.571183127267838e-06, "loss": 0.9778, "step": 6848 }, { "epoch": 0.16, "learning_rate": 9.571030943101643e-06, "loss": 1.1008, "step": 6849 }, { "epoch": 0.16, "learning_rate": 9.570878733146005e-06, "loss": 0.8417, "step": 6850 }, { "epoch": 0.16, "learning_rate": 9.570726497401776e-06, "loss": 1.0924, "step": 6851 }, { "epoch": 0.16, "learning_rate": 9.570574235869823e-06, "loss": 0.9607, "step": 6852 }, { "epoch": 0.16, "learning_rate": 9.570421948550998e-06, "loss": 1.0837, "step": 6853 }, { "epoch": 0.16, "learning_rate": 9.570269635446166e-06, "loss": 0.8223, "step": 6854 }, { "epoch": 0.16, "learning_rate": 9.570117296556182e-06, "loss": 1.5239, "step": 6855 }, { "epoch": 0.16, "learning_rate": 9.569964931881908e-06, "loss": 1.0125, "step": 6856 }, { "epoch": 0.16, "learning_rate": 9.5698125414242e-06, "loss": 1.0237, "step": 6857 }, { "epoch": 0.16, "learning_rate": 9.569660125183924e-06, "loss": 1.3828, "step": 6858 }, { "epoch": 0.16, "learning_rate": 9.569507683161935e-06, "loss": 1.109, "step": 6859 }, { "epoch": 0.16, "learning_rate": 9.569355215359095e-06, "loss": 1.0003, "step": 6860 }, { "epoch": 0.16, "learning_rate": 9.569202721776263e-06, "loss": 1.3936, "step": 6861 }, { "epoch": 0.16, "learning_rate": 9.569050202414299e-06, "loss": 1.0349, "step": 6862 }, { "epoch": 0.16, "learning_rate": 9.568897657274066e-06, "loss": 1.3119, "step": 6863 }, { "epoch": 0.16, "learning_rate": 9.568745086356422e-06, "loss": 0.9819, "step": 6864 }, { "epoch": 0.16, "learning_rate": 9.56859248966223e-06, "loss": 1.0863, "step": 6865 }, { "epoch": 0.16, "learning_rate": 9.56843986719235e-06, "loss": 1.0379, "step": 6866 }, { "epoch": 0.16, "learning_rate": 9.568287218947643e-06, "loss": 1.141, "step": 6867 }, { "epoch": 0.16, "learning_rate": 9.56813454492897e-06, "loss": 1.0882, "step": 6868 }, { "epoch": 0.16, "learning_rate": 9.567981845137193e-06, "loss": 1.0528, "step": 6869 }, { "epoch": 0.16, "learning_rate": 9.567829119573172e-06, "loss": 1.1175, "step": 6870 }, { "epoch": 0.16, "learning_rate": 9.567676368237771e-06, "loss": 0.888, "step": 6871 }, { "epoch": 0.16, "learning_rate": 9.567523591131852e-06, "loss": 1.0712, "step": 6872 }, { "epoch": 0.16, "learning_rate": 9.567370788256271e-06, "loss": 0.7881, "step": 6873 }, { "epoch": 0.16, "learning_rate": 9.567217959611898e-06, "loss": 0.8336, "step": 6874 }, { "epoch": 0.16, "learning_rate": 9.567065105199593e-06, "loss": 0.9128, "step": 6875 }, { "epoch": 0.16, "learning_rate": 9.566912225020216e-06, "loss": 0.9945, "step": 6876 }, { "epoch": 0.16, "learning_rate": 9.56675931907463e-06, "loss": 0.9829, "step": 6877 }, { "epoch": 0.16, "learning_rate": 9.566606387363699e-06, "loss": 1.2484, "step": 6878 }, { "epoch": 0.16, "learning_rate": 9.566453429888284e-06, "loss": 1.1264, "step": 6879 }, { "epoch": 0.16, "learning_rate": 9.566300446649252e-06, "loss": 1.2389, "step": 6880 }, { "epoch": 0.16, "learning_rate": 9.566147437647463e-06, "loss": 1.0519, "step": 6881 }, { "epoch": 0.16, "learning_rate": 9.56599440288378e-06, "loss": 0.8285, "step": 6882 }, { "epoch": 0.16, "learning_rate": 9.565841342359068e-06, "loss": 1.0533, "step": 6883 }, { "epoch": 0.16, "learning_rate": 9.565688256074189e-06, "loss": 0.8056, "step": 6884 }, { "epoch": 0.16, "learning_rate": 9.565535144030007e-06, "loss": 1.0446, "step": 6885 }, { "epoch": 0.16, "learning_rate": 9.565382006227387e-06, "loss": 0.9837, "step": 6886 }, { "epoch": 0.16, "learning_rate": 9.565228842667191e-06, "loss": 0.989, "step": 6887 }, { "epoch": 0.16, "learning_rate": 9.565075653350286e-06, "loss": 0.9775, "step": 6888 }, { "epoch": 0.16, "learning_rate": 9.564922438277535e-06, "loss": 1.0636, "step": 6889 }, { "epoch": 0.16, "learning_rate": 9.564769197449801e-06, "loss": 0.9249, "step": 6890 }, { "epoch": 0.16, "learning_rate": 9.56461593086795e-06, "loss": 1.032, "step": 6891 }, { "epoch": 0.16, "learning_rate": 9.564462638532845e-06, "loss": 0.7678, "step": 6892 }, { "epoch": 0.16, "learning_rate": 9.564309320445353e-06, "loss": 0.8662, "step": 6893 }, { "epoch": 0.16, "learning_rate": 9.56415597660634e-06, "loss": 1.1618, "step": 6894 }, { "epoch": 0.16, "learning_rate": 9.564002607016669e-06, "loss": 0.8783, "step": 6895 }, { "epoch": 0.16, "learning_rate": 9.563849211677203e-06, "loss": 1.348, "step": 6896 }, { "epoch": 0.16, "learning_rate": 9.563695790588812e-06, "loss": 0.652, "step": 6897 }, { "epoch": 0.16, "learning_rate": 9.563542343752361e-06, "loss": 0.8545, "step": 6898 }, { "epoch": 0.16, "learning_rate": 9.563388871168713e-06, "loss": 1.1143, "step": 6899 }, { "epoch": 0.16, "learning_rate": 9.563235372838736e-06, "loss": 0.9882, "step": 6900 }, { "epoch": 0.16, "learning_rate": 9.563081848763296e-06, "loss": 1.0247, "step": 6901 }, { "epoch": 0.16, "learning_rate": 9.562928298943256e-06, "loss": 1.1425, "step": 6902 }, { "epoch": 0.16, "learning_rate": 9.56277472337949e-06, "loss": 0.9389, "step": 6903 }, { "epoch": 0.16, "learning_rate": 9.562621122072855e-06, "loss": 0.8503, "step": 6904 }, { "epoch": 0.16, "learning_rate": 9.562467495024222e-06, "loss": 1.5516, "step": 6905 }, { "epoch": 0.16, "learning_rate": 9.562313842234459e-06, "loss": 1.1058, "step": 6906 }, { "epoch": 0.16, "learning_rate": 9.562160163704432e-06, "loss": 0.9153, "step": 6907 }, { "epoch": 0.16, "learning_rate": 9.562006459435006e-06, "loss": 0.8315, "step": 6908 }, { "epoch": 0.16, "learning_rate": 9.561852729427052e-06, "loss": 1.0177, "step": 6909 }, { "epoch": 0.16, "learning_rate": 9.561698973681435e-06, "loss": 1.1616, "step": 6910 }, { "epoch": 0.16, "learning_rate": 9.561545192199021e-06, "loss": 0.8872, "step": 6911 }, { "epoch": 0.16, "learning_rate": 9.561391384980681e-06, "loss": 1.2536, "step": 6912 }, { "epoch": 0.16, "learning_rate": 9.56123755202728e-06, "loss": 1.0002, "step": 6913 }, { "epoch": 0.16, "learning_rate": 9.561083693339687e-06, "loss": 0.9551, "step": 6914 }, { "epoch": 0.16, "learning_rate": 9.560929808918771e-06, "loss": 0.8935, "step": 6915 }, { "epoch": 0.16, "learning_rate": 9.560775898765398e-06, "loss": 1.1336, "step": 6916 }, { "epoch": 0.16, "learning_rate": 9.560621962880438e-06, "loss": 0.8367, "step": 6917 }, { "epoch": 0.16, "learning_rate": 9.56046800126476e-06, "loss": 0.6627, "step": 6918 }, { "epoch": 0.16, "learning_rate": 9.56031401391923e-06, "loss": 1.2392, "step": 6919 }, { "epoch": 0.16, "learning_rate": 9.56016000084472e-06, "loss": 1.3582, "step": 6920 }, { "epoch": 0.16, "learning_rate": 9.560005962042095e-06, "loss": 1.1106, "step": 6921 }, { "epoch": 0.16, "learning_rate": 9.559851897512229e-06, "loss": 0.8449, "step": 6922 }, { "epoch": 0.16, "learning_rate": 9.55969780725599e-06, "loss": 1.0106, "step": 6923 }, { "epoch": 0.16, "learning_rate": 9.559543691274244e-06, "loss": 0.8103, "step": 6924 }, { "epoch": 0.16, "learning_rate": 9.559389549567863e-06, "loss": 1.0207, "step": 6925 }, { "epoch": 0.16, "learning_rate": 9.559235382137715e-06, "loss": 1.1935, "step": 6926 }, { "epoch": 0.16, "learning_rate": 9.559081188984673e-06, "loss": 0.9711, "step": 6927 }, { "epoch": 0.16, "learning_rate": 9.558926970109605e-06, "loss": 1.1503, "step": 6928 }, { "epoch": 0.16, "learning_rate": 9.558772725513382e-06, "loss": 1.0546, "step": 6929 }, { "epoch": 0.16, "learning_rate": 9.55861845519687e-06, "loss": 1.0003, "step": 6930 }, { "epoch": 0.16, "learning_rate": 9.558464159160945e-06, "loss": 1.2329, "step": 6931 }, { "epoch": 0.16, "learning_rate": 9.558309837406475e-06, "loss": 1.1411, "step": 6932 }, { "epoch": 0.16, "learning_rate": 9.55815548993433e-06, "loss": 0.8662, "step": 6933 }, { "epoch": 0.16, "learning_rate": 9.558001116745384e-06, "loss": 1.0941, "step": 6934 }, { "epoch": 0.16, "learning_rate": 9.557846717840505e-06, "loss": 1.0197, "step": 6935 }, { "epoch": 0.16, "learning_rate": 9.557692293220565e-06, "loss": 1.2426, "step": 6936 }, { "epoch": 0.16, "learning_rate": 9.557537842886434e-06, "loss": 1.2467, "step": 6937 }, { "epoch": 0.16, "learning_rate": 9.557383366838983e-06, "loss": 1.293, "step": 6938 }, { "epoch": 0.16, "learning_rate": 9.557228865079088e-06, "loss": 1.2021, "step": 6939 }, { "epoch": 0.16, "learning_rate": 9.557074337607616e-06, "loss": 1.1426, "step": 6940 }, { "epoch": 0.16, "learning_rate": 9.55691978442544e-06, "loss": 1.0262, "step": 6941 }, { "epoch": 0.16, "learning_rate": 9.556765205533436e-06, "loss": 0.9711, "step": 6942 }, { "epoch": 0.16, "learning_rate": 9.55661060093247e-06, "loss": 1.0513, "step": 6943 }, { "epoch": 0.16, "learning_rate": 9.556455970623417e-06, "loss": 0.9332, "step": 6944 }, { "epoch": 0.16, "learning_rate": 9.55630131460715e-06, "loss": 0.8055, "step": 6945 }, { "epoch": 0.16, "learning_rate": 9.55614663288454e-06, "loss": 1.0678, "step": 6946 }, { "epoch": 0.16, "learning_rate": 9.555991925456462e-06, "loss": 0.8595, "step": 6947 }, { "epoch": 0.16, "learning_rate": 9.555837192323786e-06, "loss": 1.1882, "step": 6948 }, { "epoch": 0.16, "learning_rate": 9.555682433487388e-06, "loss": 0.7088, "step": 6949 }, { "epoch": 0.16, "learning_rate": 9.555527648948137e-06, "loss": 1.1756, "step": 6950 }, { "epoch": 0.16, "learning_rate": 9.555372838706912e-06, "loss": 0.946, "step": 6951 }, { "epoch": 0.16, "learning_rate": 9.55521800276458e-06, "loss": 1.1265, "step": 6952 }, { "epoch": 0.16, "learning_rate": 9.555063141122021e-06, "loss": 0.9971, "step": 6953 }, { "epoch": 0.16, "learning_rate": 9.554908253780105e-06, "loss": 1.0798, "step": 6954 }, { "epoch": 0.16, "learning_rate": 9.554753340739705e-06, "loss": 0.743, "step": 6955 }, { "epoch": 0.16, "learning_rate": 9.554598402001697e-06, "loss": 0.9482, "step": 6956 }, { "epoch": 0.16, "learning_rate": 9.554443437566957e-06, "loss": 0.9118, "step": 6957 }, { "epoch": 0.16, "learning_rate": 9.554288447436354e-06, "loss": 1.1321, "step": 6958 }, { "epoch": 0.16, "learning_rate": 9.554133431610765e-06, "loss": 1.021, "step": 6959 }, { "epoch": 0.16, "learning_rate": 9.553978390091066e-06, "loss": 0.8166, "step": 6960 }, { "epoch": 0.16, "learning_rate": 9.553823322878132e-06, "loss": 1.1148, "step": 6961 }, { "epoch": 0.16, "learning_rate": 9.553668229972834e-06, "loss": 0.9743, "step": 6962 }, { "epoch": 0.16, "learning_rate": 9.553513111376052e-06, "loss": 1.1045, "step": 6963 }, { "epoch": 0.16, "learning_rate": 9.553357967088658e-06, "loss": 1.0654, "step": 6964 }, { "epoch": 0.16, "learning_rate": 9.553202797111526e-06, "loss": 0.7497, "step": 6965 }, { "epoch": 0.16, "learning_rate": 9.553047601445536e-06, "loss": 0.7978, "step": 6966 }, { "epoch": 0.16, "learning_rate": 9.55289238009156e-06, "loss": 1.0159, "step": 6967 }, { "epoch": 0.16, "learning_rate": 9.552737133050475e-06, "loss": 0.8651, "step": 6968 }, { "epoch": 0.16, "learning_rate": 9.552581860323157e-06, "loss": 0.9914, "step": 6969 }, { "epoch": 0.16, "learning_rate": 9.552426561910485e-06, "loss": 1.029, "step": 6970 }, { "epoch": 0.16, "learning_rate": 9.552271237813327e-06, "loss": 0.8493, "step": 6971 }, { "epoch": 0.16, "learning_rate": 9.552115888032566e-06, "loss": 0.9697, "step": 6972 }, { "epoch": 0.16, "learning_rate": 9.55196051256908e-06, "loss": 1.113, "step": 6973 }, { "epoch": 0.16, "learning_rate": 9.551805111423738e-06, "loss": 1.1647, "step": 6974 }, { "epoch": 0.16, "learning_rate": 9.551649684597421e-06, "loss": 0.8581, "step": 6975 }, { "epoch": 0.16, "learning_rate": 9.551494232091009e-06, "loss": 1.2312, "step": 6976 }, { "epoch": 0.16, "learning_rate": 9.551338753905375e-06, "loss": 0.8754, "step": 6977 }, { "epoch": 0.16, "learning_rate": 9.551183250041396e-06, "loss": 0.9757, "step": 6978 }, { "epoch": 0.16, "learning_rate": 9.551027720499953e-06, "loss": 1.0948, "step": 6979 }, { "epoch": 0.16, "learning_rate": 9.550872165281919e-06, "loss": 1.3953, "step": 6980 }, { "epoch": 0.16, "learning_rate": 9.550716584388175e-06, "loss": 1.0406, "step": 6981 }, { "epoch": 0.16, "learning_rate": 9.550560977819597e-06, "loss": 1.0827, "step": 6982 }, { "epoch": 0.16, "learning_rate": 9.550405345577065e-06, "loss": 1.1505, "step": 6983 }, { "epoch": 0.16, "learning_rate": 9.550249687661453e-06, "loss": 1.2097, "step": 6984 }, { "epoch": 0.16, "learning_rate": 9.550094004073645e-06, "loss": 0.9643, "step": 6985 }, { "epoch": 0.16, "learning_rate": 9.549938294814514e-06, "loss": 0.9444, "step": 6986 }, { "epoch": 0.16, "learning_rate": 9.54978255988494e-06, "loss": 1.3039, "step": 6987 }, { "epoch": 0.16, "learning_rate": 9.549626799285802e-06, "loss": 1.1537, "step": 6988 }, { "epoch": 0.16, "learning_rate": 9.549471013017981e-06, "loss": 0.9632, "step": 6989 }, { "epoch": 0.16, "learning_rate": 9.549315201082353e-06, "loss": 0.8319, "step": 6990 }, { "epoch": 0.16, "learning_rate": 9.5491593634798e-06, "loss": 1.0849, "step": 6991 }, { "epoch": 0.16, "learning_rate": 9.549003500211197e-06, "loss": 1.1666, "step": 6992 }, { "epoch": 0.16, "learning_rate": 9.548847611277426e-06, "loss": 1.0615, "step": 6993 }, { "epoch": 0.16, "learning_rate": 9.548691696679367e-06, "loss": 1.0309, "step": 6994 }, { "epoch": 0.16, "learning_rate": 9.548535756417899e-06, "loss": 0.854, "step": 6995 }, { "epoch": 0.16, "learning_rate": 9.5483797904939e-06, "loss": 0.9432, "step": 6996 }, { "epoch": 0.16, "learning_rate": 9.548223798908254e-06, "loss": 1.0413, "step": 6997 }, { "epoch": 0.16, "learning_rate": 9.548067781661837e-06, "loss": 1.0888, "step": 6998 }, { "epoch": 0.16, "learning_rate": 9.54791173875553e-06, "loss": 0.8141, "step": 6999 }, { "epoch": 0.16, "learning_rate": 9.547755670190217e-06, "loss": 1.1423, "step": 7000 }, { "epoch": 0.16, "learning_rate": 9.547599575966773e-06, "loss": 1.0262, "step": 7001 }, { "epoch": 0.16, "learning_rate": 9.547443456086083e-06, "loss": 1.3105, "step": 7002 }, { "epoch": 0.16, "learning_rate": 9.547287310549026e-06, "loss": 1.0586, "step": 7003 }, { "epoch": 0.16, "learning_rate": 9.547131139356485e-06, "loss": 1.0299, "step": 7004 }, { "epoch": 0.16, "learning_rate": 9.546974942509338e-06, "loss": 1.0765, "step": 7005 }, { "epoch": 0.16, "learning_rate": 9.546818720008469e-06, "loss": 1.1178, "step": 7006 }, { "epoch": 0.16, "learning_rate": 9.546662471854756e-06, "loss": 1.1447, "step": 7007 }, { "epoch": 0.16, "learning_rate": 9.546506198049082e-06, "loss": 1.0591, "step": 7008 }, { "epoch": 0.16, "learning_rate": 9.54634989859233e-06, "loss": 0.9906, "step": 7009 }, { "epoch": 0.16, "learning_rate": 9.546193573485383e-06, "loss": 1.0536, "step": 7010 }, { "epoch": 0.16, "learning_rate": 9.54603722272912e-06, "loss": 1.038, "step": 7011 }, { "epoch": 0.16, "learning_rate": 9.545880846324424e-06, "loss": 0.9969, "step": 7012 }, { "epoch": 0.16, "learning_rate": 9.545724444272177e-06, "loss": 1.524, "step": 7013 }, { "epoch": 0.16, "learning_rate": 9.545568016573263e-06, "loss": 1.2319, "step": 7014 }, { "epoch": 0.16, "learning_rate": 9.545411563228563e-06, "loss": 0.992, "step": 7015 }, { "epoch": 0.16, "learning_rate": 9.54525508423896e-06, "loss": 1.0084, "step": 7016 }, { "epoch": 0.16, "learning_rate": 9.545098579605336e-06, "loss": 0.9676, "step": 7017 }, { "epoch": 0.16, "learning_rate": 9.544942049328575e-06, "loss": 0.8337, "step": 7018 }, { "epoch": 0.16, "learning_rate": 9.544785493409563e-06, "loss": 1.3349, "step": 7019 }, { "epoch": 0.16, "learning_rate": 9.544628911849179e-06, "loss": 0.9569, "step": 7020 }, { "epoch": 0.16, "learning_rate": 9.544472304648306e-06, "loss": 1.109, "step": 7021 }, { "epoch": 0.16, "learning_rate": 9.544315671807831e-06, "loss": 1.0929, "step": 7022 }, { "epoch": 0.16, "learning_rate": 9.544159013328635e-06, "loss": 1.1659, "step": 7023 }, { "epoch": 0.16, "learning_rate": 9.544002329211604e-06, "loss": 1.2603, "step": 7024 }, { "epoch": 0.16, "learning_rate": 9.543845619457622e-06, "loss": 1.0402, "step": 7025 }, { "epoch": 0.16, "learning_rate": 9.543688884067571e-06, "loss": 0.9934, "step": 7026 }, { "epoch": 0.16, "learning_rate": 9.543532123042334e-06, "loss": 1.1127, "step": 7027 }, { "epoch": 0.16, "learning_rate": 9.543375336382802e-06, "loss": 0.7981, "step": 7028 }, { "epoch": 0.16, "learning_rate": 9.543218524089852e-06, "loss": 1.1368, "step": 7029 }, { "epoch": 0.16, "learning_rate": 9.543061686164374e-06, "loss": 1.0616, "step": 7030 }, { "epoch": 0.16, "learning_rate": 9.54290482260725e-06, "loss": 1.1234, "step": 7031 }, { "epoch": 0.16, "learning_rate": 9.542747933419365e-06, "loss": 1.0512, "step": 7032 }, { "epoch": 0.16, "learning_rate": 9.542591018601609e-06, "loss": 1.1248, "step": 7033 }, { "epoch": 0.16, "learning_rate": 9.54243407815486e-06, "loss": 0.7003, "step": 7034 }, { "epoch": 0.16, "learning_rate": 9.542277112080007e-06, "loss": 1.2211, "step": 7035 }, { "epoch": 0.16, "learning_rate": 9.542120120377935e-06, "loss": 0.8455, "step": 7036 }, { "epoch": 0.16, "learning_rate": 9.541963103049534e-06, "loss": 0.9685, "step": 7037 }, { "epoch": 0.16, "learning_rate": 9.541806060095684e-06, "loss": 1.1962, "step": 7038 }, { "epoch": 0.16, "learning_rate": 9.541648991517271e-06, "loss": 1.2119, "step": 7039 }, { "epoch": 0.16, "learning_rate": 9.541491897315187e-06, "loss": 0.8931, "step": 7040 }, { "epoch": 0.16, "learning_rate": 9.541334777490312e-06, "loss": 1.0438, "step": 7041 }, { "epoch": 0.16, "learning_rate": 9.541177632043535e-06, "loss": 1.0617, "step": 7042 }, { "epoch": 0.16, "learning_rate": 9.541020460975745e-06, "loss": 1.148, "step": 7043 }, { "epoch": 0.16, "learning_rate": 9.540863264287824e-06, "loss": 1.1724, "step": 7044 }, { "epoch": 0.16, "learning_rate": 9.540706041980664e-06, "loss": 0.8338, "step": 7045 }, { "epoch": 0.16, "learning_rate": 9.540548794055147e-06, "loss": 1.1653, "step": 7046 }, { "epoch": 0.16, "learning_rate": 9.540391520512163e-06, "loss": 1.3648, "step": 7047 }, { "epoch": 0.16, "learning_rate": 9.5402342213526e-06, "loss": 0.8855, "step": 7048 }, { "epoch": 0.16, "learning_rate": 9.540076896577342e-06, "loss": 0.9558, "step": 7049 }, { "epoch": 0.16, "learning_rate": 9.539919546187282e-06, "loss": 0.7916, "step": 7050 }, { "epoch": 0.16, "learning_rate": 9.539762170183302e-06, "loss": 0.8855, "step": 7051 }, { "epoch": 0.16, "learning_rate": 9.539604768566294e-06, "loss": 0.9607, "step": 7052 }, { "epoch": 0.16, "learning_rate": 9.539447341337145e-06, "loss": 1.0405, "step": 7053 }, { "epoch": 0.16, "learning_rate": 9.539289888496742e-06, "loss": 1.1008, "step": 7054 }, { "epoch": 0.16, "learning_rate": 9.539132410045976e-06, "loss": 1.05, "step": 7055 }, { "epoch": 0.16, "learning_rate": 9.538974905985732e-06, "loss": 1.0916, "step": 7056 }, { "epoch": 0.16, "learning_rate": 9.5388173763169e-06, "loss": 1.0716, "step": 7057 }, { "epoch": 0.16, "learning_rate": 9.538659821040371e-06, "loss": 1.0218, "step": 7058 }, { "epoch": 0.16, "learning_rate": 9.53850224015703e-06, "loss": 1.0908, "step": 7059 }, { "epoch": 0.16, "learning_rate": 9.538344633667769e-06, "loss": 1.3075, "step": 7060 }, { "epoch": 0.16, "learning_rate": 9.538187001573476e-06, "loss": 1.0447, "step": 7061 }, { "epoch": 0.16, "learning_rate": 9.53802934387504e-06, "loss": 1.0646, "step": 7062 }, { "epoch": 0.16, "learning_rate": 9.537871660573353e-06, "loss": 0.9901, "step": 7063 }, { "epoch": 0.16, "learning_rate": 9.537713951669301e-06, "loss": 0.9813, "step": 7064 }, { "epoch": 0.16, "learning_rate": 9.537556217163775e-06, "loss": 0.6722, "step": 7065 }, { "epoch": 0.16, "learning_rate": 9.537398457057668e-06, "loss": 0.7223, "step": 7066 }, { "epoch": 0.16, "learning_rate": 9.537240671351865e-06, "loss": 0.9542, "step": 7067 }, { "epoch": 0.16, "learning_rate": 9.537082860047259e-06, "loss": 1.0839, "step": 7068 }, { "epoch": 0.16, "learning_rate": 9.536925023144742e-06, "loss": 1.0749, "step": 7069 }, { "epoch": 0.16, "learning_rate": 9.536767160645202e-06, "loss": 1.0593, "step": 7070 }, { "epoch": 0.16, "learning_rate": 9.53660927254953e-06, "loss": 0.8722, "step": 7071 }, { "epoch": 0.16, "learning_rate": 9.536451358858615e-06, "loss": 1.0601, "step": 7072 }, { "epoch": 0.16, "learning_rate": 9.536293419573354e-06, "loss": 0.9632, "step": 7073 }, { "epoch": 0.16, "learning_rate": 9.536135454694632e-06, "loss": 1.0189, "step": 7074 }, { "epoch": 0.16, "learning_rate": 9.535977464223343e-06, "loss": 1.1268, "step": 7075 }, { "epoch": 0.16, "learning_rate": 9.535819448160377e-06, "loss": 1.0, "step": 7076 }, { "epoch": 0.16, "learning_rate": 9.535661406506625e-06, "loss": 1.1044, "step": 7077 }, { "epoch": 0.16, "learning_rate": 9.53550333926298e-06, "loss": 1.0467, "step": 7078 }, { "epoch": 0.16, "learning_rate": 9.535345246430336e-06, "loss": 0.8534, "step": 7079 }, { "epoch": 0.16, "learning_rate": 9.535187128009581e-06, "loss": 1.3186, "step": 7080 }, { "epoch": 0.16, "learning_rate": 9.53502898400161e-06, "loss": 1.0067, "step": 7081 }, { "epoch": 0.16, "learning_rate": 9.534870814407314e-06, "loss": 0.9558, "step": 7082 }, { "epoch": 0.16, "learning_rate": 9.534712619227583e-06, "loss": 0.9461, "step": 7083 }, { "epoch": 0.16, "learning_rate": 9.534554398463314e-06, "loss": 1.0905, "step": 7084 }, { "epoch": 0.16, "learning_rate": 9.534396152115397e-06, "loss": 1.0091, "step": 7085 }, { "epoch": 0.16, "learning_rate": 9.534237880184725e-06, "loss": 1.0244, "step": 7086 }, { "epoch": 0.16, "learning_rate": 9.53407958267219e-06, "loss": 1.077, "step": 7087 }, { "epoch": 0.16, "learning_rate": 9.533921259578689e-06, "loss": 1.3128, "step": 7088 }, { "epoch": 0.16, "learning_rate": 9.533762910905111e-06, "loss": 0.8334, "step": 7089 }, { "epoch": 0.16, "learning_rate": 9.533604536652353e-06, "loss": 1.0714, "step": 7090 }, { "epoch": 0.16, "learning_rate": 9.533446136821303e-06, "loss": 1.1043, "step": 7091 }, { "epoch": 0.16, "learning_rate": 9.533287711412862e-06, "loss": 1.2455, "step": 7092 }, { "epoch": 0.16, "learning_rate": 9.533129260427918e-06, "loss": 0.844, "step": 7093 }, { "epoch": 0.16, "learning_rate": 9.532970783867367e-06, "loss": 0.8105, "step": 7094 }, { "epoch": 0.16, "learning_rate": 9.532812281732104e-06, "loss": 1.0701, "step": 7095 }, { "epoch": 0.16, "learning_rate": 9.532653754023023e-06, "loss": 1.0829, "step": 7096 }, { "epoch": 0.16, "learning_rate": 9.532495200741017e-06, "loss": 0.9561, "step": 7097 }, { "epoch": 0.16, "learning_rate": 9.532336621886979e-06, "loss": 0.9907, "step": 7098 }, { "epoch": 0.16, "learning_rate": 9.53217801746181e-06, "loss": 1.0453, "step": 7099 }, { "epoch": 0.16, "learning_rate": 9.532019387466397e-06, "loss": 0.9577, "step": 7100 }, { "epoch": 0.16, "learning_rate": 9.531860731901644e-06, "loss": 0.8611, "step": 7101 }, { "epoch": 0.16, "learning_rate": 9.531702050768437e-06, "loss": 0.9632, "step": 7102 }, { "epoch": 0.16, "learning_rate": 9.531543344067676e-06, "loss": 1.3787, "step": 7103 }, { "epoch": 0.16, "learning_rate": 9.531384611800256e-06, "loss": 1.0411, "step": 7104 }, { "epoch": 0.16, "learning_rate": 9.531225853967074e-06, "loss": 1.1182, "step": 7105 }, { "epoch": 0.16, "learning_rate": 9.531067070569021e-06, "loss": 0.8619, "step": 7106 }, { "epoch": 0.16, "learning_rate": 9.530908261606997e-06, "loss": 1.1449, "step": 7107 }, { "epoch": 0.16, "learning_rate": 9.530749427081899e-06, "loss": 0.8579, "step": 7108 }, { "epoch": 0.16, "learning_rate": 9.530590566994618e-06, "loss": 1.1945, "step": 7109 }, { "epoch": 0.16, "learning_rate": 9.530431681346053e-06, "loss": 0.8295, "step": 7110 }, { "epoch": 0.16, "learning_rate": 9.530272770137102e-06, "loss": 0.954, "step": 7111 }, { "epoch": 0.16, "learning_rate": 9.53011383336866e-06, "loss": 1.0498, "step": 7112 }, { "epoch": 0.16, "learning_rate": 9.529954871041623e-06, "loss": 0.9525, "step": 7113 }, { "epoch": 0.16, "learning_rate": 9.52979588315689e-06, "loss": 0.8039, "step": 7114 }, { "epoch": 0.17, "learning_rate": 9.529636869715356e-06, "loss": 0.8878, "step": 7115 }, { "epoch": 0.17, "learning_rate": 9.52947783071792e-06, "loss": 1.07, "step": 7116 }, { "epoch": 0.17, "learning_rate": 9.529318766165476e-06, "loss": 0.9709, "step": 7117 }, { "epoch": 0.17, "learning_rate": 9.529159676058926e-06, "loss": 1.0209, "step": 7118 }, { "epoch": 0.17, "learning_rate": 9.529000560399163e-06, "loss": 0.9884, "step": 7119 }, { "epoch": 0.17, "learning_rate": 9.528841419187088e-06, "loss": 0.9268, "step": 7120 }, { "epoch": 0.17, "learning_rate": 9.528682252423597e-06, "loss": 1.1012, "step": 7121 }, { "epoch": 0.17, "learning_rate": 9.528523060109591e-06, "loss": 1.1135, "step": 7122 }, { "epoch": 0.17, "learning_rate": 9.528363842245965e-06, "loss": 1.1466, "step": 7123 }, { "epoch": 0.17, "learning_rate": 9.528204598833617e-06, "loss": 1.0296, "step": 7124 }, { "epoch": 0.17, "learning_rate": 9.528045329873448e-06, "loss": 0.9742, "step": 7125 }, { "epoch": 0.17, "learning_rate": 9.527886035366354e-06, "loss": 1.0736, "step": 7126 }, { "epoch": 0.17, "learning_rate": 9.527726715313235e-06, "loss": 0.6795, "step": 7127 }, { "epoch": 0.17, "learning_rate": 9.527567369714989e-06, "loss": 0.9994, "step": 7128 }, { "epoch": 0.17, "learning_rate": 9.527407998572519e-06, "loss": 0.8771, "step": 7129 }, { "epoch": 0.17, "learning_rate": 9.527248601886719e-06, "loss": 1.1476, "step": 7130 }, { "epoch": 0.17, "learning_rate": 9.52708917965849e-06, "loss": 0.876, "step": 7131 }, { "epoch": 0.17, "learning_rate": 9.526929731888733e-06, "loss": 0.8868, "step": 7132 }, { "epoch": 0.17, "learning_rate": 9.526770258578347e-06, "loss": 1.3453, "step": 7133 }, { "epoch": 0.17, "learning_rate": 9.526610759728228e-06, "loss": 0.9385, "step": 7134 }, { "epoch": 0.17, "learning_rate": 9.526451235339282e-06, "loss": 0.925, "step": 7135 }, { "epoch": 0.17, "learning_rate": 9.526291685412403e-06, "loss": 1.0175, "step": 7136 }, { "epoch": 0.17, "learning_rate": 9.526132109948498e-06, "loss": 0.9755, "step": 7137 }, { "epoch": 0.17, "learning_rate": 9.52597250894846e-06, "loss": 1.2244, "step": 7138 }, { "epoch": 0.17, "learning_rate": 9.525812882413194e-06, "loss": 1.1714, "step": 7139 }, { "epoch": 0.17, "learning_rate": 9.5256532303436e-06, "loss": 1.0527, "step": 7140 }, { "epoch": 0.17, "learning_rate": 9.52549355274058e-06, "loss": 1.1737, "step": 7141 }, { "epoch": 0.17, "learning_rate": 9.525333849605033e-06, "loss": 0.9177, "step": 7142 }, { "epoch": 0.17, "learning_rate": 9.525174120937857e-06, "loss": 1.1067, "step": 7143 }, { "epoch": 0.17, "learning_rate": 9.525014366739958e-06, "loss": 1.1227, "step": 7144 }, { "epoch": 0.17, "learning_rate": 9.524854587012237e-06, "loss": 0.9187, "step": 7145 }, { "epoch": 0.17, "learning_rate": 9.524694781755592e-06, "loss": 1.2635, "step": 7146 }, { "epoch": 0.17, "learning_rate": 9.524534950970928e-06, "loss": 0.9017, "step": 7147 }, { "epoch": 0.17, "learning_rate": 9.524375094659147e-06, "loss": 1.1483, "step": 7148 }, { "epoch": 0.17, "learning_rate": 9.524215212821147e-06, "loss": 1.0981, "step": 7149 }, { "epoch": 0.17, "learning_rate": 9.524055305457834e-06, "loss": 0.9463, "step": 7150 }, { "epoch": 0.17, "learning_rate": 9.523895372570108e-06, "loss": 1.0781, "step": 7151 }, { "epoch": 0.17, "learning_rate": 9.523735414158873e-06, "loss": 0.8144, "step": 7152 }, { "epoch": 0.17, "learning_rate": 9.52357543022503e-06, "loss": 0.8276, "step": 7153 }, { "epoch": 0.17, "learning_rate": 9.523415420769482e-06, "loss": 1.2555, "step": 7154 }, { "epoch": 0.17, "learning_rate": 9.52325538579313e-06, "loss": 0.7937, "step": 7155 }, { "epoch": 0.17, "learning_rate": 9.523095325296881e-06, "loss": 1.2366, "step": 7156 }, { "epoch": 0.17, "learning_rate": 9.522935239281636e-06, "loss": 0.8688, "step": 7157 }, { "epoch": 0.17, "learning_rate": 9.522775127748297e-06, "loss": 1.2356, "step": 7158 }, { "epoch": 0.17, "learning_rate": 9.52261499069777e-06, "loss": 0.8576, "step": 7159 }, { "epoch": 0.17, "learning_rate": 9.522454828130953e-06, "loss": 1.0871, "step": 7160 }, { "epoch": 0.17, "learning_rate": 9.522294640048756e-06, "loss": 0.9954, "step": 7161 }, { "epoch": 0.17, "learning_rate": 9.522134426452083e-06, "loss": 1.0428, "step": 7162 }, { "epoch": 0.17, "learning_rate": 9.521974187341831e-06, "loss": 1.3888, "step": 7163 }, { "epoch": 0.17, "learning_rate": 9.52181392271891e-06, "loss": 1.0284, "step": 7164 }, { "epoch": 0.17, "learning_rate": 9.521653632584223e-06, "loss": 1.2117, "step": 7165 }, { "epoch": 0.17, "learning_rate": 9.521493316938673e-06, "loss": 1.03, "step": 7166 }, { "epoch": 0.17, "learning_rate": 9.521332975783164e-06, "loss": 1.0803, "step": 7167 }, { "epoch": 0.17, "learning_rate": 9.521172609118604e-06, "loss": 1.0261, "step": 7168 }, { "epoch": 0.17, "learning_rate": 9.521012216945894e-06, "loss": 0.9332, "step": 7169 }, { "epoch": 0.17, "learning_rate": 9.520851799265942e-06, "loss": 0.9838, "step": 7170 }, { "epoch": 0.17, "learning_rate": 9.52069135607965e-06, "loss": 0.8839, "step": 7171 }, { "epoch": 0.17, "learning_rate": 9.520530887387926e-06, "loss": 1.1181, "step": 7172 }, { "epoch": 0.17, "learning_rate": 9.520370393191675e-06, "loss": 1.0063, "step": 7173 }, { "epoch": 0.17, "learning_rate": 9.5202098734918e-06, "loss": 1.0929, "step": 7174 }, { "epoch": 0.17, "learning_rate": 9.520049328289209e-06, "loss": 1.3701, "step": 7175 }, { "epoch": 0.17, "learning_rate": 9.519888757584808e-06, "loss": 0.9104, "step": 7176 }, { "epoch": 0.17, "learning_rate": 9.519728161379502e-06, "loss": 1.0074, "step": 7177 }, { "epoch": 0.17, "learning_rate": 9.519567539674195e-06, "loss": 0.8174, "step": 7178 }, { "epoch": 0.17, "learning_rate": 9.519406892469797e-06, "loss": 1.0855, "step": 7179 }, { "epoch": 0.17, "learning_rate": 9.519246219767212e-06, "loss": 0.9539, "step": 7180 }, { "epoch": 0.17, "learning_rate": 9.51908552156735e-06, "loss": 1.0467, "step": 7181 }, { "epoch": 0.17, "learning_rate": 9.518924797871111e-06, "loss": 1.2222, "step": 7182 }, { "epoch": 0.17, "learning_rate": 9.518764048679408e-06, "loss": 0.8674, "step": 7183 }, { "epoch": 0.17, "learning_rate": 9.518603273993146e-06, "loss": 0.8018, "step": 7184 }, { "epoch": 0.17, "learning_rate": 9.518442473813229e-06, "loss": 1.0562, "step": 7185 }, { "epoch": 0.17, "learning_rate": 9.51828164814057e-06, "loss": 1.0534, "step": 7186 }, { "epoch": 0.17, "learning_rate": 9.51812079697607e-06, "loss": 1.0043, "step": 7187 }, { "epoch": 0.17, "learning_rate": 9.517959920320642e-06, "loss": 1.2285, "step": 7188 }, { "epoch": 0.17, "learning_rate": 9.517799018175192e-06, "loss": 0.935, "step": 7189 }, { "epoch": 0.17, "learning_rate": 9.517638090540626e-06, "loss": 0.9737, "step": 7190 }, { "epoch": 0.17, "learning_rate": 9.517477137417854e-06, "loss": 0.9929, "step": 7191 }, { "epoch": 0.17, "learning_rate": 9.517316158807783e-06, "loss": 0.9906, "step": 7192 }, { "epoch": 0.17, "learning_rate": 9.517155154711321e-06, "loss": 1.1589, "step": 7193 }, { "epoch": 0.17, "learning_rate": 9.516994125129378e-06, "loss": 1.0539, "step": 7194 }, { "epoch": 0.17, "learning_rate": 9.516833070062859e-06, "loss": 0.7713, "step": 7195 }, { "epoch": 0.17, "learning_rate": 9.516671989512678e-06, "loss": 0.8652, "step": 7196 }, { "epoch": 0.17, "learning_rate": 9.51651088347974e-06, "loss": 0.7971, "step": 7197 }, { "epoch": 0.17, "learning_rate": 9.516349751964952e-06, "loss": 0.9208, "step": 7198 }, { "epoch": 0.17, "learning_rate": 9.51618859496923e-06, "loss": 1.0661, "step": 7199 }, { "epoch": 0.17, "learning_rate": 9.516027412493477e-06, "loss": 0.9591, "step": 7200 }, { "epoch": 0.17, "learning_rate": 9.515866204538604e-06, "loss": 0.8476, "step": 7201 }, { "epoch": 0.17, "learning_rate": 9.515704971105522e-06, "loss": 1.0083, "step": 7202 }, { "epoch": 0.17, "learning_rate": 9.51554371219514e-06, "loss": 1.0768, "step": 7203 }, { "epoch": 0.17, "learning_rate": 9.515382427808367e-06, "loss": 1.2552, "step": 7204 }, { "epoch": 0.17, "learning_rate": 9.515221117946115e-06, "loss": 1.0622, "step": 7205 }, { "epoch": 0.17, "learning_rate": 9.515059782609291e-06, "loss": 1.0248, "step": 7206 }, { "epoch": 0.17, "learning_rate": 9.514898421798807e-06, "loss": 0.9524, "step": 7207 }, { "epoch": 0.17, "learning_rate": 9.514737035515572e-06, "loss": 1.0459, "step": 7208 }, { "epoch": 0.17, "learning_rate": 9.514575623760499e-06, "loss": 1.0367, "step": 7209 }, { "epoch": 0.17, "learning_rate": 9.514414186534497e-06, "loss": 0.8558, "step": 7210 }, { "epoch": 0.17, "learning_rate": 9.514252723838478e-06, "loss": 0.9685, "step": 7211 }, { "epoch": 0.17, "learning_rate": 9.514091235673351e-06, "loss": 1.0426, "step": 7212 }, { "epoch": 0.17, "learning_rate": 9.513929722040029e-06, "loss": 1.0285, "step": 7213 }, { "epoch": 0.17, "learning_rate": 9.513768182939424e-06, "loss": 1.0556, "step": 7214 }, { "epoch": 0.17, "learning_rate": 9.513606618372444e-06, "loss": 1.0648, "step": 7215 }, { "epoch": 0.17, "learning_rate": 9.513445028340002e-06, "loss": 1.0714, "step": 7216 }, { "epoch": 0.17, "learning_rate": 9.513283412843013e-06, "loss": 1.0477, "step": 7217 }, { "epoch": 0.17, "learning_rate": 9.513121771882383e-06, "loss": 1.0461, "step": 7218 }, { "epoch": 0.17, "learning_rate": 9.512960105459028e-06, "loss": 1.4006, "step": 7219 }, { "epoch": 0.17, "learning_rate": 9.512798413573861e-06, "loss": 0.9337, "step": 7220 }, { "epoch": 0.17, "learning_rate": 9.512636696227789e-06, "loss": 1.0638, "step": 7221 }, { "epoch": 0.17, "learning_rate": 9.51247495342173e-06, "loss": 0.9181, "step": 7222 }, { "epoch": 0.17, "learning_rate": 9.512313185156594e-06, "loss": 1.2577, "step": 7223 }, { "epoch": 0.17, "learning_rate": 9.512151391433293e-06, "loss": 0.8369, "step": 7224 }, { "epoch": 0.17, "learning_rate": 9.51198957225274e-06, "loss": 1.0129, "step": 7225 }, { "epoch": 0.17, "learning_rate": 9.51182772761585e-06, "loss": 1.171, "step": 7226 }, { "epoch": 0.17, "learning_rate": 9.511665857523535e-06, "loss": 1.0863, "step": 7227 }, { "epoch": 0.17, "learning_rate": 9.511503961976708e-06, "loss": 0.9458, "step": 7228 }, { "epoch": 0.17, "learning_rate": 9.511342040976282e-06, "loss": 0.8974, "step": 7229 }, { "epoch": 0.17, "learning_rate": 9.511180094523171e-06, "loss": 1.1102, "step": 7230 }, { "epoch": 0.17, "learning_rate": 9.51101812261829e-06, "loss": 1.3677, "step": 7231 }, { "epoch": 0.17, "learning_rate": 9.510856125262551e-06, "loss": 1.0754, "step": 7232 }, { "epoch": 0.17, "learning_rate": 9.510694102456867e-06, "loss": 0.7197, "step": 7233 }, { "epoch": 0.17, "learning_rate": 9.510532054202157e-06, "loss": 0.9817, "step": 7234 }, { "epoch": 0.17, "learning_rate": 9.51036998049933e-06, "loss": 1.0724, "step": 7235 }, { "epoch": 0.17, "learning_rate": 9.510207881349303e-06, "loss": 1.4065, "step": 7236 }, { "epoch": 0.17, "learning_rate": 9.510045756752988e-06, "loss": 1.0626, "step": 7237 }, { "epoch": 0.17, "learning_rate": 9.509883606711303e-06, "loss": 1.0576, "step": 7238 }, { "epoch": 0.17, "learning_rate": 9.509721431225162e-06, "loss": 1.137, "step": 7239 }, { "epoch": 0.17, "learning_rate": 9.509559230295479e-06, "loss": 1.1095, "step": 7240 }, { "epoch": 0.17, "learning_rate": 9.509397003923168e-06, "loss": 1.0455, "step": 7241 }, { "epoch": 0.17, "learning_rate": 9.509234752109148e-06, "loss": 0.9598, "step": 7242 }, { "epoch": 0.17, "learning_rate": 9.509072474854331e-06, "loss": 1.0746, "step": 7243 }, { "epoch": 0.17, "learning_rate": 9.508910172159635e-06, "loss": 1.1499, "step": 7244 }, { "epoch": 0.17, "learning_rate": 9.508747844025975e-06, "loss": 1.0147, "step": 7245 }, { "epoch": 0.17, "learning_rate": 9.508585490454263e-06, "loss": 0.838, "step": 7246 }, { "epoch": 0.17, "learning_rate": 9.508423111445422e-06, "loss": 0.9867, "step": 7247 }, { "epoch": 0.17, "learning_rate": 9.508260707000363e-06, "loss": 1.0811, "step": 7248 }, { "epoch": 0.17, "learning_rate": 9.508098277120003e-06, "loss": 0.8308, "step": 7249 }, { "epoch": 0.17, "learning_rate": 9.50793582180526e-06, "loss": 0.8471, "step": 7250 }, { "epoch": 0.17, "learning_rate": 9.507773341057049e-06, "loss": 0.9741, "step": 7251 }, { "epoch": 0.17, "learning_rate": 9.507610834876289e-06, "loss": 0.8946, "step": 7252 }, { "epoch": 0.17, "learning_rate": 9.507448303263893e-06, "loss": 0.9355, "step": 7253 }, { "epoch": 0.17, "learning_rate": 9.507285746220782e-06, "loss": 1.0741, "step": 7254 }, { "epoch": 0.17, "learning_rate": 9.507123163747871e-06, "loss": 0.9898, "step": 7255 }, { "epoch": 0.17, "learning_rate": 9.506960555846077e-06, "loss": 1.0067, "step": 7256 }, { "epoch": 0.17, "learning_rate": 9.50679792251632e-06, "loss": 1.0068, "step": 7257 }, { "epoch": 0.17, "learning_rate": 9.506635263759514e-06, "loss": 0.8812, "step": 7258 }, { "epoch": 0.17, "learning_rate": 9.50647257957658e-06, "loss": 1.2081, "step": 7259 }, { "epoch": 0.17, "learning_rate": 9.506309869968431e-06, "loss": 1.0834, "step": 7260 }, { "epoch": 0.17, "learning_rate": 9.50614713493599e-06, "loss": 1.1218, "step": 7261 }, { "epoch": 0.17, "learning_rate": 9.505984374480176e-06, "loss": 1.2062, "step": 7262 }, { "epoch": 0.17, "learning_rate": 9.5058215886019e-06, "loss": 0.9264, "step": 7263 }, { "epoch": 0.17, "learning_rate": 9.505658777302088e-06, "loss": 1.1138, "step": 7264 }, { "epoch": 0.17, "learning_rate": 9.505495940581655e-06, "loss": 0.9302, "step": 7265 }, { "epoch": 0.17, "learning_rate": 9.505333078441521e-06, "loss": 0.9947, "step": 7266 }, { "epoch": 0.17, "learning_rate": 9.505170190882603e-06, "loss": 0.9686, "step": 7267 }, { "epoch": 0.17, "learning_rate": 9.505007277905822e-06, "loss": 1.0544, "step": 7268 }, { "epoch": 0.17, "learning_rate": 9.504844339512096e-06, "loss": 0.8614, "step": 7269 }, { "epoch": 0.17, "learning_rate": 9.504681375702345e-06, "loss": 0.9432, "step": 7270 }, { "epoch": 0.17, "learning_rate": 9.504518386477488e-06, "loss": 0.9713, "step": 7271 }, { "epoch": 0.17, "learning_rate": 9.504355371838445e-06, "loss": 0.9151, "step": 7272 }, { "epoch": 0.17, "learning_rate": 9.504192331786135e-06, "loss": 1.2299, "step": 7273 }, { "epoch": 0.17, "learning_rate": 9.504029266321479e-06, "loss": 0.949, "step": 7274 }, { "epoch": 0.17, "learning_rate": 9.503866175445395e-06, "loss": 1.0668, "step": 7275 }, { "epoch": 0.17, "learning_rate": 9.503703059158804e-06, "loss": 0.8197, "step": 7276 }, { "epoch": 0.17, "learning_rate": 9.503539917462627e-06, "loss": 0.9691, "step": 7277 }, { "epoch": 0.17, "learning_rate": 9.503376750357786e-06, "loss": 0.9521, "step": 7278 }, { "epoch": 0.17, "learning_rate": 9.503213557845199e-06, "loss": 0.9371, "step": 7279 }, { "epoch": 0.17, "learning_rate": 9.503050339925786e-06, "loss": 1.0271, "step": 7280 }, { "epoch": 0.17, "learning_rate": 9.50288709660047e-06, "loss": 0.9692, "step": 7281 }, { "epoch": 0.17, "learning_rate": 9.502723827870171e-06, "loss": 1.1706, "step": 7282 }, { "epoch": 0.17, "learning_rate": 9.502560533735813e-06, "loss": 0.9401, "step": 7283 }, { "epoch": 0.17, "learning_rate": 9.502397214198311e-06, "loss": 1.043, "step": 7284 }, { "epoch": 0.17, "learning_rate": 9.502233869258591e-06, "loss": 1.1704, "step": 7285 }, { "epoch": 0.17, "learning_rate": 9.502070498917574e-06, "loss": 1.0784, "step": 7286 }, { "epoch": 0.17, "learning_rate": 9.501907103176182e-06, "loss": 1.1222, "step": 7287 }, { "epoch": 0.17, "learning_rate": 9.501743682035337e-06, "loss": 1.0201, "step": 7288 }, { "epoch": 0.17, "learning_rate": 9.50158023549596e-06, "loss": 1.0419, "step": 7289 }, { "epoch": 0.17, "learning_rate": 9.501416763558972e-06, "loss": 1.0563, "step": 7290 }, { "epoch": 0.17, "learning_rate": 9.5012532662253e-06, "loss": 0.7473, "step": 7291 }, { "epoch": 0.17, "learning_rate": 9.501089743495861e-06, "loss": 1.0418, "step": 7292 }, { "epoch": 0.17, "learning_rate": 9.50092619537158e-06, "loss": 1.0195, "step": 7293 }, { "epoch": 0.17, "learning_rate": 9.500762621853378e-06, "loss": 1.2111, "step": 7294 }, { "epoch": 0.17, "learning_rate": 9.500599022942181e-06, "loss": 0.9825, "step": 7295 }, { "epoch": 0.17, "learning_rate": 9.500435398638911e-06, "loss": 1.1091, "step": 7296 }, { "epoch": 0.17, "learning_rate": 9.50027174894449e-06, "loss": 0.8454, "step": 7297 }, { "epoch": 0.17, "learning_rate": 9.500108073859842e-06, "loss": 1.3016, "step": 7298 }, { "epoch": 0.17, "learning_rate": 9.499944373385891e-06, "loss": 0.819, "step": 7299 }, { "epoch": 0.17, "learning_rate": 9.49978064752356e-06, "loss": 1.2438, "step": 7300 }, { "epoch": 0.17, "learning_rate": 9.499616896273771e-06, "loss": 1.1823, "step": 7301 }, { "epoch": 0.17, "learning_rate": 9.49945311963745e-06, "loss": 1.3172, "step": 7302 }, { "epoch": 0.17, "learning_rate": 9.499289317615521e-06, "loss": 1.1474, "step": 7303 }, { "epoch": 0.17, "learning_rate": 9.499125490208907e-06, "loss": 0.8939, "step": 7304 }, { "epoch": 0.17, "learning_rate": 9.498961637418536e-06, "loss": 0.8058, "step": 7305 }, { "epoch": 0.17, "learning_rate": 9.498797759245326e-06, "loss": 0.9372, "step": 7306 }, { "epoch": 0.17, "learning_rate": 9.498633855690206e-06, "loss": 0.9523, "step": 7307 }, { "epoch": 0.17, "learning_rate": 9.4984699267541e-06, "loss": 1.041, "step": 7308 }, { "epoch": 0.17, "learning_rate": 9.498305972437934e-06, "loss": 0.9467, "step": 7309 }, { "epoch": 0.17, "learning_rate": 9.498141992742628e-06, "loss": 0.7576, "step": 7310 }, { "epoch": 0.17, "learning_rate": 9.497977987669114e-06, "loss": 1.012, "step": 7311 }, { "epoch": 0.17, "learning_rate": 9.497813957218313e-06, "loss": 0.9278, "step": 7312 }, { "epoch": 0.17, "learning_rate": 9.497649901391152e-06, "loss": 1.1714, "step": 7313 }, { "epoch": 0.17, "learning_rate": 9.497485820188556e-06, "loss": 0.9307, "step": 7314 }, { "epoch": 0.17, "learning_rate": 9.497321713611452e-06, "loss": 0.881, "step": 7315 }, { "epoch": 0.17, "learning_rate": 9.497157581660764e-06, "loss": 0.9822, "step": 7316 }, { "epoch": 0.17, "learning_rate": 9.49699342433742e-06, "loss": 1.19, "step": 7317 }, { "epoch": 0.17, "learning_rate": 9.496829241642343e-06, "loss": 1.1685, "step": 7318 }, { "epoch": 0.17, "learning_rate": 9.496665033576462e-06, "loss": 0.9897, "step": 7319 }, { "epoch": 0.17, "learning_rate": 9.496500800140701e-06, "loss": 0.9199, "step": 7320 }, { "epoch": 0.17, "learning_rate": 9.496336541335991e-06, "loss": 1.0256, "step": 7321 }, { "epoch": 0.17, "learning_rate": 9.496172257163256e-06, "loss": 0.9841, "step": 7322 }, { "epoch": 0.17, "learning_rate": 9.496007947623422e-06, "loss": 0.875, "step": 7323 }, { "epoch": 0.17, "learning_rate": 9.495843612717417e-06, "loss": 1.1808, "step": 7324 }, { "epoch": 0.17, "learning_rate": 9.495679252446168e-06, "loss": 1.0806, "step": 7325 }, { "epoch": 0.17, "learning_rate": 9.495514866810602e-06, "loss": 1.3708, "step": 7326 }, { "epoch": 0.17, "learning_rate": 9.495350455811647e-06, "loss": 0.8814, "step": 7327 }, { "epoch": 0.17, "learning_rate": 9.495186019450231e-06, "loss": 0.9086, "step": 7328 }, { "epoch": 0.17, "learning_rate": 9.495021557727283e-06, "loss": 1.2765, "step": 7329 }, { "epoch": 0.17, "learning_rate": 9.494857070643725e-06, "loss": 1.1441, "step": 7330 }, { "epoch": 0.17, "learning_rate": 9.494692558200493e-06, "loss": 1.0011, "step": 7331 }, { "epoch": 0.17, "learning_rate": 9.49452802039851e-06, "loss": 1.0181, "step": 7332 }, { "epoch": 0.17, "learning_rate": 9.494363457238706e-06, "loss": 0.6986, "step": 7333 }, { "epoch": 0.17, "learning_rate": 9.49419886872201e-06, "loss": 1.4387, "step": 7334 }, { "epoch": 0.17, "learning_rate": 9.494034254849346e-06, "loss": 0.8078, "step": 7335 }, { "epoch": 0.17, "learning_rate": 9.49386961562165e-06, "loss": 0.7796, "step": 7336 }, { "epoch": 0.17, "learning_rate": 9.493704951039846e-06, "loss": 0.7907, "step": 7337 }, { "epoch": 0.17, "learning_rate": 9.493540261104863e-06, "loss": 0.8852, "step": 7338 }, { "epoch": 0.17, "learning_rate": 9.493375545817634e-06, "loss": 1.0187, "step": 7339 }, { "epoch": 0.17, "learning_rate": 9.493210805179086e-06, "loss": 0.8759, "step": 7340 }, { "epoch": 0.17, "learning_rate": 9.493046039190146e-06, "loss": 0.8597, "step": 7341 }, { "epoch": 0.17, "learning_rate": 9.492881247851745e-06, "loss": 1.0872, "step": 7342 }, { "epoch": 0.17, "learning_rate": 9.492716431164817e-06, "loss": 1.0529, "step": 7343 }, { "epoch": 0.17, "learning_rate": 9.492551589130286e-06, "loss": 1.0573, "step": 7344 }, { "epoch": 0.17, "learning_rate": 9.492386721749086e-06, "loss": 0.8267, "step": 7345 }, { "epoch": 0.17, "learning_rate": 9.492221829022145e-06, "loss": 0.9967, "step": 7346 }, { "epoch": 0.17, "learning_rate": 9.492056910950394e-06, "loss": 0.9481, "step": 7347 }, { "epoch": 0.17, "learning_rate": 9.491891967534763e-06, "loss": 1.3253, "step": 7348 }, { "epoch": 0.17, "learning_rate": 9.491726998776185e-06, "loss": 1.1172, "step": 7349 }, { "epoch": 0.17, "learning_rate": 9.491562004675586e-06, "loss": 0.9766, "step": 7350 }, { "epoch": 0.17, "learning_rate": 9.491396985233902e-06, "loss": 0.9689, "step": 7351 }, { "epoch": 0.17, "learning_rate": 9.49123194045206e-06, "loss": 1.1602, "step": 7352 }, { "epoch": 0.17, "learning_rate": 9.491066870330993e-06, "loss": 0.7162, "step": 7353 }, { "epoch": 0.17, "learning_rate": 9.490901774871634e-06, "loss": 0.9095, "step": 7354 }, { "epoch": 0.17, "learning_rate": 9.49073665407491e-06, "loss": 1.1524, "step": 7355 }, { "epoch": 0.17, "learning_rate": 9.490571507941758e-06, "loss": 0.8418, "step": 7356 }, { "epoch": 0.17, "learning_rate": 9.490406336473106e-06, "loss": 1.0352, "step": 7357 }, { "epoch": 0.17, "learning_rate": 9.490241139669887e-06, "loss": 1.0126, "step": 7358 }, { "epoch": 0.17, "learning_rate": 9.490075917533033e-06, "loss": 1.0752, "step": 7359 }, { "epoch": 0.17, "learning_rate": 9.489910670063476e-06, "loss": 0.8541, "step": 7360 }, { "epoch": 0.17, "learning_rate": 9.489745397262147e-06, "loss": 1.2094, "step": 7361 }, { "epoch": 0.17, "learning_rate": 9.48958009912998e-06, "loss": 0.9657, "step": 7362 }, { "epoch": 0.17, "learning_rate": 9.489414775667908e-06, "loss": 1.2214, "step": 7363 }, { "epoch": 0.17, "learning_rate": 9.489249426876865e-06, "loss": 1.0036, "step": 7364 }, { "epoch": 0.17, "learning_rate": 9.48908405275778e-06, "loss": 0.9702, "step": 7365 }, { "epoch": 0.17, "learning_rate": 9.48891865331159e-06, "loss": 0.8838, "step": 7366 }, { "epoch": 0.17, "learning_rate": 9.488753228539224e-06, "loss": 1.2202, "step": 7367 }, { "epoch": 0.17, "learning_rate": 9.48858777844162e-06, "loss": 1.0079, "step": 7368 }, { "epoch": 0.17, "learning_rate": 9.488422303019707e-06, "loss": 1.1984, "step": 7369 }, { "epoch": 0.17, "learning_rate": 9.488256802274422e-06, "loss": 1.1941, "step": 7370 }, { "epoch": 0.17, "learning_rate": 9.488091276206697e-06, "loss": 1.0689, "step": 7371 }, { "epoch": 0.17, "learning_rate": 9.487925724817466e-06, "loss": 1.0365, "step": 7372 }, { "epoch": 0.17, "learning_rate": 9.487760148107663e-06, "loss": 0.855, "step": 7373 }, { "epoch": 0.17, "learning_rate": 9.487594546078223e-06, "loss": 0.803, "step": 7374 }, { "epoch": 0.17, "learning_rate": 9.48742891873008e-06, "loss": 1.0777, "step": 7375 }, { "epoch": 0.17, "learning_rate": 9.487263266064169e-06, "loss": 0.8652, "step": 7376 }, { "epoch": 0.17, "learning_rate": 9.487097588081424e-06, "loss": 1.0288, "step": 7377 }, { "epoch": 0.17, "learning_rate": 9.486931884782777e-06, "loss": 1.0975, "step": 7378 }, { "epoch": 0.17, "learning_rate": 9.486766156169168e-06, "loss": 1.0551, "step": 7379 }, { "epoch": 0.17, "learning_rate": 9.486600402241528e-06, "loss": 0.8161, "step": 7380 }, { "epoch": 0.17, "learning_rate": 9.486434623000796e-06, "loss": 0.9013, "step": 7381 }, { "epoch": 0.17, "learning_rate": 9.486268818447903e-06, "loss": 0.9788, "step": 7382 }, { "epoch": 0.17, "learning_rate": 9.486102988583787e-06, "loss": 0.9956, "step": 7383 }, { "epoch": 0.17, "learning_rate": 9.485937133409381e-06, "loss": 1.0724, "step": 7384 }, { "epoch": 0.17, "learning_rate": 9.485771252925626e-06, "loss": 0.9286, "step": 7385 }, { "epoch": 0.17, "learning_rate": 9.485605347133453e-06, "loss": 0.966, "step": 7386 }, { "epoch": 0.17, "learning_rate": 9.485439416033802e-06, "loss": 0.9873, "step": 7387 }, { "epoch": 0.17, "learning_rate": 9.485273459627604e-06, "loss": 0.8262, "step": 7388 }, { "epoch": 0.17, "learning_rate": 9.485107477915798e-06, "loss": 0.7587, "step": 7389 }, { "epoch": 0.17, "learning_rate": 9.484941470899322e-06, "loss": 0.9164, "step": 7390 }, { "epoch": 0.17, "learning_rate": 9.484775438579112e-06, "loss": 0.8957, "step": 7391 }, { "epoch": 0.17, "learning_rate": 9.484609380956104e-06, "loss": 0.9804, "step": 7392 }, { "epoch": 0.17, "learning_rate": 9.484443298031234e-06, "loss": 1.0797, "step": 7393 }, { "epoch": 0.17, "learning_rate": 9.48427718980544e-06, "loss": 0.9817, "step": 7394 }, { "epoch": 0.17, "learning_rate": 9.48411105627966e-06, "loss": 1.0325, "step": 7395 }, { "epoch": 0.17, "learning_rate": 9.48394489745483e-06, "loss": 0.8915, "step": 7396 }, { "epoch": 0.17, "learning_rate": 9.483778713331889e-06, "loss": 0.8824, "step": 7397 }, { "epoch": 0.17, "learning_rate": 9.48361250391177e-06, "loss": 1.2377, "step": 7398 }, { "epoch": 0.17, "learning_rate": 9.483446269195418e-06, "loss": 1.1612, "step": 7399 }, { "epoch": 0.17, "learning_rate": 9.483280009183765e-06, "loss": 1.2402, "step": 7400 }, { "epoch": 0.17, "learning_rate": 9.483113723877751e-06, "loss": 0.8286, "step": 7401 }, { "epoch": 0.17, "learning_rate": 9.482947413278316e-06, "loss": 1.0564, "step": 7402 }, { "epoch": 0.17, "learning_rate": 9.482781077386395e-06, "loss": 1.0098, "step": 7403 }, { "epoch": 0.17, "learning_rate": 9.48261471620293e-06, "loss": 1.1597, "step": 7404 }, { "epoch": 0.17, "learning_rate": 9.482448329728854e-06, "loss": 1.0447, "step": 7405 }, { "epoch": 0.17, "learning_rate": 9.482281917965113e-06, "loss": 1.062, "step": 7406 }, { "epoch": 0.17, "learning_rate": 9.482115480912642e-06, "loss": 1.0673, "step": 7407 }, { "epoch": 0.17, "learning_rate": 9.481949018572379e-06, "loss": 0.9213, "step": 7408 }, { "epoch": 0.17, "learning_rate": 9.481782530945265e-06, "loss": 0.7839, "step": 7409 }, { "epoch": 0.17, "learning_rate": 9.481616018032238e-06, "loss": 0.9823, "step": 7410 }, { "epoch": 0.17, "learning_rate": 9.48144947983424e-06, "loss": 0.9004, "step": 7411 }, { "epoch": 0.17, "learning_rate": 9.481282916352209e-06, "loss": 0.9702, "step": 7412 }, { "epoch": 0.17, "learning_rate": 9.481116327587082e-06, "loss": 0.9919, "step": 7413 }, { "epoch": 0.17, "learning_rate": 9.480949713539803e-06, "loss": 1.0766, "step": 7414 }, { "epoch": 0.17, "learning_rate": 9.48078307421131e-06, "loss": 0.7758, "step": 7415 }, { "epoch": 0.17, "learning_rate": 9.480616409602545e-06, "loss": 1.1903, "step": 7416 }, { "epoch": 0.17, "learning_rate": 9.480449719714446e-06, "loss": 1.1455, "step": 7417 }, { "epoch": 0.17, "learning_rate": 9.480283004547954e-06, "loss": 1.2077, "step": 7418 }, { "epoch": 0.17, "learning_rate": 9.48011626410401e-06, "loss": 0.9269, "step": 7419 }, { "epoch": 0.17, "learning_rate": 9.479949498383555e-06, "loss": 1.3778, "step": 7420 }, { "epoch": 0.17, "learning_rate": 9.479782707387532e-06, "loss": 0.9172, "step": 7421 }, { "epoch": 0.17, "learning_rate": 9.479615891116878e-06, "loss": 0.9347, "step": 7422 }, { "epoch": 0.17, "learning_rate": 9.479449049572536e-06, "loss": 0.9317, "step": 7423 }, { "epoch": 0.17, "learning_rate": 9.479282182755446e-06, "loss": 1.1466, "step": 7424 }, { "epoch": 0.17, "learning_rate": 9.479115290666552e-06, "loss": 1.0543, "step": 7425 }, { "epoch": 0.17, "learning_rate": 9.478948373306793e-06, "loss": 1.2748, "step": 7426 }, { "epoch": 0.17, "learning_rate": 9.478781430677112e-06, "loss": 0.9636, "step": 7427 }, { "epoch": 0.17, "learning_rate": 9.47861446277845e-06, "loss": 0.8103, "step": 7428 }, { "epoch": 0.17, "learning_rate": 9.478447469611752e-06, "loss": 0.9528, "step": 7429 }, { "epoch": 0.17, "learning_rate": 9.478280451177958e-06, "loss": 1.18, "step": 7430 }, { "epoch": 0.17, "learning_rate": 9.478113407478009e-06, "loss": 0.9637, "step": 7431 }, { "epoch": 0.17, "learning_rate": 9.477946338512848e-06, "loss": 1.0501, "step": 7432 }, { "epoch": 0.17, "learning_rate": 9.477779244283421e-06, "loss": 1.178, "step": 7433 }, { "epoch": 0.17, "learning_rate": 9.477612124790667e-06, "loss": 0.9369, "step": 7434 }, { "epoch": 0.17, "learning_rate": 9.47744498003553e-06, "loss": 0.9929, "step": 7435 }, { "epoch": 0.17, "learning_rate": 9.477277810018953e-06, "loss": 0.9918, "step": 7436 }, { "epoch": 0.17, "learning_rate": 9.477110614741878e-06, "loss": 1.018, "step": 7437 }, { "epoch": 0.17, "learning_rate": 9.476943394205249e-06, "loss": 1.0692, "step": 7438 }, { "epoch": 0.17, "learning_rate": 9.476776148410011e-06, "loss": 1.091, "step": 7439 }, { "epoch": 0.17, "learning_rate": 9.476608877357108e-06, "loss": 0.936, "step": 7440 }, { "epoch": 0.17, "learning_rate": 9.47644158104748e-06, "loss": 0.9926, "step": 7441 }, { "epoch": 0.17, "learning_rate": 9.476274259482074e-06, "loss": 0.9451, "step": 7442 }, { "epoch": 0.17, "learning_rate": 9.476106912661833e-06, "loss": 0.9273, "step": 7443 }, { "epoch": 0.17, "learning_rate": 9.475939540587701e-06, "loss": 0.8656, "step": 7444 }, { "epoch": 0.17, "learning_rate": 9.475772143260624e-06, "loss": 1.0854, "step": 7445 }, { "epoch": 0.17, "learning_rate": 9.475604720681543e-06, "loss": 1.1845, "step": 7446 }, { "epoch": 0.17, "learning_rate": 9.475437272851405e-06, "loss": 1.0886, "step": 7447 }, { "epoch": 0.17, "learning_rate": 9.475269799771156e-06, "loss": 1.0021, "step": 7448 }, { "epoch": 0.17, "learning_rate": 9.475102301441737e-06, "loss": 0.9457, "step": 7449 }, { "epoch": 0.17, "learning_rate": 9.474934777864096e-06, "loss": 0.8044, "step": 7450 }, { "epoch": 0.17, "learning_rate": 9.474767229039177e-06, "loss": 1.0311, "step": 7451 }, { "epoch": 0.17, "learning_rate": 9.474599654967926e-06, "loss": 0.988, "step": 7452 }, { "epoch": 0.17, "learning_rate": 9.474432055651289e-06, "loss": 0.9834, "step": 7453 }, { "epoch": 0.17, "learning_rate": 9.47426443109021e-06, "loss": 1.2874, "step": 7454 }, { "epoch": 0.17, "learning_rate": 9.474096781285635e-06, "loss": 0.8911, "step": 7455 }, { "epoch": 0.17, "learning_rate": 9.473929106238511e-06, "loss": 1.0104, "step": 7456 }, { "epoch": 0.17, "learning_rate": 9.473761405949783e-06, "loss": 0.9579, "step": 7457 }, { "epoch": 0.17, "learning_rate": 9.473593680420397e-06, "loss": 1.026, "step": 7458 }, { "epoch": 0.17, "learning_rate": 9.4734259296513e-06, "loss": 0.9895, "step": 7459 }, { "epoch": 0.17, "learning_rate": 9.473258153643438e-06, "loss": 1.166, "step": 7460 }, { "epoch": 0.17, "learning_rate": 9.47309035239776e-06, "loss": 1.119, "step": 7461 }, { "epoch": 0.17, "learning_rate": 9.472922525915209e-06, "loss": 1.0537, "step": 7462 }, { "epoch": 0.17, "learning_rate": 9.472754674196731e-06, "loss": 1.0946, "step": 7463 }, { "epoch": 0.17, "learning_rate": 9.472586797243278e-06, "loss": 1.0483, "step": 7464 }, { "epoch": 0.17, "learning_rate": 9.472418895055794e-06, "loss": 1.0461, "step": 7465 }, { "epoch": 0.17, "learning_rate": 9.472250967635227e-06, "loss": 0.9832, "step": 7466 }, { "epoch": 0.17, "learning_rate": 9.472083014982524e-06, "loss": 0.9514, "step": 7467 }, { "epoch": 0.17, "learning_rate": 9.471915037098633e-06, "loss": 1.1411, "step": 7468 }, { "epoch": 0.17, "learning_rate": 9.471747033984501e-06, "loss": 0.8688, "step": 7469 }, { "epoch": 0.17, "learning_rate": 9.471579005641077e-06, "loss": 1.0178, "step": 7470 }, { "epoch": 0.17, "learning_rate": 9.471410952069308e-06, "loss": 1.0364, "step": 7471 }, { "epoch": 0.17, "learning_rate": 9.471242873270142e-06, "loss": 1.0014, "step": 7472 }, { "epoch": 0.17, "learning_rate": 9.471074769244528e-06, "loss": 0.9487, "step": 7473 }, { "epoch": 0.17, "learning_rate": 9.470906639993415e-06, "loss": 0.7695, "step": 7474 }, { "epoch": 0.17, "learning_rate": 9.47073848551775e-06, "loss": 0.9214, "step": 7475 }, { "epoch": 0.17, "learning_rate": 9.470570305818484e-06, "loss": 1.0886, "step": 7476 }, { "epoch": 0.17, "learning_rate": 9.470402100896564e-06, "loss": 1.0467, "step": 7477 }, { "epoch": 0.17, "learning_rate": 9.47023387075294e-06, "loss": 1.2035, "step": 7478 }, { "epoch": 0.17, "learning_rate": 9.470065615388559e-06, "loss": 1.1849, "step": 7479 }, { "epoch": 0.17, "learning_rate": 9.469897334804373e-06, "loss": 1.001, "step": 7480 }, { "epoch": 0.17, "learning_rate": 9.469729029001328e-06, "loss": 0.8968, "step": 7481 }, { "epoch": 0.17, "learning_rate": 9.469560697980377e-06, "loss": 0.7723, "step": 7482 }, { "epoch": 0.17, "learning_rate": 9.46939234174247e-06, "loss": 0.9851, "step": 7483 }, { "epoch": 0.17, "learning_rate": 9.469223960288556e-06, "loss": 1.4181, "step": 7484 }, { "epoch": 0.17, "learning_rate": 9.469055553619581e-06, "loss": 0.984, "step": 7485 }, { "epoch": 0.17, "learning_rate": 9.468887121736501e-06, "loss": 1.0924, "step": 7486 }, { "epoch": 0.17, "learning_rate": 9.468718664640264e-06, "loss": 0.9786, "step": 7487 }, { "epoch": 0.17, "learning_rate": 9.468550182331819e-06, "loss": 0.9801, "step": 7488 }, { "epoch": 0.17, "learning_rate": 9.46838167481212e-06, "loss": 1.0322, "step": 7489 }, { "epoch": 0.17, "learning_rate": 9.468213142082114e-06, "loss": 1.079, "step": 7490 }, { "epoch": 0.17, "learning_rate": 9.468044584142752e-06, "loss": 1.0258, "step": 7491 }, { "epoch": 0.17, "learning_rate": 9.467876000994988e-06, "loss": 1.0206, "step": 7492 }, { "epoch": 0.17, "learning_rate": 9.467707392639771e-06, "loss": 0.9545, "step": 7493 }, { "epoch": 0.17, "learning_rate": 9.467538759078053e-06, "loss": 0.9365, "step": 7494 }, { "epoch": 0.17, "learning_rate": 9.467370100310786e-06, "loss": 0.9776, "step": 7495 }, { "epoch": 0.17, "learning_rate": 9.46720141633892e-06, "loss": 0.8849, "step": 7496 }, { "epoch": 0.17, "learning_rate": 9.467032707163407e-06, "loss": 1.2227, "step": 7497 }, { "epoch": 0.17, "learning_rate": 9.466863972785201e-06, "loss": 1.0289, "step": 7498 }, { "epoch": 0.17, "learning_rate": 9.46669521320525e-06, "loss": 0.8344, "step": 7499 }, { "epoch": 0.17, "learning_rate": 9.466526428424509e-06, "loss": 1.0156, "step": 7500 }, { "epoch": 0.17, "learning_rate": 9.46635761844393e-06, "loss": 0.7891, "step": 7501 }, { "epoch": 0.17, "learning_rate": 9.466188783264466e-06, "loss": 1.2053, "step": 7502 }, { "epoch": 0.17, "learning_rate": 9.46601992288707e-06, "loss": 0.9548, "step": 7503 }, { "epoch": 0.17, "learning_rate": 9.46585103731269e-06, "loss": 0.8623, "step": 7504 }, { "epoch": 0.17, "learning_rate": 9.465682126542284e-06, "loss": 1.038, "step": 7505 }, { "epoch": 0.17, "learning_rate": 9.465513190576802e-06, "loss": 1.3261, "step": 7506 }, { "epoch": 0.17, "learning_rate": 9.4653442294172e-06, "loss": 0.8721, "step": 7507 }, { "epoch": 0.17, "learning_rate": 9.465175243064428e-06, "loss": 0.9598, "step": 7508 }, { "epoch": 0.17, "learning_rate": 9.46500623151944e-06, "loss": 1.0586, "step": 7509 }, { "epoch": 0.17, "learning_rate": 9.464837194783194e-06, "loss": 1.0273, "step": 7510 }, { "epoch": 0.17, "learning_rate": 9.464668132856639e-06, "loss": 1.1362, "step": 7511 }, { "epoch": 0.17, "learning_rate": 9.464499045740729e-06, "loss": 1.0009, "step": 7512 }, { "epoch": 0.17, "learning_rate": 9.46432993343642e-06, "loss": 0.7269, "step": 7513 }, { "epoch": 0.17, "learning_rate": 9.464160795944664e-06, "loss": 0.9094, "step": 7514 }, { "epoch": 0.17, "learning_rate": 9.463991633266419e-06, "loss": 0.8775, "step": 7515 }, { "epoch": 0.17, "learning_rate": 9.463822445402634e-06, "loss": 1.0434, "step": 7516 }, { "epoch": 0.17, "learning_rate": 9.463653232354267e-06, "loss": 0.7668, "step": 7517 }, { "epoch": 0.17, "learning_rate": 9.463483994122274e-06, "loss": 0.9373, "step": 7518 }, { "epoch": 0.17, "learning_rate": 9.463314730707605e-06, "loss": 1.1247, "step": 7519 }, { "epoch": 0.17, "learning_rate": 9.463145442111221e-06, "loss": 0.8723, "step": 7520 }, { "epoch": 0.17, "learning_rate": 9.462976128334072e-06, "loss": 1.1952, "step": 7521 }, { "epoch": 0.17, "learning_rate": 9.462806789377115e-06, "loss": 0.7018, "step": 7522 }, { "epoch": 0.17, "learning_rate": 9.462637425241305e-06, "loss": 0.9875, "step": 7523 }, { "epoch": 0.17, "learning_rate": 9.4624680359276e-06, "loss": 0.8554, "step": 7524 }, { "epoch": 0.17, "learning_rate": 9.462298621436954e-06, "loss": 0.7515, "step": 7525 }, { "epoch": 0.17, "learning_rate": 9.462129181770323e-06, "loss": 0.8391, "step": 7526 }, { "epoch": 0.17, "learning_rate": 9.461959716928661e-06, "loss": 1.3076, "step": 7527 }, { "epoch": 0.17, "learning_rate": 9.461790226912926e-06, "loss": 0.9626, "step": 7528 }, { "epoch": 0.17, "learning_rate": 9.461620711724075e-06, "loss": 0.8956, "step": 7529 }, { "epoch": 0.17, "learning_rate": 9.461451171363063e-06, "loss": 0.8625, "step": 7530 }, { "epoch": 0.17, "learning_rate": 9.461281605830847e-06, "loss": 1.0253, "step": 7531 }, { "epoch": 0.17, "learning_rate": 9.461112015128384e-06, "loss": 1.0553, "step": 7532 }, { "epoch": 0.17, "learning_rate": 9.46094239925663e-06, "loss": 0.8276, "step": 7533 }, { "epoch": 0.17, "learning_rate": 9.460772758216543e-06, "loss": 1.0548, "step": 7534 }, { "epoch": 0.17, "learning_rate": 9.460603092009078e-06, "loss": 1.0553, "step": 7535 }, { "epoch": 0.17, "learning_rate": 9.460433400635195e-06, "loss": 0.9612, "step": 7536 }, { "epoch": 0.17, "learning_rate": 9.46026368409585e-06, "loss": 1.207, "step": 7537 }, { "epoch": 0.17, "learning_rate": 9.460093942392001e-06, "loss": 0.9215, "step": 7538 }, { "epoch": 0.17, "learning_rate": 9.459924175524605e-06, "loss": 0.9926, "step": 7539 }, { "epoch": 0.17, "learning_rate": 9.459754383494619e-06, "loss": 1.0712, "step": 7540 }, { "epoch": 0.17, "learning_rate": 9.459584566303004e-06, "loss": 1.3871, "step": 7541 }, { "epoch": 0.17, "learning_rate": 9.459414723950715e-06, "loss": 1.1552, "step": 7542 }, { "epoch": 0.17, "learning_rate": 9.459244856438712e-06, "loss": 0.9244, "step": 7543 }, { "epoch": 0.17, "learning_rate": 9.459074963767953e-06, "loss": 0.8703, "step": 7544 }, { "epoch": 0.17, "learning_rate": 9.458905045939397e-06, "loss": 0.9389, "step": 7545 }, { "epoch": 0.18, "learning_rate": 9.458735102953999e-06, "loss": 0.7797, "step": 7546 }, { "epoch": 0.18, "learning_rate": 9.458565134812724e-06, "loss": 1.0696, "step": 7547 }, { "epoch": 0.18, "learning_rate": 9.458395141516527e-06, "loss": 0.9105, "step": 7548 }, { "epoch": 0.18, "learning_rate": 9.458225123066368e-06, "loss": 1.0523, "step": 7549 }, { "epoch": 0.18, "learning_rate": 9.458055079463205e-06, "loss": 0.8923, "step": 7550 }, { "epoch": 0.18, "learning_rate": 9.457885010708e-06, "loss": 1.3705, "step": 7551 }, { "epoch": 0.18, "learning_rate": 9.45771491680171e-06, "loss": 1.0701, "step": 7552 }, { "epoch": 0.18, "learning_rate": 9.457544797745295e-06, "loss": 1.175, "step": 7553 }, { "epoch": 0.18, "learning_rate": 9.457374653539716e-06, "loss": 1.1687, "step": 7554 }, { "epoch": 0.18, "learning_rate": 9.457204484185933e-06, "loss": 0.9317, "step": 7555 }, { "epoch": 0.18, "learning_rate": 9.457034289684906e-06, "loss": 1.1196, "step": 7556 }, { "epoch": 0.18, "learning_rate": 9.456864070037594e-06, "loss": 0.9789, "step": 7557 }, { "epoch": 0.18, "learning_rate": 9.456693825244957e-06, "loss": 0.8628, "step": 7558 }, { "epoch": 0.18, "learning_rate": 9.456523555307957e-06, "loss": 1.2056, "step": 7559 }, { "epoch": 0.18, "learning_rate": 9.456353260227555e-06, "loss": 0.9645, "step": 7560 }, { "epoch": 0.18, "learning_rate": 9.456182940004712e-06, "loss": 0.8542, "step": 7561 }, { "epoch": 0.18, "learning_rate": 9.456012594640387e-06, "loss": 0.9141, "step": 7562 }, { "epoch": 0.18, "learning_rate": 9.455842224135541e-06, "loss": 0.8901, "step": 7563 }, { "epoch": 0.18, "learning_rate": 9.455671828491137e-06, "loss": 1.0827, "step": 7564 }, { "epoch": 0.18, "learning_rate": 9.455501407708136e-06, "loss": 0.9208, "step": 7565 }, { "epoch": 0.18, "learning_rate": 9.455330961787498e-06, "loss": 1.1573, "step": 7566 }, { "epoch": 0.18, "learning_rate": 9.455160490730187e-06, "loss": 0.9324, "step": 7567 }, { "epoch": 0.18, "learning_rate": 9.454989994537164e-06, "loss": 1.2486, "step": 7568 }, { "epoch": 0.18, "learning_rate": 9.45481947320939e-06, "loss": 1.0785, "step": 7569 }, { "epoch": 0.18, "learning_rate": 9.454648926747827e-06, "loss": 0.8719, "step": 7570 }, { "epoch": 0.18, "learning_rate": 9.454478355153438e-06, "loss": 0.9927, "step": 7571 }, { "epoch": 0.18, "learning_rate": 9.454307758427183e-06, "loss": 1.1715, "step": 7572 }, { "epoch": 0.18, "learning_rate": 9.45413713657003e-06, "loss": 1.0652, "step": 7573 }, { "epoch": 0.18, "learning_rate": 9.453966489582938e-06, "loss": 0.9435, "step": 7574 }, { "epoch": 0.18, "learning_rate": 9.453795817466868e-06, "loss": 1.2301, "step": 7575 }, { "epoch": 0.18, "learning_rate": 9.453625120222785e-06, "loss": 1.2247, "step": 7576 }, { "epoch": 0.18, "learning_rate": 9.453454397851654e-06, "loss": 1.1901, "step": 7577 }, { "epoch": 0.18, "learning_rate": 9.453283650354435e-06, "loss": 1.2614, "step": 7578 }, { "epoch": 0.18, "learning_rate": 9.453112877732092e-06, "loss": 1.0922, "step": 7579 }, { "epoch": 0.18, "learning_rate": 9.45294207998559e-06, "loss": 1.0777, "step": 7580 }, { "epoch": 0.18, "learning_rate": 9.452771257115892e-06, "loss": 1.0336, "step": 7581 }, { "epoch": 0.18, "learning_rate": 9.452600409123959e-06, "loss": 1.1984, "step": 7582 }, { "epoch": 0.18, "learning_rate": 9.45242953601076e-06, "loss": 0.8938, "step": 7583 }, { "epoch": 0.18, "learning_rate": 9.452258637777257e-06, "loss": 1.036, "step": 7584 }, { "epoch": 0.18, "learning_rate": 9.452087714424412e-06, "loss": 1.0661, "step": 7585 }, { "epoch": 0.18, "learning_rate": 9.45191676595319e-06, "loss": 0.8045, "step": 7586 }, { "epoch": 0.18, "learning_rate": 9.451745792364558e-06, "loss": 1.161, "step": 7587 }, { "epoch": 0.18, "learning_rate": 9.451574793659478e-06, "loss": 0.926, "step": 7588 }, { "epoch": 0.18, "learning_rate": 9.451403769838917e-06, "loss": 0.9153, "step": 7589 }, { "epoch": 0.18, "learning_rate": 9.451232720903839e-06, "loss": 1.3569, "step": 7590 }, { "epoch": 0.18, "learning_rate": 9.451061646855206e-06, "loss": 1.0692, "step": 7591 }, { "epoch": 0.18, "learning_rate": 9.45089054769399e-06, "loss": 0.9561, "step": 7592 }, { "epoch": 0.18, "learning_rate": 9.450719423421148e-06, "loss": 1.1286, "step": 7593 }, { "epoch": 0.18, "learning_rate": 9.450548274037652e-06, "loss": 0.9273, "step": 7594 }, { "epoch": 0.18, "learning_rate": 9.450377099544466e-06, "loss": 1.1567, "step": 7595 }, { "epoch": 0.18, "learning_rate": 9.450205899942555e-06, "loss": 1.0051, "step": 7596 }, { "epoch": 0.18, "learning_rate": 9.450034675232884e-06, "loss": 0.8654, "step": 7597 }, { "epoch": 0.18, "learning_rate": 9.44986342541642e-06, "loss": 0.9554, "step": 7598 }, { "epoch": 0.18, "learning_rate": 9.44969215049413e-06, "loss": 1.0405, "step": 7599 }, { "epoch": 0.18, "learning_rate": 9.44952085046698e-06, "loss": 0.9737, "step": 7600 }, { "epoch": 0.18, "learning_rate": 9.449349525335934e-06, "loss": 1.0447, "step": 7601 }, { "epoch": 0.18, "learning_rate": 9.449178175101964e-06, "loss": 1.0594, "step": 7602 }, { "epoch": 0.18, "learning_rate": 9.449006799766029e-06, "loss": 1.0518, "step": 7603 }, { "epoch": 0.18, "learning_rate": 9.448835399329103e-06, "loss": 1.1978, "step": 7604 }, { "epoch": 0.18, "learning_rate": 9.44866397379215e-06, "loss": 1.0634, "step": 7605 }, { "epoch": 0.18, "learning_rate": 9.448492523156138e-06, "loss": 1.0381, "step": 7606 }, { "epoch": 0.18, "learning_rate": 9.448321047422032e-06, "loss": 1.1624, "step": 7607 }, { "epoch": 0.18, "learning_rate": 9.448149546590802e-06, "loss": 0.9598, "step": 7608 }, { "epoch": 0.18, "learning_rate": 9.447978020663416e-06, "loss": 0.687, "step": 7609 }, { "epoch": 0.18, "learning_rate": 9.447806469640839e-06, "loss": 0.9046, "step": 7610 }, { "epoch": 0.18, "learning_rate": 9.447634893524042e-06, "loss": 0.934, "step": 7611 }, { "epoch": 0.18, "learning_rate": 9.44746329231399e-06, "loss": 0.953, "step": 7612 }, { "epoch": 0.18, "learning_rate": 9.447291666011653e-06, "loss": 1.0204, "step": 7613 }, { "epoch": 0.18, "learning_rate": 9.447120014618e-06, "loss": 0.9685, "step": 7614 }, { "epoch": 0.18, "learning_rate": 9.446948338133996e-06, "loss": 0.9522, "step": 7615 }, { "epoch": 0.18, "learning_rate": 9.446776636560613e-06, "loss": 1.0958, "step": 7616 }, { "epoch": 0.18, "learning_rate": 9.44660490989882e-06, "loss": 1.0295, "step": 7617 }, { "epoch": 0.18, "learning_rate": 9.446433158149584e-06, "loss": 0.9411, "step": 7618 }, { "epoch": 0.18, "learning_rate": 9.446261381313875e-06, "loss": 1.1721, "step": 7619 }, { "epoch": 0.18, "learning_rate": 9.44608957939266e-06, "loss": 0.9601, "step": 7620 }, { "epoch": 0.18, "learning_rate": 9.44591775238691e-06, "loss": 1.0859, "step": 7621 }, { "epoch": 0.18, "learning_rate": 9.445745900297596e-06, "loss": 0.9424, "step": 7622 }, { "epoch": 0.18, "learning_rate": 9.445574023125685e-06, "loss": 1.2493, "step": 7623 }, { "epoch": 0.18, "learning_rate": 9.445402120872149e-06, "loss": 0.882, "step": 7624 }, { "epoch": 0.18, "learning_rate": 9.445230193537956e-06, "loss": 0.9408, "step": 7625 }, { "epoch": 0.18, "learning_rate": 9.445058241124077e-06, "loss": 1.0291, "step": 7626 }, { "epoch": 0.18, "learning_rate": 9.444886263631482e-06, "loss": 1.0151, "step": 7627 }, { "epoch": 0.18, "learning_rate": 9.44471426106114e-06, "loss": 1.1759, "step": 7628 }, { "epoch": 0.18, "learning_rate": 9.44454223341402e-06, "loss": 0.9716, "step": 7629 }, { "epoch": 0.18, "learning_rate": 9.444370180691098e-06, "loss": 1.1311, "step": 7630 }, { "epoch": 0.18, "learning_rate": 9.444198102893342e-06, "loss": 0.971, "step": 7631 }, { "epoch": 0.18, "learning_rate": 9.444026000021722e-06, "loss": 1.159, "step": 7632 }, { "epoch": 0.18, "learning_rate": 9.44385387207721e-06, "loss": 1.255, "step": 7633 }, { "epoch": 0.18, "learning_rate": 9.443681719060777e-06, "loss": 0.7783, "step": 7634 }, { "epoch": 0.18, "learning_rate": 9.443509540973392e-06, "loss": 0.9476, "step": 7635 }, { "epoch": 0.18, "learning_rate": 9.44333733781603e-06, "loss": 1.1252, "step": 7636 }, { "epoch": 0.18, "learning_rate": 9.443165109589662e-06, "loss": 1.0841, "step": 7637 }, { "epoch": 0.18, "learning_rate": 9.442992856295257e-06, "loss": 1.1196, "step": 7638 }, { "epoch": 0.18, "learning_rate": 9.442820577933789e-06, "loss": 0.9266, "step": 7639 }, { "epoch": 0.18, "learning_rate": 9.44264827450623e-06, "loss": 0.8493, "step": 7640 }, { "epoch": 0.18, "learning_rate": 9.442475946013551e-06, "loss": 1.1507, "step": 7641 }, { "epoch": 0.18, "learning_rate": 9.442303592456725e-06, "loss": 1.1011, "step": 7642 }, { "epoch": 0.18, "learning_rate": 9.442131213836724e-06, "loss": 1.2648, "step": 7643 }, { "epoch": 0.18, "learning_rate": 9.44195881015452e-06, "loss": 0.8079, "step": 7644 }, { "epoch": 0.18, "learning_rate": 9.44178638141109e-06, "loss": 1.0528, "step": 7645 }, { "epoch": 0.18, "learning_rate": 9.4416139276074e-06, "loss": 0.7601, "step": 7646 }, { "epoch": 0.18, "learning_rate": 9.441441448744428e-06, "loss": 0.7877, "step": 7647 }, { "epoch": 0.18, "learning_rate": 9.441268944823145e-06, "loss": 1.0603, "step": 7648 }, { "epoch": 0.18, "learning_rate": 9.441096415844524e-06, "loss": 1.1842, "step": 7649 }, { "epoch": 0.18, "learning_rate": 9.44092386180954e-06, "loss": 0.8289, "step": 7650 }, { "epoch": 0.18, "learning_rate": 9.440751282719164e-06, "loss": 1.0398, "step": 7651 }, { "epoch": 0.18, "learning_rate": 9.440578678574373e-06, "loss": 1.0387, "step": 7652 }, { "epoch": 0.18, "learning_rate": 9.440406049376139e-06, "loss": 1.1632, "step": 7653 }, { "epoch": 0.18, "learning_rate": 9.440233395125435e-06, "loss": 1.1614, "step": 7654 }, { "epoch": 0.18, "learning_rate": 9.440060715823238e-06, "loss": 0.8794, "step": 7655 }, { "epoch": 0.18, "learning_rate": 9.43988801147052e-06, "loss": 0.8603, "step": 7656 }, { "epoch": 0.18, "learning_rate": 9.439715282068255e-06, "loss": 1.1353, "step": 7657 }, { "epoch": 0.18, "learning_rate": 9.439542527617417e-06, "loss": 0.9236, "step": 7658 }, { "epoch": 0.18, "learning_rate": 9.439369748118984e-06, "loss": 1.0677, "step": 7659 }, { "epoch": 0.18, "learning_rate": 9.439196943573929e-06, "loss": 0.9476, "step": 7660 }, { "epoch": 0.18, "learning_rate": 9.439024113983228e-06, "loss": 1.0689, "step": 7661 }, { "epoch": 0.18, "learning_rate": 9.438851259347853e-06, "loss": 0.9123, "step": 7662 }, { "epoch": 0.18, "learning_rate": 9.438678379668781e-06, "loss": 1.159, "step": 7663 }, { "epoch": 0.18, "learning_rate": 9.43850547494699e-06, "loss": 1.0665, "step": 7664 }, { "epoch": 0.18, "learning_rate": 9.43833254518345e-06, "loss": 1.1122, "step": 7665 }, { "epoch": 0.18, "learning_rate": 9.43815959037914e-06, "loss": 1.0661, "step": 7666 }, { "epoch": 0.18, "learning_rate": 9.437986610535036e-06, "loss": 0.8675, "step": 7667 }, { "epoch": 0.18, "learning_rate": 9.437813605652114e-06, "loss": 0.8204, "step": 7668 }, { "epoch": 0.18, "learning_rate": 9.437640575731349e-06, "loss": 0.9313, "step": 7669 }, { "epoch": 0.18, "learning_rate": 9.437467520773717e-06, "loss": 1.0933, "step": 7670 }, { "epoch": 0.18, "learning_rate": 9.437294440780197e-06, "loss": 0.9951, "step": 7671 }, { "epoch": 0.18, "learning_rate": 9.437121335751762e-06, "loss": 0.8129, "step": 7672 }, { "epoch": 0.18, "learning_rate": 9.43694820568939e-06, "loss": 1.1899, "step": 7673 }, { "epoch": 0.18, "learning_rate": 9.436775050594058e-06, "loss": 1.1792, "step": 7674 }, { "epoch": 0.18, "learning_rate": 9.436601870466744e-06, "loss": 0.8399, "step": 7675 }, { "epoch": 0.18, "learning_rate": 9.436428665308423e-06, "loss": 1.0734, "step": 7676 }, { "epoch": 0.18, "learning_rate": 9.436255435120075e-06, "loss": 0.9195, "step": 7677 }, { "epoch": 0.18, "learning_rate": 9.436082179902675e-06, "loss": 1.1827, "step": 7678 }, { "epoch": 0.18, "learning_rate": 9.435908899657201e-06, "loss": 1.2294, "step": 7679 }, { "epoch": 0.18, "learning_rate": 9.43573559438463e-06, "loss": 1.2811, "step": 7680 }, { "epoch": 0.18, "learning_rate": 9.43556226408594e-06, "loss": 1.0138, "step": 7681 }, { "epoch": 0.18, "learning_rate": 9.435388908762111e-06, "loss": 1.1736, "step": 7682 }, { "epoch": 0.18, "learning_rate": 9.435215528414118e-06, "loss": 0.9788, "step": 7683 }, { "epoch": 0.18, "learning_rate": 9.435042123042942e-06, "loss": 0.9052, "step": 7684 }, { "epoch": 0.18, "learning_rate": 9.434868692649559e-06, "loss": 1.062, "step": 7685 }, { "epoch": 0.18, "learning_rate": 9.43469523723495e-06, "loss": 0.948, "step": 7686 }, { "epoch": 0.18, "learning_rate": 9.434521756800091e-06, "loss": 1.0307, "step": 7687 }, { "epoch": 0.18, "learning_rate": 9.43434825134596e-06, "loss": 0.9206, "step": 7688 }, { "epoch": 0.18, "learning_rate": 9.43417472087354e-06, "loss": 1.0171, "step": 7689 }, { "epoch": 0.18, "learning_rate": 9.434001165383809e-06, "loss": 0.942, "step": 7690 }, { "epoch": 0.18, "learning_rate": 9.433827584877742e-06, "loss": 1.0464, "step": 7691 }, { "epoch": 0.18, "learning_rate": 9.433653979356323e-06, "loss": 0.7367, "step": 7692 }, { "epoch": 0.18, "learning_rate": 9.43348034882053e-06, "loss": 1.0234, "step": 7693 }, { "epoch": 0.18, "learning_rate": 9.433306693271342e-06, "loss": 0.9565, "step": 7694 }, { "epoch": 0.18, "learning_rate": 9.43313301270974e-06, "loss": 1.1514, "step": 7695 }, { "epoch": 0.18, "learning_rate": 9.432959307136702e-06, "loss": 0.8674, "step": 7696 }, { "epoch": 0.18, "learning_rate": 9.432785576553209e-06, "loss": 0.9475, "step": 7697 }, { "epoch": 0.18, "learning_rate": 9.432611820960242e-06, "loss": 1.0479, "step": 7698 }, { "epoch": 0.18, "learning_rate": 9.43243804035878e-06, "loss": 1.1014, "step": 7699 }, { "epoch": 0.18, "learning_rate": 9.432264234749805e-06, "loss": 1.1107, "step": 7700 }, { "epoch": 0.18, "learning_rate": 9.432090404134296e-06, "loss": 1.2964, "step": 7701 }, { "epoch": 0.18, "learning_rate": 9.431916548513236e-06, "loss": 0.8732, "step": 7702 }, { "epoch": 0.18, "learning_rate": 9.431742667887603e-06, "loss": 1.0202, "step": 7703 }, { "epoch": 0.18, "learning_rate": 9.431568762258379e-06, "loss": 0.9979, "step": 7704 }, { "epoch": 0.18, "learning_rate": 9.431394831626546e-06, "loss": 0.7837, "step": 7705 }, { "epoch": 0.18, "learning_rate": 9.431220875993083e-06, "loss": 1.2276, "step": 7706 }, { "epoch": 0.18, "learning_rate": 9.431046895358975e-06, "loss": 0.8974, "step": 7707 }, { "epoch": 0.18, "learning_rate": 9.430872889725202e-06, "loss": 1.0662, "step": 7708 }, { "epoch": 0.18, "learning_rate": 9.430698859092745e-06, "loss": 1.1107, "step": 7709 }, { "epoch": 0.18, "learning_rate": 9.430524803462587e-06, "loss": 0.9664, "step": 7710 }, { "epoch": 0.18, "learning_rate": 9.430350722835708e-06, "loss": 0.8988, "step": 7711 }, { "epoch": 0.18, "learning_rate": 9.430176617213092e-06, "loss": 1.0027, "step": 7712 }, { "epoch": 0.18, "learning_rate": 9.430002486595722e-06, "loss": 1.0815, "step": 7713 }, { "epoch": 0.18, "learning_rate": 9.42982833098458e-06, "loss": 1.1572, "step": 7714 }, { "epoch": 0.18, "learning_rate": 9.429654150380645e-06, "loss": 1.0037, "step": 7715 }, { "epoch": 0.18, "learning_rate": 9.429479944784906e-06, "loss": 0.9685, "step": 7716 }, { "epoch": 0.18, "learning_rate": 9.429305714198339e-06, "loss": 1.0015, "step": 7717 }, { "epoch": 0.18, "learning_rate": 9.429131458621931e-06, "loss": 1.1463, "step": 7718 }, { "epoch": 0.18, "learning_rate": 9.428957178056668e-06, "loss": 1.1747, "step": 7719 }, { "epoch": 0.18, "learning_rate": 9.428782872503525e-06, "loss": 1.0967, "step": 7720 }, { "epoch": 0.18, "learning_rate": 9.428608541963493e-06, "loss": 0.8042, "step": 7721 }, { "epoch": 0.18, "learning_rate": 9.428434186437555e-06, "loss": 0.9347, "step": 7722 }, { "epoch": 0.18, "learning_rate": 9.428259805926688e-06, "loss": 1.1244, "step": 7723 }, { "epoch": 0.18, "learning_rate": 9.428085400431883e-06, "loss": 0.9367, "step": 7724 }, { "epoch": 0.18, "learning_rate": 9.427910969954122e-06, "loss": 0.8281, "step": 7725 }, { "epoch": 0.18, "learning_rate": 9.427736514494385e-06, "loss": 1.1691, "step": 7726 }, { "epoch": 0.18, "learning_rate": 9.427562034053664e-06, "loss": 1.1104, "step": 7727 }, { "epoch": 0.18, "learning_rate": 9.427387528632937e-06, "loss": 1.0744, "step": 7728 }, { "epoch": 0.18, "learning_rate": 9.42721299823319e-06, "loss": 0.7723, "step": 7729 }, { "epoch": 0.18, "learning_rate": 9.42703844285541e-06, "loss": 1.0942, "step": 7730 }, { "epoch": 0.18, "learning_rate": 9.426863862500579e-06, "loss": 1.155, "step": 7731 }, { "epoch": 0.18, "learning_rate": 9.426689257169685e-06, "loss": 1.2073, "step": 7732 }, { "epoch": 0.18, "learning_rate": 9.426514626863709e-06, "loss": 1.0773, "step": 7733 }, { "epoch": 0.18, "learning_rate": 9.42633997158364e-06, "loss": 1.1576, "step": 7734 }, { "epoch": 0.18, "learning_rate": 9.426165291330462e-06, "loss": 1.0043, "step": 7735 }, { "epoch": 0.18, "learning_rate": 9.42599058610516e-06, "loss": 0.9242, "step": 7736 }, { "epoch": 0.18, "learning_rate": 9.42581585590872e-06, "loss": 0.9406, "step": 7737 }, { "epoch": 0.18, "learning_rate": 9.425641100742128e-06, "loss": 0.7718, "step": 7738 }, { "epoch": 0.18, "learning_rate": 9.425466320606372e-06, "loss": 1.0072, "step": 7739 }, { "epoch": 0.18, "learning_rate": 9.425291515502434e-06, "loss": 0.9318, "step": 7740 }, { "epoch": 0.18, "learning_rate": 9.425116685431303e-06, "loss": 0.9117, "step": 7741 }, { "epoch": 0.18, "learning_rate": 9.424941830393963e-06, "loss": 0.9515, "step": 7742 }, { "epoch": 0.18, "learning_rate": 9.424766950391404e-06, "loss": 0.9376, "step": 7743 }, { "epoch": 0.18, "learning_rate": 9.42459204542461e-06, "loss": 0.8988, "step": 7744 }, { "epoch": 0.18, "learning_rate": 9.42441711549457e-06, "loss": 1.069, "step": 7745 }, { "epoch": 0.18, "learning_rate": 9.424242160602268e-06, "loss": 0.9359, "step": 7746 }, { "epoch": 0.18, "learning_rate": 9.424067180748692e-06, "loss": 0.8953, "step": 7747 }, { "epoch": 0.18, "learning_rate": 9.423892175934833e-06, "loss": 1.0851, "step": 7748 }, { "epoch": 0.18, "learning_rate": 9.423717146161673e-06, "loss": 1.0039, "step": 7749 }, { "epoch": 0.18, "learning_rate": 9.4235420914302e-06, "loss": 1.0276, "step": 7750 }, { "epoch": 0.18, "learning_rate": 9.423367011741406e-06, "loss": 1.2235, "step": 7751 }, { "epoch": 0.18, "learning_rate": 9.423191907096276e-06, "loss": 0.8457, "step": 7752 }, { "epoch": 0.18, "learning_rate": 9.4230167774958e-06, "loss": 1.0322, "step": 7753 }, { "epoch": 0.18, "learning_rate": 9.42284162294096e-06, "loss": 1.0599, "step": 7754 }, { "epoch": 0.18, "learning_rate": 9.422666443432752e-06, "loss": 0.9843, "step": 7755 }, { "epoch": 0.18, "learning_rate": 9.422491238972157e-06, "loss": 0.9459, "step": 7756 }, { "epoch": 0.18, "learning_rate": 9.422316009560171e-06, "loss": 1.2116, "step": 7757 }, { "epoch": 0.18, "learning_rate": 9.422140755197778e-06, "loss": 1.0947, "step": 7758 }, { "epoch": 0.18, "learning_rate": 9.421965475885966e-06, "loss": 1.0322, "step": 7759 }, { "epoch": 0.18, "learning_rate": 9.421790171625727e-06, "loss": 1.1046, "step": 7760 }, { "epoch": 0.18, "learning_rate": 9.421614842418047e-06, "loss": 1.0192, "step": 7761 }, { "epoch": 0.18, "learning_rate": 9.421439488263919e-06, "loss": 1.221, "step": 7762 }, { "epoch": 0.18, "learning_rate": 9.421264109164328e-06, "loss": 1.0863, "step": 7763 }, { "epoch": 0.18, "learning_rate": 9.421088705120267e-06, "loss": 1.1527, "step": 7764 }, { "epoch": 0.18, "learning_rate": 9.420913276132724e-06, "loss": 1.001, "step": 7765 }, { "epoch": 0.18, "learning_rate": 9.42073782220269e-06, "loss": 1.028, "step": 7766 }, { "epoch": 0.18, "learning_rate": 9.420562343331153e-06, "loss": 1.1301, "step": 7767 }, { "epoch": 0.18, "learning_rate": 9.420386839519103e-06, "loss": 1.1693, "step": 7768 }, { "epoch": 0.18, "learning_rate": 9.420211310767534e-06, "loss": 0.8978, "step": 7769 }, { "epoch": 0.18, "learning_rate": 9.42003575707743e-06, "loss": 0.836, "step": 7770 }, { "epoch": 0.18, "learning_rate": 9.419860178449786e-06, "loss": 1.0233, "step": 7771 }, { "epoch": 0.18, "learning_rate": 9.419684574885593e-06, "loss": 0.9948, "step": 7772 }, { "epoch": 0.18, "learning_rate": 9.419508946385838e-06, "loss": 1.0103, "step": 7773 }, { "epoch": 0.18, "learning_rate": 9.419333292951515e-06, "loss": 1.2523, "step": 7774 }, { "epoch": 0.18, "learning_rate": 9.419157614583613e-06, "loss": 0.9112, "step": 7775 }, { "epoch": 0.18, "learning_rate": 9.418981911283128e-06, "loss": 1.2302, "step": 7776 }, { "epoch": 0.18, "learning_rate": 9.418806183051045e-06, "loss": 0.9448, "step": 7777 }, { "epoch": 0.18, "learning_rate": 9.418630429888357e-06, "loss": 1.115, "step": 7778 }, { "epoch": 0.18, "learning_rate": 9.41845465179606e-06, "loss": 1.2497, "step": 7779 }, { "epoch": 0.18, "learning_rate": 9.418278848775139e-06, "loss": 0.9523, "step": 7780 }, { "epoch": 0.18, "learning_rate": 9.418103020826592e-06, "loss": 1.0786, "step": 7781 }, { "epoch": 0.18, "learning_rate": 9.417927167951406e-06, "loss": 0.8721, "step": 7782 }, { "epoch": 0.18, "learning_rate": 9.417751290150578e-06, "loss": 0.8751, "step": 7783 }, { "epoch": 0.18, "learning_rate": 9.417575387425095e-06, "loss": 0.8848, "step": 7784 }, { "epoch": 0.18, "learning_rate": 9.417399459775955e-06, "loss": 1.0984, "step": 7785 }, { "epoch": 0.18, "learning_rate": 9.417223507204145e-06, "loss": 0.8062, "step": 7786 }, { "epoch": 0.18, "learning_rate": 9.417047529710661e-06, "loss": 0.939, "step": 7787 }, { "epoch": 0.18, "learning_rate": 9.416871527296496e-06, "loss": 0.9955, "step": 7788 }, { "epoch": 0.18, "learning_rate": 9.416695499962643e-06, "loss": 1.1639, "step": 7789 }, { "epoch": 0.18, "learning_rate": 9.416519447710093e-06, "loss": 1.0816, "step": 7790 }, { "epoch": 0.18, "learning_rate": 9.416343370539842e-06, "loss": 1.0719, "step": 7791 }, { "epoch": 0.18, "learning_rate": 9.41616726845288e-06, "loss": 1.0571, "step": 7792 }, { "epoch": 0.18, "learning_rate": 9.415991141450204e-06, "loss": 0.8453, "step": 7793 }, { "epoch": 0.18, "learning_rate": 9.415814989532807e-06, "loss": 1.0203, "step": 7794 }, { "epoch": 0.18, "learning_rate": 9.415638812701681e-06, "loss": 0.8329, "step": 7795 }, { "epoch": 0.18, "learning_rate": 9.415462610957822e-06, "loss": 0.7712, "step": 7796 }, { "epoch": 0.18, "learning_rate": 9.415286384302222e-06, "loss": 1.0845, "step": 7797 }, { "epoch": 0.18, "learning_rate": 9.415110132735878e-06, "loss": 1.2428, "step": 7798 }, { "epoch": 0.18, "learning_rate": 9.414933856259783e-06, "loss": 1.3501, "step": 7799 }, { "epoch": 0.18, "learning_rate": 9.414757554874932e-06, "loss": 0.9026, "step": 7800 }, { "epoch": 0.18, "learning_rate": 9.414581228582318e-06, "loss": 0.9071, "step": 7801 }, { "epoch": 0.18, "learning_rate": 9.414404877382936e-06, "loss": 0.9211, "step": 7802 }, { "epoch": 0.18, "learning_rate": 9.414228501277783e-06, "loss": 1.1129, "step": 7803 }, { "epoch": 0.18, "learning_rate": 9.414052100267854e-06, "loss": 1.1727, "step": 7804 }, { "epoch": 0.18, "learning_rate": 9.413875674354142e-06, "loss": 1.0602, "step": 7805 }, { "epoch": 0.18, "learning_rate": 9.413699223537644e-06, "loss": 0.8584, "step": 7806 }, { "epoch": 0.18, "learning_rate": 9.413522747819355e-06, "loss": 0.8342, "step": 7807 }, { "epoch": 0.18, "learning_rate": 9.413346247200272e-06, "loss": 1.3574, "step": 7808 }, { "epoch": 0.18, "learning_rate": 9.413169721681389e-06, "loss": 0.9332, "step": 7809 }, { "epoch": 0.18, "learning_rate": 9.412993171263703e-06, "loss": 0.7883, "step": 7810 }, { "epoch": 0.18, "learning_rate": 9.412816595948209e-06, "loss": 1.0533, "step": 7811 }, { "epoch": 0.18, "learning_rate": 9.412639995735904e-06, "loss": 1.1146, "step": 7812 }, { "epoch": 0.18, "learning_rate": 9.412463370627783e-06, "loss": 1.0395, "step": 7813 }, { "epoch": 0.18, "learning_rate": 9.412286720624847e-06, "loss": 0.863, "step": 7814 }, { "epoch": 0.18, "learning_rate": 9.412110045728087e-06, "loss": 0.8368, "step": 7815 }, { "epoch": 0.18, "learning_rate": 9.411933345938502e-06, "loss": 1.0314, "step": 7816 }, { "epoch": 0.18, "learning_rate": 9.411756621257091e-06, "loss": 1.1723, "step": 7817 }, { "epoch": 0.18, "learning_rate": 9.411579871684847e-06, "loss": 0.9025, "step": 7818 }, { "epoch": 0.18, "learning_rate": 9.411403097222771e-06, "loss": 1.1332, "step": 7819 }, { "epoch": 0.18, "learning_rate": 9.411226297871858e-06, "loss": 1.0865, "step": 7820 }, { "epoch": 0.18, "learning_rate": 9.411049473633107e-06, "loss": 1.0078, "step": 7821 }, { "epoch": 0.18, "learning_rate": 9.410872624507514e-06, "loss": 0.9853, "step": 7822 }, { "epoch": 0.18, "learning_rate": 9.41069575049608e-06, "loss": 1.0181, "step": 7823 }, { "epoch": 0.18, "learning_rate": 9.410518851599798e-06, "loss": 0.8281, "step": 7824 }, { "epoch": 0.18, "learning_rate": 9.410341927819671e-06, "loss": 1.1292, "step": 7825 }, { "epoch": 0.18, "learning_rate": 9.410164979156694e-06, "loss": 0.9689, "step": 7826 }, { "epoch": 0.18, "learning_rate": 9.409988005611865e-06, "loss": 0.9609, "step": 7827 }, { "epoch": 0.18, "learning_rate": 9.409811007186183e-06, "loss": 1.0957, "step": 7828 }, { "epoch": 0.18, "learning_rate": 9.409633983880648e-06, "loss": 0.8116, "step": 7829 }, { "epoch": 0.18, "learning_rate": 9.40945693569626e-06, "loss": 1.0451, "step": 7830 }, { "epoch": 0.18, "learning_rate": 9.409279862634012e-06, "loss": 0.9998, "step": 7831 }, { "epoch": 0.18, "learning_rate": 9.40910276469491e-06, "loss": 0.8905, "step": 7832 }, { "epoch": 0.18, "learning_rate": 9.40892564187995e-06, "loss": 1.1002, "step": 7833 }, { "epoch": 0.18, "learning_rate": 9.408748494190131e-06, "loss": 1.0455, "step": 7834 }, { "epoch": 0.18, "learning_rate": 9.408571321626452e-06, "loss": 1.0717, "step": 7835 }, { "epoch": 0.18, "learning_rate": 9.408394124189914e-06, "loss": 0.82, "step": 7836 }, { "epoch": 0.18, "learning_rate": 9.408216901881517e-06, "loss": 1.1211, "step": 7837 }, { "epoch": 0.18, "learning_rate": 9.40803965470226e-06, "loss": 0.9975, "step": 7838 }, { "epoch": 0.18, "learning_rate": 9.407862382653144e-06, "loss": 1.027, "step": 7839 }, { "epoch": 0.18, "learning_rate": 9.407685085735166e-06, "loss": 1.2157, "step": 7840 }, { "epoch": 0.18, "learning_rate": 9.407507763949329e-06, "loss": 1.2345, "step": 7841 }, { "epoch": 0.18, "learning_rate": 9.407330417296634e-06, "loss": 1.0386, "step": 7842 }, { "epoch": 0.18, "learning_rate": 9.407153045778079e-06, "loss": 0.9903, "step": 7843 }, { "epoch": 0.18, "learning_rate": 9.406975649394666e-06, "loss": 0.7937, "step": 7844 }, { "epoch": 0.18, "learning_rate": 9.406798228147398e-06, "loss": 0.9285, "step": 7845 }, { "epoch": 0.18, "learning_rate": 9.406620782037274e-06, "loss": 0.7787, "step": 7846 }, { "epoch": 0.18, "learning_rate": 9.406443311065296e-06, "loss": 1.2125, "step": 7847 }, { "epoch": 0.18, "learning_rate": 9.406265815232463e-06, "loss": 1.055, "step": 7848 }, { "epoch": 0.18, "learning_rate": 9.40608829453978e-06, "loss": 1.0107, "step": 7849 }, { "epoch": 0.18, "learning_rate": 9.405910748988243e-06, "loss": 1.1423, "step": 7850 }, { "epoch": 0.18, "learning_rate": 9.40573317857886e-06, "loss": 1.3267, "step": 7851 }, { "epoch": 0.18, "learning_rate": 9.40555558331263e-06, "loss": 0.9178, "step": 7852 }, { "epoch": 0.18, "learning_rate": 9.405377963190553e-06, "loss": 1.1862, "step": 7853 }, { "epoch": 0.18, "learning_rate": 9.405200318213633e-06, "loss": 1.059, "step": 7854 }, { "epoch": 0.18, "learning_rate": 9.405022648382875e-06, "loss": 1.0208, "step": 7855 }, { "epoch": 0.18, "learning_rate": 9.40484495369928e-06, "loss": 0.9687, "step": 7856 }, { "epoch": 0.18, "learning_rate": 9.404667234163847e-06, "loss": 1.1072, "step": 7857 }, { "epoch": 0.18, "learning_rate": 9.40448948977758e-06, "loss": 1.0149, "step": 7858 }, { "epoch": 0.18, "learning_rate": 9.404311720541485e-06, "loss": 1.1543, "step": 7859 }, { "epoch": 0.18, "learning_rate": 9.404133926456563e-06, "loss": 1.0822, "step": 7860 }, { "epoch": 0.18, "learning_rate": 9.403956107523816e-06, "loss": 0.9778, "step": 7861 }, { "epoch": 0.18, "learning_rate": 9.403778263744246e-06, "loss": 1.0906, "step": 7862 }, { "epoch": 0.18, "learning_rate": 9.403600395118861e-06, "loss": 1.1953, "step": 7863 }, { "epoch": 0.18, "learning_rate": 9.403422501648662e-06, "loss": 0.9059, "step": 7864 }, { "epoch": 0.18, "learning_rate": 9.403244583334654e-06, "loss": 1.1541, "step": 7865 }, { "epoch": 0.18, "learning_rate": 9.403066640177837e-06, "loss": 1.0226, "step": 7866 }, { "epoch": 0.18, "learning_rate": 9.40288867217922e-06, "loss": 0.8701, "step": 7867 }, { "epoch": 0.18, "learning_rate": 9.402710679339803e-06, "loss": 1.0072, "step": 7868 }, { "epoch": 0.18, "learning_rate": 9.40253266166059e-06, "loss": 1.109, "step": 7869 }, { "epoch": 0.18, "learning_rate": 9.402354619142591e-06, "loss": 0.9086, "step": 7870 }, { "epoch": 0.18, "learning_rate": 9.402176551786805e-06, "loss": 1.0246, "step": 7871 }, { "epoch": 0.18, "learning_rate": 9.401998459594238e-06, "loss": 1.1118, "step": 7872 }, { "epoch": 0.18, "learning_rate": 9.401820342565896e-06, "loss": 1.1014, "step": 7873 }, { "epoch": 0.18, "learning_rate": 9.401642200702783e-06, "loss": 0.9431, "step": 7874 }, { "epoch": 0.18, "learning_rate": 9.401464034005902e-06, "loss": 1.1701, "step": 7875 }, { "epoch": 0.18, "learning_rate": 9.401285842476264e-06, "loss": 0.8633, "step": 7876 }, { "epoch": 0.18, "learning_rate": 9.401107626114867e-06, "loss": 1.0789, "step": 7877 }, { "epoch": 0.18, "learning_rate": 9.400929384922723e-06, "loss": 0.8446, "step": 7878 }, { "epoch": 0.18, "learning_rate": 9.400751118900833e-06, "loss": 1.1896, "step": 7879 }, { "epoch": 0.18, "learning_rate": 9.400572828050205e-06, "loss": 1.1001, "step": 7880 }, { "epoch": 0.18, "learning_rate": 9.400394512371843e-06, "loss": 1.2029, "step": 7881 }, { "epoch": 0.18, "learning_rate": 9.400216171866757e-06, "loss": 1.216, "step": 7882 }, { "epoch": 0.18, "learning_rate": 9.40003780653595e-06, "loss": 0.8962, "step": 7883 }, { "epoch": 0.18, "learning_rate": 9.399859416380428e-06, "loss": 0.9802, "step": 7884 }, { "epoch": 0.18, "learning_rate": 9.3996810014012e-06, "loss": 1.0946, "step": 7885 }, { "epoch": 0.18, "learning_rate": 9.399502561599269e-06, "loss": 0.7847, "step": 7886 }, { "epoch": 0.18, "learning_rate": 9.399324096975646e-06, "loss": 0.7304, "step": 7887 }, { "epoch": 0.18, "learning_rate": 9.399145607531335e-06, "loss": 0.8649, "step": 7888 }, { "epoch": 0.18, "learning_rate": 9.398967093267342e-06, "loss": 1.0922, "step": 7889 }, { "epoch": 0.18, "learning_rate": 9.398788554184676e-06, "loss": 1.0686, "step": 7890 }, { "epoch": 0.18, "learning_rate": 9.398609990284347e-06, "loss": 0.8223, "step": 7891 }, { "epoch": 0.18, "learning_rate": 9.398431401567359e-06, "loss": 1.1094, "step": 7892 }, { "epoch": 0.18, "learning_rate": 9.398252788034719e-06, "loss": 1.0675, "step": 7893 }, { "epoch": 0.18, "learning_rate": 9.398074149687435e-06, "loss": 0.9296, "step": 7894 }, { "epoch": 0.18, "learning_rate": 9.397895486526518e-06, "loss": 1.291, "step": 7895 }, { "epoch": 0.18, "learning_rate": 9.397716798552971e-06, "loss": 0.94, "step": 7896 }, { "epoch": 0.18, "learning_rate": 9.397538085767808e-06, "loss": 0.8979, "step": 7897 }, { "epoch": 0.18, "learning_rate": 9.397359348172033e-06, "loss": 1.014, "step": 7898 }, { "epoch": 0.18, "learning_rate": 9.397180585766654e-06, "loss": 1.1051, "step": 7899 }, { "epoch": 0.18, "learning_rate": 9.397001798552684e-06, "loss": 0.9773, "step": 7900 }, { "epoch": 0.18, "learning_rate": 9.396822986531128e-06, "loss": 0.8578, "step": 7901 }, { "epoch": 0.18, "learning_rate": 9.396644149702997e-06, "loss": 1.021, "step": 7902 }, { "epoch": 0.18, "learning_rate": 9.396465288069297e-06, "loss": 0.9623, "step": 7903 }, { "epoch": 0.18, "learning_rate": 9.396286401631038e-06, "loss": 0.979, "step": 7904 }, { "epoch": 0.18, "learning_rate": 9.39610749038923e-06, "loss": 1.1333, "step": 7905 }, { "epoch": 0.18, "learning_rate": 9.395928554344886e-06, "loss": 1.2072, "step": 7906 }, { "epoch": 0.18, "learning_rate": 9.39574959349901e-06, "loss": 1.305, "step": 7907 }, { "epoch": 0.18, "learning_rate": 9.395570607852613e-06, "loss": 0.9305, "step": 7908 }, { "epoch": 0.18, "learning_rate": 9.395391597406707e-06, "loss": 1.0494, "step": 7909 }, { "epoch": 0.18, "learning_rate": 9.3952125621623e-06, "loss": 1.0392, "step": 7910 }, { "epoch": 0.18, "learning_rate": 9.395033502120404e-06, "loss": 0.7329, "step": 7911 }, { "epoch": 0.18, "learning_rate": 9.394854417282024e-06, "loss": 1.0569, "step": 7912 }, { "epoch": 0.18, "learning_rate": 9.394675307648177e-06, "loss": 1.2273, "step": 7913 }, { "epoch": 0.18, "learning_rate": 9.394496173219871e-06, "loss": 0.7974, "step": 7914 }, { "epoch": 0.18, "learning_rate": 9.394317013998118e-06, "loss": 1.2407, "step": 7915 }, { "epoch": 0.18, "learning_rate": 9.394137829983924e-06, "loss": 1.2178, "step": 7916 }, { "epoch": 0.18, "learning_rate": 9.393958621178305e-06, "loss": 1.0268, "step": 7917 }, { "epoch": 0.18, "learning_rate": 9.393779387582272e-06, "loss": 0.9203, "step": 7918 }, { "epoch": 0.18, "learning_rate": 9.393600129196832e-06, "loss": 0.9517, "step": 7919 }, { "epoch": 0.18, "learning_rate": 9.393420846023e-06, "loss": 1.0146, "step": 7920 }, { "epoch": 0.18, "learning_rate": 9.393241538061787e-06, "loss": 0.918, "step": 7921 }, { "epoch": 0.18, "learning_rate": 9.393062205314203e-06, "loss": 0.8392, "step": 7922 }, { "epoch": 0.18, "learning_rate": 9.392882847781259e-06, "loss": 0.9863, "step": 7923 }, { "epoch": 0.18, "learning_rate": 9.392703465463973e-06, "loss": 0.9901, "step": 7924 }, { "epoch": 0.18, "learning_rate": 9.39252405836335e-06, "loss": 0.9381, "step": 7925 }, { "epoch": 0.18, "learning_rate": 9.392344626480405e-06, "loss": 1.0831, "step": 7926 }, { "epoch": 0.18, "learning_rate": 9.392165169816152e-06, "loss": 0.9658, "step": 7927 }, { "epoch": 0.18, "learning_rate": 9.3919856883716e-06, "loss": 1.0438, "step": 7928 }, { "epoch": 0.18, "learning_rate": 9.391806182147764e-06, "loss": 1.2691, "step": 7929 }, { "epoch": 0.18, "learning_rate": 9.391626651145658e-06, "loss": 0.92, "step": 7930 }, { "epoch": 0.18, "learning_rate": 9.39144709536629e-06, "loss": 0.995, "step": 7931 }, { "epoch": 0.18, "learning_rate": 9.39126751481068e-06, "loss": 0.814, "step": 7932 }, { "epoch": 0.18, "learning_rate": 9.391087909479835e-06, "loss": 0.8214, "step": 7933 }, { "epoch": 0.18, "learning_rate": 9.39090827937477e-06, "loss": 1.3585, "step": 7934 }, { "epoch": 0.18, "learning_rate": 9.3907286244965e-06, "loss": 1.461, "step": 7935 }, { "epoch": 0.18, "learning_rate": 9.39054894484604e-06, "loss": 0.8503, "step": 7936 }, { "epoch": 0.18, "learning_rate": 9.3903692404244e-06, "loss": 1.0288, "step": 7937 }, { "epoch": 0.18, "learning_rate": 9.390189511232595e-06, "loss": 1.1971, "step": 7938 }, { "epoch": 0.18, "learning_rate": 9.390009757271639e-06, "loss": 0.8676, "step": 7939 }, { "epoch": 0.18, "learning_rate": 9.389829978542546e-06, "loss": 0.9294, "step": 7940 }, { "epoch": 0.18, "learning_rate": 9.389650175046332e-06, "loss": 1.0384, "step": 7941 }, { "epoch": 0.18, "learning_rate": 9.389470346784011e-06, "loss": 1.0665, "step": 7942 }, { "epoch": 0.18, "learning_rate": 9.389290493756595e-06, "loss": 0.9812, "step": 7943 }, { "epoch": 0.18, "learning_rate": 9.389110615965102e-06, "loss": 0.9603, "step": 7944 }, { "epoch": 0.18, "learning_rate": 9.388930713410545e-06, "loss": 0.9593, "step": 7945 }, { "epoch": 0.18, "learning_rate": 9.388750786093938e-06, "loss": 1.221, "step": 7946 }, { "epoch": 0.18, "learning_rate": 9.3885708340163e-06, "loss": 1.0873, "step": 7947 }, { "epoch": 0.18, "learning_rate": 9.388390857178643e-06, "loss": 1.1568, "step": 7948 }, { "epoch": 0.18, "learning_rate": 9.388210855581983e-06, "loss": 0.904, "step": 7949 }, { "epoch": 0.18, "learning_rate": 9.388030829227337e-06, "loss": 1.0373, "step": 7950 }, { "epoch": 0.18, "learning_rate": 9.387850778115718e-06, "loss": 1.0097, "step": 7951 }, { "epoch": 0.18, "learning_rate": 9.387670702248143e-06, "loss": 1.1953, "step": 7952 }, { "epoch": 0.18, "learning_rate": 9.38749060162563e-06, "loss": 1.2336, "step": 7953 }, { "epoch": 0.18, "learning_rate": 9.387310476249192e-06, "loss": 0.9172, "step": 7954 }, { "epoch": 0.18, "learning_rate": 9.387130326119849e-06, "loss": 1.1064, "step": 7955 }, { "epoch": 0.18, "learning_rate": 9.386950151238614e-06, "loss": 0.7954, "step": 7956 }, { "epoch": 0.18, "learning_rate": 9.386769951606503e-06, "loss": 1.1495, "step": 7957 }, { "epoch": 0.18, "learning_rate": 9.386589727224535e-06, "loss": 1.2277, "step": 7958 }, { "epoch": 0.18, "learning_rate": 9.386409478093727e-06, "loss": 1.0607, "step": 7959 }, { "epoch": 0.18, "learning_rate": 9.386229204215094e-06, "loss": 0.8358, "step": 7960 }, { "epoch": 0.18, "learning_rate": 9.386048905589655e-06, "loss": 1.0237, "step": 7961 }, { "epoch": 0.18, "learning_rate": 9.385868582218427e-06, "loss": 1.1885, "step": 7962 }, { "epoch": 0.18, "learning_rate": 9.385688234102425e-06, "loss": 0.9569, "step": 7963 }, { "epoch": 0.18, "learning_rate": 9.385507861242671e-06, "loss": 1.0331, "step": 7964 }, { "epoch": 0.18, "learning_rate": 9.385327463640177e-06, "loss": 0.9298, "step": 7965 }, { "epoch": 0.18, "learning_rate": 9.385147041295966e-06, "loss": 1.0302, "step": 7966 }, { "epoch": 0.18, "learning_rate": 9.384966594211054e-06, "loss": 1.2242, "step": 7967 }, { "epoch": 0.18, "learning_rate": 9.384786122386456e-06, "loss": 1.087, "step": 7968 }, { "epoch": 0.18, "learning_rate": 9.384605625823195e-06, "loss": 1.0214, "step": 7969 }, { "epoch": 0.18, "learning_rate": 9.384425104522288e-06, "loss": 0.9881, "step": 7970 }, { "epoch": 0.18, "learning_rate": 9.384244558484751e-06, "loss": 0.9613, "step": 7971 }, { "epoch": 0.18, "learning_rate": 9.384063987711605e-06, "loss": 1.0594, "step": 7972 }, { "epoch": 0.18, "learning_rate": 9.383883392203868e-06, "loss": 0.8078, "step": 7973 }, { "epoch": 0.18, "learning_rate": 9.38370277196256e-06, "loss": 0.6279, "step": 7974 }, { "epoch": 0.18, "learning_rate": 9.383522126988698e-06, "loss": 0.9026, "step": 7975 }, { "epoch": 0.18, "learning_rate": 9.383341457283302e-06, "loss": 0.8645, "step": 7976 }, { "epoch": 0.18, "learning_rate": 9.383160762847394e-06, "loss": 1.1638, "step": 7977 }, { "epoch": 0.19, "learning_rate": 9.382980043681989e-06, "loss": 0.8371, "step": 7978 }, { "epoch": 0.19, "learning_rate": 9.382799299788108e-06, "loss": 1.2318, "step": 7979 }, { "epoch": 0.19, "learning_rate": 9.382618531166773e-06, "loss": 0.9004, "step": 7980 }, { "epoch": 0.19, "learning_rate": 9.382437737819002e-06, "loss": 0.8588, "step": 7981 }, { "epoch": 0.19, "learning_rate": 9.382256919745816e-06, "loss": 1.1601, "step": 7982 }, { "epoch": 0.19, "learning_rate": 9.382076076948234e-06, "loss": 0.9572, "step": 7983 }, { "epoch": 0.19, "learning_rate": 9.381895209427277e-06, "loss": 0.9263, "step": 7984 }, { "epoch": 0.19, "learning_rate": 9.381714317183966e-06, "loss": 0.8283, "step": 7985 }, { "epoch": 0.19, "learning_rate": 9.381533400219319e-06, "loss": 0.7937, "step": 7986 }, { "epoch": 0.19, "learning_rate": 9.381352458534359e-06, "loss": 1.1148, "step": 7987 }, { "epoch": 0.19, "learning_rate": 9.381171492130108e-06, "loss": 0.9033, "step": 7988 }, { "epoch": 0.19, "learning_rate": 9.380990501007584e-06, "loss": 1.0578, "step": 7989 }, { "epoch": 0.19, "learning_rate": 9.38080948516781e-06, "loss": 0.9395, "step": 7990 }, { "epoch": 0.19, "learning_rate": 9.380628444611807e-06, "loss": 0.9034, "step": 7991 }, { "epoch": 0.19, "learning_rate": 9.380447379340596e-06, "loss": 0.8704, "step": 7992 }, { "epoch": 0.19, "learning_rate": 9.3802662893552e-06, "loss": 0.9502, "step": 7993 }, { "epoch": 0.19, "learning_rate": 9.380085174656638e-06, "loss": 0.9107, "step": 7994 }, { "epoch": 0.19, "learning_rate": 9.379904035245934e-06, "loss": 1.1688, "step": 7995 }, { "epoch": 0.19, "learning_rate": 9.379722871124109e-06, "loss": 0.9404, "step": 7996 }, { "epoch": 0.19, "learning_rate": 9.379541682292186e-06, "loss": 1.1225, "step": 7997 }, { "epoch": 0.19, "learning_rate": 9.379360468751187e-06, "loss": 0.948, "step": 7998 }, { "epoch": 0.19, "learning_rate": 9.379179230502133e-06, "loss": 1.0651, "step": 7999 }, { "epoch": 0.19, "learning_rate": 9.378997967546049e-06, "loss": 0.7847, "step": 8000 }, { "epoch": 0.19, "learning_rate": 9.378816679883956e-06, "loss": 1.19, "step": 8001 }, { "epoch": 0.19, "learning_rate": 9.378635367516875e-06, "loss": 1.0163, "step": 8002 }, { "epoch": 0.19, "learning_rate": 9.378454030445834e-06, "loss": 1.0036, "step": 8003 }, { "epoch": 0.19, "learning_rate": 9.378272668671852e-06, "loss": 1.0032, "step": 8004 }, { "epoch": 0.19, "learning_rate": 9.378091282195953e-06, "loss": 0.9086, "step": 8005 }, { "epoch": 0.19, "learning_rate": 9.377909871019162e-06, "loss": 0.9233, "step": 8006 }, { "epoch": 0.19, "learning_rate": 9.3777284351425e-06, "loss": 1.1434, "step": 8007 }, { "epoch": 0.19, "learning_rate": 9.377546974566994e-06, "loss": 0.8979, "step": 8008 }, { "epoch": 0.19, "learning_rate": 9.377365489293663e-06, "loss": 1.172, "step": 8009 }, { "epoch": 0.19, "learning_rate": 9.377183979323535e-06, "loss": 0.937, "step": 8010 }, { "epoch": 0.19, "learning_rate": 9.377002444657632e-06, "loss": 0.908, "step": 8011 }, { "epoch": 0.19, "learning_rate": 9.37682088529698e-06, "loss": 1.1365, "step": 8012 }, { "epoch": 0.19, "learning_rate": 9.376639301242602e-06, "loss": 1.2175, "step": 8013 }, { "epoch": 0.19, "learning_rate": 9.376457692495521e-06, "loss": 1.0405, "step": 8014 }, { "epoch": 0.19, "learning_rate": 9.376276059056766e-06, "loss": 0.9688, "step": 8015 }, { "epoch": 0.19, "learning_rate": 9.376094400927359e-06, "loss": 1.079, "step": 8016 }, { "epoch": 0.19, "learning_rate": 9.375912718108323e-06, "loss": 0.9196, "step": 8017 }, { "epoch": 0.19, "learning_rate": 9.375731010600686e-06, "loss": 0.7672, "step": 8018 }, { "epoch": 0.19, "learning_rate": 9.375549278405473e-06, "loss": 1.046, "step": 8019 }, { "epoch": 0.19, "learning_rate": 9.375367521523708e-06, "loss": 0.9706, "step": 8020 }, { "epoch": 0.19, "learning_rate": 9.375185739956418e-06, "loss": 1.0087, "step": 8021 }, { "epoch": 0.19, "learning_rate": 9.375003933704625e-06, "loss": 1.0374, "step": 8022 }, { "epoch": 0.19, "learning_rate": 9.374822102769361e-06, "loss": 1.0872, "step": 8023 }, { "epoch": 0.19, "learning_rate": 9.374640247151647e-06, "loss": 0.7006, "step": 8024 }, { "epoch": 0.19, "learning_rate": 9.374458366852509e-06, "loss": 1.0104, "step": 8025 }, { "epoch": 0.19, "learning_rate": 9.374276461872975e-06, "loss": 0.7444, "step": 8026 }, { "epoch": 0.19, "learning_rate": 9.374094532214071e-06, "loss": 0.9484, "step": 8027 }, { "epoch": 0.19, "learning_rate": 9.373912577876823e-06, "loss": 0.9307, "step": 8028 }, { "epoch": 0.19, "learning_rate": 9.373730598862258e-06, "loss": 0.8553, "step": 8029 }, { "epoch": 0.19, "learning_rate": 9.373548595171403e-06, "loss": 1.0963, "step": 8030 }, { "epoch": 0.19, "learning_rate": 9.373366566805284e-06, "loss": 0.996, "step": 8031 }, { "epoch": 0.19, "learning_rate": 9.373184513764929e-06, "loss": 0.9625, "step": 8032 }, { "epoch": 0.19, "learning_rate": 9.373002436051362e-06, "loss": 1.0658, "step": 8033 }, { "epoch": 0.19, "learning_rate": 9.372820333665615e-06, "loss": 1.0024, "step": 8034 }, { "epoch": 0.19, "learning_rate": 9.372638206608711e-06, "loss": 0.8925, "step": 8035 }, { "epoch": 0.19, "learning_rate": 9.37245605488168e-06, "loss": 1.2976, "step": 8036 }, { "epoch": 0.19, "learning_rate": 9.372273878485552e-06, "loss": 1.0584, "step": 8037 }, { "epoch": 0.19, "learning_rate": 9.37209167742135e-06, "loss": 1.1021, "step": 8038 }, { "epoch": 0.19, "learning_rate": 9.371909451690105e-06, "loss": 1.0548, "step": 8039 }, { "epoch": 0.19, "learning_rate": 9.371727201292844e-06, "loss": 1.0423, "step": 8040 }, { "epoch": 0.19, "learning_rate": 9.371544926230596e-06, "loss": 0.8754, "step": 8041 }, { "epoch": 0.19, "learning_rate": 9.371362626504388e-06, "loss": 1.358, "step": 8042 }, { "epoch": 0.19, "learning_rate": 9.371180302115247e-06, "loss": 1.1902, "step": 8043 }, { "epoch": 0.19, "learning_rate": 9.370997953064209e-06, "loss": 1.0445, "step": 8044 }, { "epoch": 0.19, "learning_rate": 9.370815579352295e-06, "loss": 1.1023, "step": 8045 }, { "epoch": 0.19, "learning_rate": 9.370633180980537e-06, "loss": 0.94, "step": 8046 }, { "epoch": 0.19, "learning_rate": 9.370450757949965e-06, "loss": 1.1925, "step": 8047 }, { "epoch": 0.19, "learning_rate": 9.370268310261606e-06, "loss": 0.8721, "step": 8048 }, { "epoch": 0.19, "learning_rate": 9.37008583791649e-06, "loss": 0.944, "step": 8049 }, { "epoch": 0.19, "learning_rate": 9.36990334091565e-06, "loss": 0.9787, "step": 8050 }, { "epoch": 0.19, "learning_rate": 9.369720819260108e-06, "loss": 1.0477, "step": 8051 }, { "epoch": 0.19, "learning_rate": 9.369538272950902e-06, "loss": 1.1646, "step": 8052 }, { "epoch": 0.19, "learning_rate": 9.369355701989057e-06, "loss": 1.2252, "step": 8053 }, { "epoch": 0.19, "learning_rate": 9.369173106375605e-06, "loss": 1.2471, "step": 8054 }, { "epoch": 0.19, "learning_rate": 9.368990486111574e-06, "loss": 1.1929, "step": 8055 }, { "epoch": 0.19, "learning_rate": 9.368807841197996e-06, "loss": 0.8731, "step": 8056 }, { "epoch": 0.19, "learning_rate": 9.368625171635903e-06, "loss": 1.0036, "step": 8057 }, { "epoch": 0.19, "learning_rate": 9.368442477426322e-06, "loss": 1.2983, "step": 8058 }, { "epoch": 0.19, "learning_rate": 9.36825975857029e-06, "loss": 0.8862, "step": 8059 }, { "epoch": 0.19, "learning_rate": 9.368077015068828e-06, "loss": 1.0076, "step": 8060 }, { "epoch": 0.19, "learning_rate": 9.367894246922975e-06, "loss": 1.4149, "step": 8061 }, { "epoch": 0.19, "learning_rate": 9.367711454133759e-06, "loss": 1.3287, "step": 8062 }, { "epoch": 0.19, "learning_rate": 9.367528636702213e-06, "loss": 0.9464, "step": 8063 }, { "epoch": 0.19, "learning_rate": 9.367345794629367e-06, "loss": 0.9539, "step": 8064 }, { "epoch": 0.19, "learning_rate": 9.367162927916254e-06, "loss": 0.7979, "step": 8065 }, { "epoch": 0.19, "learning_rate": 9.366980036563904e-06, "loss": 0.9963, "step": 8066 }, { "epoch": 0.19, "learning_rate": 9.36679712057335e-06, "loss": 0.8122, "step": 8067 }, { "epoch": 0.19, "learning_rate": 9.366614179945623e-06, "loss": 0.912, "step": 8068 }, { "epoch": 0.19, "learning_rate": 9.366431214681758e-06, "loss": 1.0269, "step": 8069 }, { "epoch": 0.19, "learning_rate": 9.366248224782781e-06, "loss": 1.0658, "step": 8070 }, { "epoch": 0.19, "learning_rate": 9.366065210249731e-06, "loss": 0.7423, "step": 8071 }, { "epoch": 0.19, "learning_rate": 9.365882171083637e-06, "loss": 0.9297, "step": 8072 }, { "epoch": 0.19, "learning_rate": 9.365699107285535e-06, "loss": 1.1695, "step": 8073 }, { "epoch": 0.19, "learning_rate": 9.365516018856453e-06, "loss": 1.1343, "step": 8074 }, { "epoch": 0.19, "learning_rate": 9.36533290579743e-06, "loss": 1.04, "step": 8075 }, { "epoch": 0.19, "learning_rate": 9.365149768109492e-06, "loss": 1.068, "step": 8076 }, { "epoch": 0.19, "learning_rate": 9.364966605793677e-06, "loss": 0.933, "step": 8077 }, { "epoch": 0.19, "learning_rate": 9.364783418851019e-06, "loss": 1.1518, "step": 8078 }, { "epoch": 0.19, "learning_rate": 9.364600207282549e-06, "loss": 0.9761, "step": 8079 }, { "epoch": 0.19, "learning_rate": 9.364416971089301e-06, "loss": 1.1715, "step": 8080 }, { "epoch": 0.19, "learning_rate": 9.36423371027231e-06, "loss": 1.0152, "step": 8081 }, { "epoch": 0.19, "learning_rate": 9.364050424832608e-06, "loss": 1.0566, "step": 8082 }, { "epoch": 0.19, "learning_rate": 9.363867114771231e-06, "loss": 1.1613, "step": 8083 }, { "epoch": 0.19, "learning_rate": 9.363683780089213e-06, "loss": 0.9679, "step": 8084 }, { "epoch": 0.19, "learning_rate": 9.363500420787589e-06, "loss": 1.0514, "step": 8085 }, { "epoch": 0.19, "learning_rate": 9.363317036867389e-06, "loss": 1.1582, "step": 8086 }, { "epoch": 0.19, "learning_rate": 9.363133628329652e-06, "loss": 1.1884, "step": 8087 }, { "epoch": 0.19, "learning_rate": 9.362950195175414e-06, "loss": 0.9758, "step": 8088 }, { "epoch": 0.19, "learning_rate": 9.362766737405706e-06, "loss": 0.8899, "step": 8089 }, { "epoch": 0.19, "learning_rate": 9.362583255021567e-06, "loss": 0.8516, "step": 8090 }, { "epoch": 0.19, "learning_rate": 9.362399748024028e-06, "loss": 1.1741, "step": 8091 }, { "epoch": 0.19, "learning_rate": 9.362216216414127e-06, "loss": 1.0822, "step": 8092 }, { "epoch": 0.19, "learning_rate": 9.362032660192899e-06, "loss": 1.1959, "step": 8093 }, { "epoch": 0.19, "learning_rate": 9.361849079361378e-06, "loss": 1.0054, "step": 8094 }, { "epoch": 0.19, "learning_rate": 9.361665473920602e-06, "loss": 1.0054, "step": 8095 }, { "epoch": 0.19, "learning_rate": 9.361481843871607e-06, "loss": 1.0721, "step": 8096 }, { "epoch": 0.19, "learning_rate": 9.361298189215428e-06, "loss": 1.1041, "step": 8097 }, { "epoch": 0.19, "learning_rate": 9.3611145099531e-06, "loss": 1.0611, "step": 8098 }, { "epoch": 0.19, "learning_rate": 9.360930806085661e-06, "loss": 1.0314, "step": 8099 }, { "epoch": 0.19, "learning_rate": 9.36074707761415e-06, "loss": 0.9087, "step": 8100 }, { "epoch": 0.19, "learning_rate": 9.360563324539597e-06, "loss": 1.2747, "step": 8101 }, { "epoch": 0.19, "learning_rate": 9.360379546863043e-06, "loss": 0.9052, "step": 8102 }, { "epoch": 0.19, "learning_rate": 9.360195744585524e-06, "loss": 1.2758, "step": 8103 }, { "epoch": 0.19, "learning_rate": 9.360011917708079e-06, "loss": 1.0299, "step": 8104 }, { "epoch": 0.19, "learning_rate": 9.35982806623174e-06, "loss": 1.12, "step": 8105 }, { "epoch": 0.19, "learning_rate": 9.359644190157551e-06, "loss": 0.8774, "step": 8106 }, { "epoch": 0.19, "learning_rate": 9.359460289486544e-06, "loss": 0.9819, "step": 8107 }, { "epoch": 0.19, "learning_rate": 9.359276364219759e-06, "loss": 0.9576, "step": 8108 }, { "epoch": 0.19, "learning_rate": 9.359092414358234e-06, "loss": 1.0461, "step": 8109 }, { "epoch": 0.19, "learning_rate": 9.358908439903005e-06, "loss": 0.925, "step": 8110 }, { "epoch": 0.19, "learning_rate": 9.358724440855112e-06, "loss": 0.8961, "step": 8111 }, { "epoch": 0.19, "learning_rate": 9.358540417215592e-06, "loss": 0.9912, "step": 8112 }, { "epoch": 0.19, "learning_rate": 9.358356368985483e-06, "loss": 0.9563, "step": 8113 }, { "epoch": 0.19, "learning_rate": 9.358172296165824e-06, "loss": 1.0392, "step": 8114 }, { "epoch": 0.19, "learning_rate": 9.357988198757655e-06, "loss": 1.1218, "step": 8115 }, { "epoch": 0.19, "learning_rate": 9.357804076762012e-06, "loss": 1.0176, "step": 8116 }, { "epoch": 0.19, "learning_rate": 9.357619930179933e-06, "loss": 0.8075, "step": 8117 }, { "epoch": 0.19, "learning_rate": 9.357435759012462e-06, "loss": 0.9953, "step": 8118 }, { "epoch": 0.19, "learning_rate": 9.35725156326063e-06, "loss": 0.9772, "step": 8119 }, { "epoch": 0.19, "learning_rate": 9.357067342925485e-06, "loss": 0.8427, "step": 8120 }, { "epoch": 0.19, "learning_rate": 9.356883098008062e-06, "loss": 1.0421, "step": 8121 }, { "epoch": 0.19, "learning_rate": 9.3566988285094e-06, "loss": 1.1386, "step": 8122 }, { "epoch": 0.19, "learning_rate": 9.35651453443054e-06, "loss": 0.9404, "step": 8123 }, { "epoch": 0.19, "learning_rate": 9.356330215772522e-06, "loss": 0.9151, "step": 8124 }, { "epoch": 0.19, "learning_rate": 9.356145872536384e-06, "loss": 1.0863, "step": 8125 }, { "epoch": 0.19, "learning_rate": 9.355961504723167e-06, "loss": 0.9413, "step": 8126 }, { "epoch": 0.19, "learning_rate": 9.355777112333913e-06, "loss": 1.0325, "step": 8127 }, { "epoch": 0.19, "learning_rate": 9.355592695369659e-06, "loss": 1.0062, "step": 8128 }, { "epoch": 0.19, "learning_rate": 9.355408253831448e-06, "loss": 1.0623, "step": 8129 }, { "epoch": 0.19, "learning_rate": 9.35522378772032e-06, "loss": 1.1428, "step": 8130 }, { "epoch": 0.19, "learning_rate": 9.355039297037317e-06, "loss": 1.0002, "step": 8131 }, { "epoch": 0.19, "learning_rate": 9.354854781783479e-06, "loss": 0.7876, "step": 8132 }, { "epoch": 0.19, "learning_rate": 9.354670241959842e-06, "loss": 0.8999, "step": 8133 }, { "epoch": 0.19, "learning_rate": 9.354485677567456e-06, "loss": 0.9131, "step": 8134 }, { "epoch": 0.19, "learning_rate": 9.354301088607357e-06, "loss": 1.0792, "step": 8135 }, { "epoch": 0.19, "learning_rate": 9.354116475080586e-06, "loss": 0.9048, "step": 8136 }, { "epoch": 0.19, "learning_rate": 9.353931836988187e-06, "loss": 0.8914, "step": 8137 }, { "epoch": 0.19, "learning_rate": 9.3537471743312e-06, "loss": 1.0479, "step": 8138 }, { "epoch": 0.19, "learning_rate": 9.35356248711067e-06, "loss": 1.0255, "step": 8139 }, { "epoch": 0.19, "learning_rate": 9.353377775327634e-06, "loss": 0.9891, "step": 8140 }, { "epoch": 0.19, "learning_rate": 9.353193038983138e-06, "loss": 1.2564, "step": 8141 }, { "epoch": 0.19, "learning_rate": 9.353008278078222e-06, "loss": 0.9539, "step": 8142 }, { "epoch": 0.19, "learning_rate": 9.352823492613931e-06, "loss": 0.9943, "step": 8143 }, { "epoch": 0.19, "learning_rate": 9.352638682591304e-06, "loss": 0.9396, "step": 8144 }, { "epoch": 0.19, "learning_rate": 9.352453848011388e-06, "loss": 0.9374, "step": 8145 }, { "epoch": 0.19, "learning_rate": 9.352268988875222e-06, "loss": 1.0782, "step": 8146 }, { "epoch": 0.19, "learning_rate": 9.35208410518385e-06, "loss": 0.8151, "step": 8147 }, { "epoch": 0.19, "learning_rate": 9.351899196938316e-06, "loss": 1.0959, "step": 8148 }, { "epoch": 0.19, "learning_rate": 9.351714264139661e-06, "loss": 1.0027, "step": 8149 }, { "epoch": 0.19, "learning_rate": 9.351529306788933e-06, "loss": 0.9518, "step": 8150 }, { "epoch": 0.19, "learning_rate": 9.351344324887171e-06, "loss": 0.9823, "step": 8151 }, { "epoch": 0.19, "learning_rate": 9.35115931843542e-06, "loss": 1.0515, "step": 8152 }, { "epoch": 0.19, "learning_rate": 9.350974287434726e-06, "loss": 0.8245, "step": 8153 }, { "epoch": 0.19, "learning_rate": 9.35078923188613e-06, "loss": 1.1619, "step": 8154 }, { "epoch": 0.19, "learning_rate": 9.350604151790677e-06, "loss": 0.9187, "step": 8155 }, { "epoch": 0.19, "learning_rate": 9.350419047149411e-06, "loss": 0.9509, "step": 8156 }, { "epoch": 0.19, "learning_rate": 9.350233917963375e-06, "loss": 1.0809, "step": 8157 }, { "epoch": 0.19, "learning_rate": 9.35004876423362e-06, "loss": 0.8845, "step": 8158 }, { "epoch": 0.19, "learning_rate": 9.349863585961181e-06, "loss": 1.088, "step": 8159 }, { "epoch": 0.19, "learning_rate": 9.34967838314711e-06, "loss": 1.0989, "step": 8160 }, { "epoch": 0.19, "learning_rate": 9.349493155792449e-06, "loss": 0.9261, "step": 8161 }, { "epoch": 0.19, "learning_rate": 9.349307903898245e-06, "loss": 0.9713, "step": 8162 }, { "epoch": 0.19, "learning_rate": 9.349122627465538e-06, "loss": 1.131, "step": 8163 }, { "epoch": 0.19, "learning_rate": 9.34893732649538e-06, "loss": 1.0505, "step": 8164 }, { "epoch": 0.19, "learning_rate": 9.34875200098881e-06, "loss": 0.9728, "step": 8165 }, { "epoch": 0.19, "learning_rate": 9.34856665094688e-06, "loss": 1.0643, "step": 8166 }, { "epoch": 0.19, "learning_rate": 9.348381276370633e-06, "loss": 1.0382, "step": 8167 }, { "epoch": 0.19, "learning_rate": 9.348195877261113e-06, "loss": 1.2128, "step": 8168 }, { "epoch": 0.19, "learning_rate": 9.348010453619369e-06, "loss": 1.1298, "step": 8169 }, { "epoch": 0.19, "learning_rate": 9.347825005446444e-06, "loss": 0.996, "step": 8170 }, { "epoch": 0.19, "learning_rate": 9.347639532743388e-06, "loss": 1.1533, "step": 8171 }, { "epoch": 0.19, "learning_rate": 9.347454035511244e-06, "loss": 0.9761, "step": 8172 }, { "epoch": 0.19, "learning_rate": 9.34726851375106e-06, "loss": 1.0952, "step": 8173 }, { "epoch": 0.19, "learning_rate": 9.347082967463885e-06, "loss": 1.0165, "step": 8174 }, { "epoch": 0.19, "learning_rate": 9.34689739665076e-06, "loss": 1.3531, "step": 8175 }, { "epoch": 0.19, "learning_rate": 9.346711801312738e-06, "loss": 0.8306, "step": 8176 }, { "epoch": 0.19, "learning_rate": 9.346526181450863e-06, "loss": 0.9607, "step": 8177 }, { "epoch": 0.19, "learning_rate": 9.346340537066184e-06, "loss": 0.7712, "step": 8178 }, { "epoch": 0.19, "learning_rate": 9.346154868159748e-06, "loss": 0.9306, "step": 8179 }, { "epoch": 0.19, "learning_rate": 9.345969174732599e-06, "loss": 0.9432, "step": 8180 }, { "epoch": 0.19, "learning_rate": 9.345783456785788e-06, "loss": 0.9269, "step": 8181 }, { "epoch": 0.19, "learning_rate": 9.345597714320363e-06, "loss": 0.9069, "step": 8182 }, { "epoch": 0.19, "learning_rate": 9.345411947337373e-06, "loss": 1.1089, "step": 8183 }, { "epoch": 0.19, "learning_rate": 9.345226155837861e-06, "loss": 0.9845, "step": 8184 }, { "epoch": 0.19, "learning_rate": 9.345040339822882e-06, "loss": 0.9953, "step": 8185 }, { "epoch": 0.19, "learning_rate": 9.34485449929348e-06, "loss": 0.8918, "step": 8186 }, { "epoch": 0.19, "learning_rate": 9.344668634250701e-06, "loss": 0.9153, "step": 8187 }, { "epoch": 0.19, "learning_rate": 9.344482744695601e-06, "loss": 1.0701, "step": 8188 }, { "epoch": 0.19, "learning_rate": 9.344296830629225e-06, "loss": 1.0969, "step": 8189 }, { "epoch": 0.19, "learning_rate": 9.34411089205262e-06, "loss": 1.1287, "step": 8190 }, { "epoch": 0.19, "learning_rate": 9.343924928966838e-06, "loss": 0.9643, "step": 8191 }, { "epoch": 0.19, "learning_rate": 9.343738941372926e-06, "loss": 0.9616, "step": 8192 }, { "epoch": 0.19, "learning_rate": 9.343552929271935e-06, "loss": 0.8245, "step": 8193 }, { "epoch": 0.19, "learning_rate": 9.343366892664914e-06, "loss": 0.9174, "step": 8194 }, { "epoch": 0.19, "learning_rate": 9.343180831552911e-06, "loss": 0.9232, "step": 8195 }, { "epoch": 0.19, "learning_rate": 9.342994745936979e-06, "loss": 1.1817, "step": 8196 }, { "epoch": 0.19, "learning_rate": 9.342808635818165e-06, "loss": 1.1292, "step": 8197 }, { "epoch": 0.19, "learning_rate": 9.34262250119752e-06, "loss": 0.9899, "step": 8198 }, { "epoch": 0.19, "learning_rate": 9.342436342076096e-06, "loss": 1.1631, "step": 8199 }, { "epoch": 0.19, "learning_rate": 9.34225015845494e-06, "loss": 0.8471, "step": 8200 }, { "epoch": 0.19, "learning_rate": 9.342063950335102e-06, "loss": 1.0911, "step": 8201 }, { "epoch": 0.19, "learning_rate": 9.341877717717638e-06, "loss": 1.0802, "step": 8202 }, { "epoch": 0.19, "learning_rate": 9.341691460603594e-06, "loss": 0.9318, "step": 8203 }, { "epoch": 0.19, "learning_rate": 9.341505178994022e-06, "loss": 0.8675, "step": 8204 }, { "epoch": 0.19, "learning_rate": 9.341318872889972e-06, "loss": 1.2334, "step": 8205 }, { "epoch": 0.19, "learning_rate": 9.341132542292497e-06, "loss": 0.9992, "step": 8206 }, { "epoch": 0.19, "learning_rate": 9.340946187202648e-06, "loss": 0.8398, "step": 8207 }, { "epoch": 0.19, "learning_rate": 9.340759807621477e-06, "loss": 0.9748, "step": 8208 }, { "epoch": 0.19, "learning_rate": 9.340573403550033e-06, "loss": 1.0762, "step": 8209 }, { "epoch": 0.19, "learning_rate": 9.340386974989369e-06, "loss": 1.1049, "step": 8210 }, { "epoch": 0.19, "learning_rate": 9.340200521940537e-06, "loss": 0.7866, "step": 8211 }, { "epoch": 0.19, "learning_rate": 9.340014044404588e-06, "loss": 0.8604, "step": 8212 }, { "epoch": 0.19, "learning_rate": 9.339827542382576e-06, "loss": 0.9493, "step": 8213 }, { "epoch": 0.19, "learning_rate": 9.339641015875554e-06, "loss": 0.9516, "step": 8214 }, { "epoch": 0.19, "learning_rate": 9.33945446488457e-06, "loss": 0.7596, "step": 8215 }, { "epoch": 0.19, "learning_rate": 9.339267889410678e-06, "loss": 0.9102, "step": 8216 }, { "epoch": 0.19, "learning_rate": 9.339081289454934e-06, "loss": 0.8196, "step": 8217 }, { "epoch": 0.19, "learning_rate": 9.33889466501839e-06, "loss": 0.942, "step": 8218 }, { "epoch": 0.19, "learning_rate": 9.338708016102094e-06, "loss": 0.9382, "step": 8219 }, { "epoch": 0.19, "learning_rate": 9.338521342707104e-06, "loss": 0.8012, "step": 8220 }, { "epoch": 0.19, "learning_rate": 9.338334644834473e-06, "loss": 1.0448, "step": 8221 }, { "epoch": 0.19, "learning_rate": 9.338147922485251e-06, "loss": 0.859, "step": 8222 }, { "epoch": 0.19, "learning_rate": 9.337961175660496e-06, "loss": 1.0751, "step": 8223 }, { "epoch": 0.19, "learning_rate": 9.337774404361255e-06, "loss": 1.1692, "step": 8224 }, { "epoch": 0.19, "learning_rate": 9.337587608588588e-06, "loss": 1.0796, "step": 8225 }, { "epoch": 0.19, "learning_rate": 9.337400788343547e-06, "loss": 0.7539, "step": 8226 }, { "epoch": 0.19, "learning_rate": 9.337213943627185e-06, "loss": 0.8537, "step": 8227 }, { "epoch": 0.19, "learning_rate": 9.337027074440558e-06, "loss": 0.9557, "step": 8228 }, { "epoch": 0.19, "learning_rate": 9.33684018078472e-06, "loss": 1.1359, "step": 8229 }, { "epoch": 0.19, "learning_rate": 9.336653262660724e-06, "loss": 0.9921, "step": 8230 }, { "epoch": 0.19, "learning_rate": 9.336466320069624e-06, "loss": 1.0718, "step": 8231 }, { "epoch": 0.19, "learning_rate": 9.336279353012477e-06, "loss": 0.9663, "step": 8232 }, { "epoch": 0.19, "learning_rate": 9.336092361490336e-06, "loss": 0.9219, "step": 8233 }, { "epoch": 0.19, "learning_rate": 9.335905345504258e-06, "loss": 0.763, "step": 8234 }, { "epoch": 0.19, "learning_rate": 9.335718305055296e-06, "loss": 1.2238, "step": 8235 }, { "epoch": 0.19, "learning_rate": 9.335531240144507e-06, "loss": 1.0352, "step": 8236 }, { "epoch": 0.19, "learning_rate": 9.335344150772946e-06, "loss": 1.122, "step": 8237 }, { "epoch": 0.19, "learning_rate": 9.335157036941667e-06, "loss": 1.0946, "step": 8238 }, { "epoch": 0.19, "learning_rate": 9.334969898651728e-06, "loss": 1.1731, "step": 8239 }, { "epoch": 0.19, "learning_rate": 9.334782735904183e-06, "loss": 1.1573, "step": 8240 }, { "epoch": 0.19, "learning_rate": 9.33459554870009e-06, "loss": 1.1263, "step": 8241 }, { "epoch": 0.19, "learning_rate": 9.334408337040502e-06, "loss": 0.8976, "step": 8242 }, { "epoch": 0.19, "learning_rate": 9.334221100926476e-06, "loss": 1.1775, "step": 8243 }, { "epoch": 0.19, "learning_rate": 9.33403384035907e-06, "loss": 0.8518, "step": 8244 }, { "epoch": 0.19, "learning_rate": 9.333846555339343e-06, "loss": 0.9526, "step": 8245 }, { "epoch": 0.19, "learning_rate": 9.333659245868346e-06, "loss": 1.0291, "step": 8246 }, { "epoch": 0.19, "learning_rate": 9.333471911947139e-06, "loss": 1.1814, "step": 8247 }, { "epoch": 0.19, "learning_rate": 9.333284553576777e-06, "loss": 1.075, "step": 8248 }, { "epoch": 0.19, "learning_rate": 9.333097170758319e-06, "loss": 0.8623, "step": 8249 }, { "epoch": 0.19, "learning_rate": 9.332909763492822e-06, "loss": 0.9693, "step": 8250 }, { "epoch": 0.19, "learning_rate": 9.332722331781343e-06, "loss": 1.3421, "step": 8251 }, { "epoch": 0.19, "learning_rate": 9.33253487562494e-06, "loss": 1.1368, "step": 8252 }, { "epoch": 0.19, "learning_rate": 9.332347395024668e-06, "loss": 1.115, "step": 8253 }, { "epoch": 0.19, "learning_rate": 9.332159889981587e-06, "loss": 1.1658, "step": 8254 }, { "epoch": 0.19, "learning_rate": 9.331972360496755e-06, "loss": 1.0797, "step": 8255 }, { "epoch": 0.19, "learning_rate": 9.331784806571231e-06, "loss": 0.9271, "step": 8256 }, { "epoch": 0.19, "learning_rate": 9.331597228206069e-06, "loss": 0.8529, "step": 8257 }, { "epoch": 0.19, "learning_rate": 9.331409625402333e-06, "loss": 1.1105, "step": 8258 }, { "epoch": 0.19, "learning_rate": 9.331221998161074e-06, "loss": 0.8629, "step": 8259 }, { "epoch": 0.19, "learning_rate": 9.33103434648336e-06, "loss": 0.9147, "step": 8260 }, { "epoch": 0.19, "learning_rate": 9.330846670370243e-06, "loss": 1.4245, "step": 8261 }, { "epoch": 0.19, "learning_rate": 9.330658969822784e-06, "loss": 1.0464, "step": 8262 }, { "epoch": 0.19, "learning_rate": 9.330471244842042e-06, "loss": 0.9661, "step": 8263 }, { "epoch": 0.19, "learning_rate": 9.330283495429074e-06, "loss": 1.0723, "step": 8264 }, { "epoch": 0.19, "learning_rate": 9.330095721584942e-06, "loss": 1.0962, "step": 8265 }, { "epoch": 0.19, "learning_rate": 9.329907923310703e-06, "loss": 1.0997, "step": 8266 }, { "epoch": 0.19, "learning_rate": 9.329720100607422e-06, "loss": 1.0288, "step": 8267 }, { "epoch": 0.19, "learning_rate": 9.329532253476151e-06, "loss": 1.3111, "step": 8268 }, { "epoch": 0.19, "learning_rate": 9.329344381917955e-06, "loss": 1.0424, "step": 8269 }, { "epoch": 0.19, "learning_rate": 9.329156485933893e-06, "loss": 1.1296, "step": 8270 }, { "epoch": 0.19, "learning_rate": 9.328968565525023e-06, "loss": 0.8772, "step": 8271 }, { "epoch": 0.19, "learning_rate": 9.328780620692408e-06, "loss": 0.8583, "step": 8272 }, { "epoch": 0.19, "learning_rate": 9.328592651437108e-06, "loss": 1.0069, "step": 8273 }, { "epoch": 0.19, "learning_rate": 9.328404657760179e-06, "loss": 1.1084, "step": 8274 }, { "epoch": 0.19, "learning_rate": 9.328216639662689e-06, "loss": 0.7635, "step": 8275 }, { "epoch": 0.19, "learning_rate": 9.328028597145694e-06, "loss": 0.9164, "step": 8276 }, { "epoch": 0.19, "learning_rate": 9.327840530210257e-06, "loss": 0.7251, "step": 8277 }, { "epoch": 0.19, "learning_rate": 9.327652438857435e-06, "loss": 1.02, "step": 8278 }, { "epoch": 0.19, "learning_rate": 9.327464323088295e-06, "loss": 1.2471, "step": 8279 }, { "epoch": 0.19, "learning_rate": 9.327276182903896e-06, "loss": 0.7867, "step": 8280 }, { "epoch": 0.19, "learning_rate": 9.327088018305298e-06, "loss": 1.0749, "step": 8281 }, { "epoch": 0.19, "learning_rate": 9.326899829293564e-06, "loss": 1.0833, "step": 8282 }, { "epoch": 0.19, "learning_rate": 9.326711615869755e-06, "loss": 0.9818, "step": 8283 }, { "epoch": 0.19, "learning_rate": 9.326523378034935e-06, "loss": 0.9836, "step": 8284 }, { "epoch": 0.19, "learning_rate": 9.326335115790163e-06, "loss": 0.9895, "step": 8285 }, { "epoch": 0.19, "learning_rate": 9.326146829136503e-06, "loss": 1.239, "step": 8286 }, { "epoch": 0.19, "learning_rate": 9.325958518075016e-06, "loss": 0.9194, "step": 8287 }, { "epoch": 0.19, "learning_rate": 9.325770182606765e-06, "loss": 0.9764, "step": 8288 }, { "epoch": 0.19, "learning_rate": 9.325581822732814e-06, "loss": 1.2053, "step": 8289 }, { "epoch": 0.19, "learning_rate": 9.325393438454225e-06, "loss": 1.0987, "step": 8290 }, { "epoch": 0.19, "learning_rate": 9.32520502977206e-06, "loss": 1.0711, "step": 8291 }, { "epoch": 0.19, "learning_rate": 9.325016596687383e-06, "loss": 1.0356, "step": 8292 }, { "epoch": 0.19, "learning_rate": 9.324828139201255e-06, "loss": 1.1116, "step": 8293 }, { "epoch": 0.19, "learning_rate": 9.324639657314742e-06, "loss": 1.2172, "step": 8294 }, { "epoch": 0.19, "learning_rate": 9.324451151028906e-06, "loss": 1.1118, "step": 8295 }, { "epoch": 0.19, "learning_rate": 9.32426262034481e-06, "loss": 1.0037, "step": 8296 }, { "epoch": 0.19, "learning_rate": 9.32407406526352e-06, "loss": 1.0471, "step": 8297 }, { "epoch": 0.19, "learning_rate": 9.323885485786095e-06, "loss": 0.9333, "step": 8298 }, { "epoch": 0.19, "learning_rate": 9.323696881913606e-06, "loss": 0.8275, "step": 8299 }, { "epoch": 0.19, "learning_rate": 9.323508253647111e-06, "loss": 1.0547, "step": 8300 }, { "epoch": 0.19, "learning_rate": 9.323319600987677e-06, "loss": 0.9493, "step": 8301 }, { "epoch": 0.19, "learning_rate": 9.323130923936369e-06, "loss": 1.3354, "step": 8302 }, { "epoch": 0.19, "learning_rate": 9.322942222494249e-06, "loss": 1.1276, "step": 8303 }, { "epoch": 0.19, "learning_rate": 9.322753496662385e-06, "loss": 1.2185, "step": 8304 }, { "epoch": 0.19, "learning_rate": 9.322564746441838e-06, "loss": 1.2814, "step": 8305 }, { "epoch": 0.19, "learning_rate": 9.322375971833674e-06, "loss": 0.8147, "step": 8306 }, { "epoch": 0.19, "learning_rate": 9.32218717283896e-06, "loss": 1.3165, "step": 8307 }, { "epoch": 0.19, "learning_rate": 9.321998349458761e-06, "loss": 1.2267, "step": 8308 }, { "epoch": 0.19, "learning_rate": 9.32180950169414e-06, "loss": 1.3555, "step": 8309 }, { "epoch": 0.19, "learning_rate": 9.321620629546163e-06, "loss": 1.1789, "step": 8310 }, { "epoch": 0.19, "learning_rate": 9.321431733015897e-06, "loss": 1.0557, "step": 8311 }, { "epoch": 0.19, "learning_rate": 9.321242812104407e-06, "loss": 1.023, "step": 8312 }, { "epoch": 0.19, "learning_rate": 9.32105386681276e-06, "loss": 0.8312, "step": 8313 }, { "epoch": 0.19, "learning_rate": 9.32086489714202e-06, "loss": 1.0973, "step": 8314 }, { "epoch": 0.19, "learning_rate": 9.320675903093254e-06, "loss": 0.8768, "step": 8315 }, { "epoch": 0.19, "learning_rate": 9.32048688466753e-06, "loss": 0.9898, "step": 8316 }, { "epoch": 0.19, "learning_rate": 9.320297841865912e-06, "loss": 0.8648, "step": 8317 }, { "epoch": 0.19, "learning_rate": 9.320108774689467e-06, "loss": 0.9852, "step": 8318 }, { "epoch": 0.19, "learning_rate": 9.319919683139262e-06, "loss": 1.0201, "step": 8319 }, { "epoch": 0.19, "learning_rate": 9.319730567216366e-06, "loss": 1.5113, "step": 8320 }, { "epoch": 0.19, "learning_rate": 9.31954142692184e-06, "loss": 0.7555, "step": 8321 }, { "epoch": 0.19, "learning_rate": 9.319352262256758e-06, "loss": 1.0537, "step": 8322 }, { "epoch": 0.19, "learning_rate": 9.319163073222184e-06, "loss": 0.8994, "step": 8323 }, { "epoch": 0.19, "learning_rate": 9.318973859819185e-06, "loss": 1.166, "step": 8324 }, { "epoch": 0.19, "learning_rate": 9.31878462204883e-06, "loss": 1.3368, "step": 8325 }, { "epoch": 0.19, "learning_rate": 9.318595359912186e-06, "loss": 0.7737, "step": 8326 }, { "epoch": 0.19, "learning_rate": 9.318406073410321e-06, "loss": 1.1254, "step": 8327 }, { "epoch": 0.19, "learning_rate": 9.318216762544301e-06, "loss": 1.3218, "step": 8328 }, { "epoch": 0.19, "learning_rate": 9.318027427315198e-06, "loss": 1.0958, "step": 8329 }, { "epoch": 0.19, "learning_rate": 9.317838067724077e-06, "loss": 0.9275, "step": 8330 }, { "epoch": 0.19, "learning_rate": 9.317648683772007e-06, "loss": 1.02, "step": 8331 }, { "epoch": 0.19, "learning_rate": 9.317459275460057e-06, "loss": 0.9057, "step": 8332 }, { "epoch": 0.19, "learning_rate": 9.317269842789297e-06, "loss": 0.8942, "step": 8333 }, { "epoch": 0.19, "learning_rate": 9.317080385760791e-06, "loss": 1.3218, "step": 8334 }, { "epoch": 0.19, "learning_rate": 9.316890904375612e-06, "loss": 0.8587, "step": 8335 }, { "epoch": 0.19, "learning_rate": 9.31670139863483e-06, "loss": 0.7959, "step": 8336 }, { "epoch": 0.19, "learning_rate": 9.31651186853951e-06, "loss": 1.1062, "step": 8337 }, { "epoch": 0.19, "learning_rate": 9.316322314090726e-06, "loss": 1.0209, "step": 8338 }, { "epoch": 0.19, "learning_rate": 9.316132735289543e-06, "loss": 1.0071, "step": 8339 }, { "epoch": 0.19, "learning_rate": 9.315943132137034e-06, "loss": 1.1287, "step": 8340 }, { "epoch": 0.19, "learning_rate": 9.315753504634267e-06, "loss": 1.1344, "step": 8341 }, { "epoch": 0.19, "learning_rate": 9.315563852782312e-06, "loss": 1.1925, "step": 8342 }, { "epoch": 0.19, "learning_rate": 9.31537417658224e-06, "loss": 0.7542, "step": 8343 }, { "epoch": 0.19, "learning_rate": 9.31518447603512e-06, "loss": 0.8346, "step": 8344 }, { "epoch": 0.19, "learning_rate": 9.314994751142023e-06, "loss": 1.2029, "step": 8345 }, { "epoch": 0.19, "learning_rate": 9.31480500190402e-06, "loss": 1.2579, "step": 8346 }, { "epoch": 0.19, "learning_rate": 9.31461522832218e-06, "loss": 0.8092, "step": 8347 }, { "epoch": 0.19, "learning_rate": 9.314425430397573e-06, "loss": 1.0673, "step": 8348 }, { "epoch": 0.19, "learning_rate": 9.314235608131272e-06, "loss": 0.6525, "step": 8349 }, { "epoch": 0.19, "learning_rate": 9.314045761524347e-06, "loss": 0.8341, "step": 8350 }, { "epoch": 0.19, "learning_rate": 9.31385589057787e-06, "loss": 1.3426, "step": 8351 }, { "epoch": 0.19, "learning_rate": 9.313665995292911e-06, "loss": 1.0628, "step": 8352 }, { "epoch": 0.19, "learning_rate": 9.313476075670543e-06, "loss": 1.0983, "step": 8353 }, { "epoch": 0.19, "learning_rate": 9.313286131711834e-06, "loss": 0.9825, "step": 8354 }, { "epoch": 0.19, "learning_rate": 9.31309616341786e-06, "loss": 0.9904, "step": 8355 }, { "epoch": 0.19, "learning_rate": 9.31290617078969e-06, "loss": 0.9069, "step": 8356 }, { "epoch": 0.19, "learning_rate": 9.312716153828397e-06, "loss": 0.9402, "step": 8357 }, { "epoch": 0.19, "learning_rate": 9.312526112535051e-06, "loss": 1.1296, "step": 8358 }, { "epoch": 0.19, "learning_rate": 9.31233604691073e-06, "loss": 0.8295, "step": 8359 }, { "epoch": 0.19, "learning_rate": 9.312145956956499e-06, "loss": 1.0532, "step": 8360 }, { "epoch": 0.19, "learning_rate": 9.311955842673435e-06, "loss": 0.8634, "step": 8361 }, { "epoch": 0.19, "learning_rate": 9.311765704062609e-06, "loss": 0.9934, "step": 8362 }, { "epoch": 0.19, "learning_rate": 9.311575541125095e-06, "loss": 0.6492, "step": 8363 }, { "epoch": 0.19, "learning_rate": 9.311385353861965e-06, "loss": 1.1128, "step": 8364 }, { "epoch": 0.19, "learning_rate": 9.311195142274292e-06, "loss": 1.1505, "step": 8365 }, { "epoch": 0.19, "learning_rate": 9.311004906363149e-06, "loss": 1.1058, "step": 8366 }, { "epoch": 0.19, "learning_rate": 9.31081464612961e-06, "loss": 1.1246, "step": 8367 }, { "epoch": 0.19, "learning_rate": 9.310624361574746e-06, "loss": 1.0947, "step": 8368 }, { "epoch": 0.19, "learning_rate": 9.310434052699633e-06, "loss": 1.0479, "step": 8369 }, { "epoch": 0.19, "learning_rate": 9.310243719505346e-06, "loss": 1.0214, "step": 8370 }, { "epoch": 0.19, "learning_rate": 9.310053361992956e-06, "loss": 1.0888, "step": 8371 }, { "epoch": 0.19, "learning_rate": 9.30986298016354e-06, "loss": 1.2043, "step": 8372 }, { "epoch": 0.19, "learning_rate": 9.309672574018169e-06, "loss": 1.2084, "step": 8373 }, { "epoch": 0.19, "learning_rate": 9.309482143557917e-06, "loss": 0.9868, "step": 8374 }, { "epoch": 0.19, "learning_rate": 9.309291688783862e-06, "loss": 0.859, "step": 8375 }, { "epoch": 0.19, "learning_rate": 9.309101209697075e-06, "loss": 0.8574, "step": 8376 }, { "epoch": 0.19, "learning_rate": 9.308910706298632e-06, "loss": 0.9654, "step": 8377 }, { "epoch": 0.19, "learning_rate": 9.30872017858961e-06, "loss": 1.1652, "step": 8378 }, { "epoch": 0.19, "learning_rate": 9.30852962657108e-06, "loss": 1.1953, "step": 8379 }, { "epoch": 0.19, "learning_rate": 9.30833905024412e-06, "loss": 0.8861, "step": 8380 }, { "epoch": 0.19, "learning_rate": 9.308148449609802e-06, "loss": 1.1391, "step": 8381 }, { "epoch": 0.19, "learning_rate": 9.307957824669204e-06, "loss": 0.8482, "step": 8382 }, { "epoch": 0.19, "learning_rate": 9.307767175423404e-06, "loss": 1.0239, "step": 8383 }, { "epoch": 0.19, "learning_rate": 9.307576501873472e-06, "loss": 1.1779, "step": 8384 }, { "epoch": 0.19, "learning_rate": 9.307385804020486e-06, "loss": 0.9924, "step": 8385 }, { "epoch": 0.19, "learning_rate": 9.307195081865524e-06, "loss": 0.8593, "step": 8386 }, { "epoch": 0.19, "learning_rate": 9.30700433540966e-06, "loss": 1.0306, "step": 8387 }, { "epoch": 0.19, "learning_rate": 9.30681356465397e-06, "loss": 1.1345, "step": 8388 }, { "epoch": 0.19, "learning_rate": 9.30662276959953e-06, "loss": 0.8978, "step": 8389 }, { "epoch": 0.19, "learning_rate": 9.306431950247418e-06, "loss": 1.0637, "step": 8390 }, { "epoch": 0.19, "learning_rate": 9.30624110659871e-06, "loss": 1.0485, "step": 8391 }, { "epoch": 0.19, "learning_rate": 9.306050238654483e-06, "loss": 0.977, "step": 8392 }, { "epoch": 0.19, "learning_rate": 9.305859346415813e-06, "loss": 1.0398, "step": 8393 }, { "epoch": 0.19, "learning_rate": 9.305668429883777e-06, "loss": 0.7933, "step": 8394 }, { "epoch": 0.19, "learning_rate": 9.305477489059452e-06, "loss": 0.7671, "step": 8395 }, { "epoch": 0.19, "learning_rate": 9.305286523943917e-06, "loss": 0.9752, "step": 8396 }, { "epoch": 0.19, "learning_rate": 9.305095534538249e-06, "loss": 1.1444, "step": 8397 }, { "epoch": 0.19, "learning_rate": 9.304904520843523e-06, "loss": 1.1336, "step": 8398 }, { "epoch": 0.19, "learning_rate": 9.30471348286082e-06, "loss": 1.0724, "step": 8399 }, { "epoch": 0.19, "learning_rate": 9.304522420591215e-06, "loss": 1.1997, "step": 8400 }, { "epoch": 0.19, "learning_rate": 9.30433133403579e-06, "loss": 0.9896, "step": 8401 }, { "epoch": 0.19, "learning_rate": 9.304140223195617e-06, "loss": 0.8297, "step": 8402 }, { "epoch": 0.19, "learning_rate": 9.30394908807178e-06, "loss": 0.8915, "step": 8403 }, { "epoch": 0.19, "learning_rate": 9.303757928665354e-06, "loss": 1.0606, "step": 8404 }, { "epoch": 0.19, "learning_rate": 9.303566744977417e-06, "loss": 0.9454, "step": 8405 }, { "epoch": 0.19, "learning_rate": 9.303375537009052e-06, "loss": 1.1942, "step": 8406 }, { "epoch": 0.19, "learning_rate": 9.303184304761333e-06, "loss": 1.0086, "step": 8407 }, { "epoch": 0.19, "learning_rate": 9.302993048235343e-06, "loss": 1.1072, "step": 8408 }, { "epoch": 0.2, "learning_rate": 9.302801767432156e-06, "loss": 1.0134, "step": 8409 }, { "epoch": 0.2, "learning_rate": 9.302610462352857e-06, "loss": 1.0632, "step": 8410 }, { "epoch": 0.2, "learning_rate": 9.302419132998521e-06, "loss": 1.1635, "step": 8411 }, { "epoch": 0.2, "learning_rate": 9.302227779370227e-06, "loss": 1.3039, "step": 8412 }, { "epoch": 0.2, "learning_rate": 9.30203640146906e-06, "loss": 0.9307, "step": 8413 }, { "epoch": 0.2, "learning_rate": 9.301844999296095e-06, "loss": 0.8687, "step": 8414 }, { "epoch": 0.2, "learning_rate": 9.301653572852412e-06, "loss": 0.992, "step": 8415 }, { "epoch": 0.2, "learning_rate": 9.301462122139093e-06, "loss": 1.1932, "step": 8416 }, { "epoch": 0.2, "learning_rate": 9.301270647157217e-06, "loss": 0.8466, "step": 8417 }, { "epoch": 0.2, "learning_rate": 9.301079147907866e-06, "loss": 1.0712, "step": 8418 }, { "epoch": 0.2, "learning_rate": 9.300887624392116e-06, "loss": 1.1809, "step": 8419 }, { "epoch": 0.2, "learning_rate": 9.300696076611053e-06, "loss": 0.8851, "step": 8420 }, { "epoch": 0.2, "learning_rate": 9.300504504565756e-06, "loss": 0.9718, "step": 8421 }, { "epoch": 0.2, "learning_rate": 9.300312908257303e-06, "loss": 1.0979, "step": 8422 }, { "epoch": 0.2, "learning_rate": 9.300121287686778e-06, "loss": 1.0953, "step": 8423 }, { "epoch": 0.2, "learning_rate": 9.29992964285526e-06, "loss": 0.9661, "step": 8424 }, { "epoch": 0.2, "learning_rate": 9.299737973763834e-06, "loss": 1.0395, "step": 8425 }, { "epoch": 0.2, "learning_rate": 9.299546280413578e-06, "loss": 0.8247, "step": 8426 }, { "epoch": 0.2, "learning_rate": 9.299354562805572e-06, "loss": 1.2922, "step": 8427 }, { "epoch": 0.2, "learning_rate": 9.299162820940902e-06, "loss": 1.0441, "step": 8428 }, { "epoch": 0.2, "learning_rate": 9.298971054820648e-06, "loss": 1.0843, "step": 8429 }, { "epoch": 0.2, "learning_rate": 9.29877926444589e-06, "loss": 0.9149, "step": 8430 }, { "epoch": 0.2, "learning_rate": 9.298587449817713e-06, "loss": 0.9884, "step": 8431 }, { "epoch": 0.2, "learning_rate": 9.2983956109372e-06, "loss": 0.9421, "step": 8432 }, { "epoch": 0.2, "learning_rate": 9.298203747805428e-06, "loss": 0.9356, "step": 8433 }, { "epoch": 0.2, "learning_rate": 9.298011860423484e-06, "loss": 0.8844, "step": 8434 }, { "epoch": 0.2, "learning_rate": 9.297819948792451e-06, "loss": 1.0874, "step": 8435 }, { "epoch": 0.2, "learning_rate": 9.297628012913407e-06, "loss": 0.9355, "step": 8436 }, { "epoch": 0.2, "learning_rate": 9.29743605278744e-06, "loss": 1.0482, "step": 8437 }, { "epoch": 0.2, "learning_rate": 9.297244068415632e-06, "loss": 0.9807, "step": 8438 }, { "epoch": 0.2, "learning_rate": 9.297052059799064e-06, "loss": 0.8641, "step": 8439 }, { "epoch": 0.2, "learning_rate": 9.29686002693882e-06, "loss": 0.9041, "step": 8440 }, { "epoch": 0.2, "learning_rate": 9.296667969835986e-06, "loss": 0.6946, "step": 8441 }, { "epoch": 0.2, "learning_rate": 9.296475888491642e-06, "loss": 1.0378, "step": 8442 }, { "epoch": 0.2, "learning_rate": 9.296283782906873e-06, "loss": 1.0932, "step": 8443 }, { "epoch": 0.2, "learning_rate": 9.296091653082764e-06, "loss": 1.0767, "step": 8444 }, { "epoch": 0.2, "learning_rate": 9.295899499020398e-06, "loss": 1.0024, "step": 8445 }, { "epoch": 0.2, "learning_rate": 9.295707320720859e-06, "loss": 0.7635, "step": 8446 }, { "epoch": 0.2, "learning_rate": 9.295515118185232e-06, "loss": 1.29, "step": 8447 }, { "epoch": 0.2, "learning_rate": 9.2953228914146e-06, "loss": 0.9712, "step": 8448 }, { "epoch": 0.2, "learning_rate": 9.295130640410048e-06, "loss": 0.985, "step": 8449 }, { "epoch": 0.2, "learning_rate": 9.294938365172663e-06, "loss": 0.9715, "step": 8450 }, { "epoch": 0.2, "learning_rate": 9.294746065703528e-06, "loss": 0.9094, "step": 8451 }, { "epoch": 0.2, "learning_rate": 9.294553742003725e-06, "loss": 1.0916, "step": 8452 }, { "epoch": 0.2, "learning_rate": 9.294361394074346e-06, "loss": 1.0749, "step": 8453 }, { "epoch": 0.2, "learning_rate": 9.294169021916468e-06, "loss": 1.3345, "step": 8454 }, { "epoch": 0.2, "learning_rate": 9.293976625531183e-06, "loss": 0.9621, "step": 8455 }, { "epoch": 0.2, "learning_rate": 9.293784204919573e-06, "loss": 1.0676, "step": 8456 }, { "epoch": 0.2, "learning_rate": 9.293591760082724e-06, "loss": 1.0609, "step": 8457 }, { "epoch": 0.2, "learning_rate": 9.293399291021724e-06, "loss": 0.9915, "step": 8458 }, { "epoch": 0.2, "learning_rate": 9.293206797737655e-06, "loss": 1.0298, "step": 8459 }, { "epoch": 0.2, "learning_rate": 9.293014280231607e-06, "loss": 0.9686, "step": 8460 }, { "epoch": 0.2, "learning_rate": 9.292821738504665e-06, "loss": 1.0347, "step": 8461 }, { "epoch": 0.2, "learning_rate": 9.292629172557912e-06, "loss": 0.8548, "step": 8462 }, { "epoch": 0.2, "learning_rate": 9.292436582392439e-06, "loss": 0.9478, "step": 8463 }, { "epoch": 0.2, "learning_rate": 9.292243968009332e-06, "loss": 0.6817, "step": 8464 }, { "epoch": 0.2, "learning_rate": 9.292051329409675e-06, "loss": 1.0361, "step": 8465 }, { "epoch": 0.2, "learning_rate": 9.291858666594557e-06, "loss": 0.7765, "step": 8466 }, { "epoch": 0.2, "learning_rate": 9.291665979565064e-06, "loss": 0.9276, "step": 8467 }, { "epoch": 0.2, "learning_rate": 9.291473268322282e-06, "loss": 1.0059, "step": 8468 }, { "epoch": 0.2, "learning_rate": 9.291280532867301e-06, "loss": 0.9665, "step": 8469 }, { "epoch": 0.2, "learning_rate": 9.291087773201208e-06, "loss": 1.0807, "step": 8470 }, { "epoch": 0.2, "learning_rate": 9.290894989325088e-06, "loss": 0.942, "step": 8471 }, { "epoch": 0.2, "learning_rate": 9.290702181240032e-06, "loss": 0.8538, "step": 8472 }, { "epoch": 0.2, "learning_rate": 9.290509348947125e-06, "loss": 0.9249, "step": 8473 }, { "epoch": 0.2, "learning_rate": 9.290316492447456e-06, "loss": 1.1118, "step": 8474 }, { "epoch": 0.2, "learning_rate": 9.290123611742115e-06, "loss": 0.9457, "step": 8475 }, { "epoch": 0.2, "learning_rate": 9.289930706832187e-06, "loss": 1.1329, "step": 8476 }, { "epoch": 0.2, "learning_rate": 9.289737777718762e-06, "loss": 0.8973, "step": 8477 }, { "epoch": 0.2, "learning_rate": 9.289544824402927e-06, "loss": 1.0095, "step": 8478 }, { "epoch": 0.2, "learning_rate": 9.289351846885772e-06, "loss": 1.2209, "step": 8479 }, { "epoch": 0.2, "learning_rate": 9.289158845168388e-06, "loss": 0.8804, "step": 8480 }, { "epoch": 0.2, "learning_rate": 9.28896581925186e-06, "loss": 1.0038, "step": 8481 }, { "epoch": 0.2, "learning_rate": 9.288772769137278e-06, "loss": 1.0869, "step": 8482 }, { "epoch": 0.2, "learning_rate": 9.288579694825731e-06, "loss": 1.2604, "step": 8483 }, { "epoch": 0.2, "learning_rate": 9.288386596318312e-06, "loss": 1.1799, "step": 8484 }, { "epoch": 0.2, "learning_rate": 9.288193473616107e-06, "loss": 0.9547, "step": 8485 }, { "epoch": 0.2, "learning_rate": 9.288000326720206e-06, "loss": 0.8387, "step": 8486 }, { "epoch": 0.2, "learning_rate": 9.287807155631696e-06, "loss": 0.8592, "step": 8487 }, { "epoch": 0.2, "learning_rate": 9.287613960351674e-06, "loss": 0.8118, "step": 8488 }, { "epoch": 0.2, "learning_rate": 9.287420740881221e-06, "loss": 0.8782, "step": 8489 }, { "epoch": 0.2, "learning_rate": 9.287227497221435e-06, "loss": 0.9006, "step": 8490 }, { "epoch": 0.2, "learning_rate": 9.287034229373402e-06, "loss": 1.2222, "step": 8491 }, { "epoch": 0.2, "learning_rate": 9.286840937338215e-06, "loss": 1.0731, "step": 8492 }, { "epoch": 0.2, "learning_rate": 9.286647621116962e-06, "loss": 0.8014, "step": 8493 }, { "epoch": 0.2, "learning_rate": 9.286454280710733e-06, "loss": 1.101, "step": 8494 }, { "epoch": 0.2, "learning_rate": 9.286260916120622e-06, "loss": 1.2009, "step": 8495 }, { "epoch": 0.2, "learning_rate": 9.28606752734772e-06, "loss": 0.9537, "step": 8496 }, { "epoch": 0.2, "learning_rate": 9.285874114393113e-06, "loss": 0.8834, "step": 8497 }, { "epoch": 0.2, "learning_rate": 9.285680677257897e-06, "loss": 0.9635, "step": 8498 }, { "epoch": 0.2, "learning_rate": 9.285487215943165e-06, "loss": 0.9902, "step": 8499 }, { "epoch": 0.2, "learning_rate": 9.285293730450002e-06, "loss": 1.0074, "step": 8500 }, { "epoch": 0.2, "learning_rate": 9.285100220779506e-06, "loss": 0.7166, "step": 8501 }, { "epoch": 0.2, "learning_rate": 9.284906686932764e-06, "loss": 1.1631, "step": 8502 }, { "epoch": 0.2, "learning_rate": 9.284713128910871e-06, "loss": 0.9136, "step": 8503 }, { "epoch": 0.2, "learning_rate": 9.284519546714918e-06, "loss": 1.0685, "step": 8504 }, { "epoch": 0.2, "learning_rate": 9.284325940345997e-06, "loss": 1.0019, "step": 8505 }, { "epoch": 0.2, "learning_rate": 9.2841323098052e-06, "loss": 1.0051, "step": 8506 }, { "epoch": 0.2, "learning_rate": 9.283938655093621e-06, "loss": 1.0264, "step": 8507 }, { "epoch": 0.2, "learning_rate": 9.28374497621235e-06, "loss": 0.9951, "step": 8508 }, { "epoch": 0.2, "learning_rate": 9.28355127316248e-06, "loss": 0.9705, "step": 8509 }, { "epoch": 0.2, "learning_rate": 9.283357545945109e-06, "loss": 1.0497, "step": 8510 }, { "epoch": 0.2, "learning_rate": 9.283163794561323e-06, "loss": 0.9798, "step": 8511 }, { "epoch": 0.2, "learning_rate": 9.28297001901222e-06, "loss": 0.8754, "step": 8512 }, { "epoch": 0.2, "learning_rate": 9.28277621929889e-06, "loss": 0.9306, "step": 8513 }, { "epoch": 0.2, "learning_rate": 9.282582395422431e-06, "loss": 1.1093, "step": 8514 }, { "epoch": 0.2, "learning_rate": 9.282388547383929e-06, "loss": 1.1874, "step": 8515 }, { "epoch": 0.2, "learning_rate": 9.282194675184485e-06, "loss": 1.0145, "step": 8516 }, { "epoch": 0.2, "learning_rate": 9.282000778825189e-06, "loss": 0.8264, "step": 8517 }, { "epoch": 0.2, "learning_rate": 9.281806858307137e-06, "loss": 1.0998, "step": 8518 }, { "epoch": 0.2, "learning_rate": 9.28161291363142e-06, "loss": 0.818, "step": 8519 }, { "epoch": 0.2, "learning_rate": 9.281418944799135e-06, "loss": 1.022, "step": 8520 }, { "epoch": 0.2, "learning_rate": 9.281224951811376e-06, "loss": 0.9828, "step": 8521 }, { "epoch": 0.2, "learning_rate": 9.281030934669238e-06, "loss": 1.0838, "step": 8522 }, { "epoch": 0.2, "learning_rate": 9.280836893373813e-06, "loss": 1.0422, "step": 8523 }, { "epoch": 0.2, "learning_rate": 9.280642827926197e-06, "loss": 1.2987, "step": 8524 }, { "epoch": 0.2, "learning_rate": 9.280448738327486e-06, "loss": 1.151, "step": 8525 }, { "epoch": 0.2, "learning_rate": 9.280254624578776e-06, "loss": 0.9268, "step": 8526 }, { "epoch": 0.2, "learning_rate": 9.280060486681157e-06, "loss": 1.0574, "step": 8527 }, { "epoch": 0.2, "learning_rate": 9.27986632463573e-06, "loss": 0.9182, "step": 8528 }, { "epoch": 0.2, "learning_rate": 9.27967213844359e-06, "loss": 0.7991, "step": 8529 }, { "epoch": 0.2, "learning_rate": 9.279477928105829e-06, "loss": 0.9312, "step": 8530 }, { "epoch": 0.2, "learning_rate": 9.279283693623544e-06, "loss": 1.0889, "step": 8531 }, { "epoch": 0.2, "learning_rate": 9.279089434997833e-06, "loss": 0.9949, "step": 8532 }, { "epoch": 0.2, "learning_rate": 9.27889515222979e-06, "loss": 1.1691, "step": 8533 }, { "epoch": 0.2, "learning_rate": 9.278700845320509e-06, "loss": 1.0423, "step": 8534 }, { "epoch": 0.2, "learning_rate": 9.278506514271093e-06, "loss": 0.925, "step": 8535 }, { "epoch": 0.2, "learning_rate": 9.278312159082632e-06, "loss": 1.0027, "step": 8536 }, { "epoch": 0.2, "learning_rate": 9.278117779756225e-06, "loss": 0.9106, "step": 8537 }, { "epoch": 0.2, "learning_rate": 9.277923376292968e-06, "loss": 1.1059, "step": 8538 }, { "epoch": 0.2, "learning_rate": 9.277728948693961e-06, "loss": 0.9065, "step": 8539 }, { "epoch": 0.2, "learning_rate": 9.277534496960295e-06, "loss": 0.9029, "step": 8540 }, { "epoch": 0.2, "learning_rate": 9.277340021093071e-06, "loss": 0.8714, "step": 8541 }, { "epoch": 0.2, "learning_rate": 9.277145521093386e-06, "loss": 1.1641, "step": 8542 }, { "epoch": 0.2, "learning_rate": 9.276950996962337e-06, "loss": 1.0037, "step": 8543 }, { "epoch": 0.2, "learning_rate": 9.276756448701023e-06, "loss": 0.9503, "step": 8544 }, { "epoch": 0.2, "learning_rate": 9.276561876310538e-06, "loss": 1.1465, "step": 8545 }, { "epoch": 0.2, "learning_rate": 9.276367279791982e-06, "loss": 1.0359, "step": 8546 }, { "epoch": 0.2, "learning_rate": 9.276172659146453e-06, "loss": 0.9086, "step": 8547 }, { "epoch": 0.2, "learning_rate": 9.275978014375049e-06, "loss": 1.1941, "step": 8548 }, { "epoch": 0.2, "learning_rate": 9.275783345478868e-06, "loss": 0.9869, "step": 8549 }, { "epoch": 0.2, "learning_rate": 9.275588652459007e-06, "loss": 0.9428, "step": 8550 }, { "epoch": 0.2, "learning_rate": 9.275393935316567e-06, "loss": 1.0708, "step": 8551 }, { "epoch": 0.2, "learning_rate": 9.275199194052644e-06, "loss": 1.0885, "step": 8552 }, { "epoch": 0.2, "learning_rate": 9.27500442866834e-06, "loss": 1.2637, "step": 8553 }, { "epoch": 0.2, "learning_rate": 9.274809639164751e-06, "loss": 0.8379, "step": 8554 }, { "epoch": 0.2, "learning_rate": 9.274614825542975e-06, "loss": 0.9914, "step": 8555 }, { "epoch": 0.2, "learning_rate": 9.274419987804113e-06, "loss": 0.9491, "step": 8556 }, { "epoch": 0.2, "learning_rate": 9.274225125949266e-06, "loss": 1.2918, "step": 8557 }, { "epoch": 0.2, "learning_rate": 9.274030239979532e-06, "loss": 0.8623, "step": 8558 }, { "epoch": 0.2, "learning_rate": 9.273835329896009e-06, "loss": 0.9599, "step": 8559 }, { "epoch": 0.2, "learning_rate": 9.273640395699796e-06, "loss": 1.1119, "step": 8560 }, { "epoch": 0.2, "learning_rate": 9.273445437391996e-06, "loss": 1.1117, "step": 8561 }, { "epoch": 0.2, "learning_rate": 9.273250454973708e-06, "loss": 1.4266, "step": 8562 }, { "epoch": 0.2, "learning_rate": 9.273055448446032e-06, "loss": 0.9928, "step": 8563 }, { "epoch": 0.2, "learning_rate": 9.272860417810068e-06, "loss": 1.0723, "step": 8564 }, { "epoch": 0.2, "learning_rate": 9.272665363066915e-06, "loss": 1.0373, "step": 8565 }, { "epoch": 0.2, "learning_rate": 9.272470284217675e-06, "loss": 0.8819, "step": 8566 }, { "epoch": 0.2, "learning_rate": 9.272275181263447e-06, "loss": 1.0076, "step": 8567 }, { "epoch": 0.2, "learning_rate": 9.272080054205336e-06, "loss": 0.8904, "step": 8568 }, { "epoch": 0.2, "learning_rate": 9.271884903044439e-06, "loss": 0.8179, "step": 8569 }, { "epoch": 0.2, "learning_rate": 9.271689727781857e-06, "loss": 1.022, "step": 8570 }, { "epoch": 0.2, "learning_rate": 9.271494528418691e-06, "loss": 0.9686, "step": 8571 }, { "epoch": 0.2, "learning_rate": 9.271299304956045e-06, "loss": 1.2722, "step": 8572 }, { "epoch": 0.2, "learning_rate": 9.27110405739502e-06, "loss": 0.9157, "step": 8573 }, { "epoch": 0.2, "learning_rate": 9.270908785736715e-06, "loss": 1.2042, "step": 8574 }, { "epoch": 0.2, "learning_rate": 9.270713489982232e-06, "loss": 0.9714, "step": 8575 }, { "epoch": 0.2, "learning_rate": 9.270518170132676e-06, "loss": 0.9564, "step": 8576 }, { "epoch": 0.2, "learning_rate": 9.270322826189145e-06, "loss": 0.8573, "step": 8577 }, { "epoch": 0.2, "learning_rate": 9.270127458152745e-06, "loss": 0.8688, "step": 8578 }, { "epoch": 0.2, "learning_rate": 9.269932066024577e-06, "loss": 0.9723, "step": 8579 }, { "epoch": 0.2, "learning_rate": 9.26973664980574e-06, "loss": 1.101, "step": 8580 }, { "epoch": 0.2, "learning_rate": 9.26954120949734e-06, "loss": 1.0208, "step": 8581 }, { "epoch": 0.2, "learning_rate": 9.26934574510048e-06, "loss": 0.8713, "step": 8582 }, { "epoch": 0.2, "learning_rate": 9.269150256616262e-06, "loss": 0.9995, "step": 8583 }, { "epoch": 0.2, "learning_rate": 9.268954744045787e-06, "loss": 1.09, "step": 8584 }, { "epoch": 0.2, "learning_rate": 9.26875920739016e-06, "loss": 0.9962, "step": 8585 }, { "epoch": 0.2, "learning_rate": 9.268563646650485e-06, "loss": 0.9591, "step": 8586 }, { "epoch": 0.2, "learning_rate": 9.268368061827864e-06, "loss": 0.9474, "step": 8587 }, { "epoch": 0.2, "learning_rate": 9.268172452923402e-06, "loss": 0.9664, "step": 8588 }, { "epoch": 0.2, "learning_rate": 9.267976819938197e-06, "loss": 0.8796, "step": 8589 }, { "epoch": 0.2, "learning_rate": 9.267781162873361e-06, "loss": 1.1629, "step": 8590 }, { "epoch": 0.2, "learning_rate": 9.267585481729992e-06, "loss": 1.2064, "step": 8591 }, { "epoch": 0.2, "learning_rate": 9.267389776509196e-06, "loss": 1.2502, "step": 8592 }, { "epoch": 0.2, "learning_rate": 9.267194047212078e-06, "loss": 1.0, "step": 8593 }, { "epoch": 0.2, "learning_rate": 9.266998293839743e-06, "loss": 1.057, "step": 8594 }, { "epoch": 0.2, "learning_rate": 9.266802516393292e-06, "loss": 0.8635, "step": 8595 }, { "epoch": 0.2, "learning_rate": 9.266606714873832e-06, "loss": 1.0008, "step": 8596 }, { "epoch": 0.2, "learning_rate": 9.266410889282467e-06, "loss": 0.8992, "step": 8597 }, { "epoch": 0.2, "learning_rate": 9.2662150396203e-06, "loss": 1.3147, "step": 8598 }, { "epoch": 0.2, "learning_rate": 9.26601916588844e-06, "loss": 1.0487, "step": 8599 }, { "epoch": 0.2, "learning_rate": 9.26582326808799e-06, "loss": 0.7445, "step": 8600 }, { "epoch": 0.2, "learning_rate": 9.265627346220056e-06, "loss": 1.008, "step": 8601 }, { "epoch": 0.2, "learning_rate": 9.265431400285742e-06, "loss": 1.0939, "step": 8602 }, { "epoch": 0.2, "learning_rate": 9.265235430286154e-06, "loss": 0.9999, "step": 8603 }, { "epoch": 0.2, "learning_rate": 9.265039436222397e-06, "loss": 1.1438, "step": 8604 }, { "epoch": 0.2, "learning_rate": 9.264843418095579e-06, "loss": 1.1185, "step": 8605 }, { "epoch": 0.2, "learning_rate": 9.264647375906803e-06, "loss": 0.9948, "step": 8606 }, { "epoch": 0.2, "learning_rate": 9.264451309657177e-06, "loss": 1.3481, "step": 8607 }, { "epoch": 0.2, "learning_rate": 9.264255219347809e-06, "loss": 1.1627, "step": 8608 }, { "epoch": 0.2, "learning_rate": 9.2640591049798e-06, "loss": 0.9557, "step": 8609 }, { "epoch": 0.2, "learning_rate": 9.263862966554262e-06, "loss": 0.8885, "step": 8610 }, { "epoch": 0.2, "learning_rate": 9.263666804072298e-06, "loss": 1.1428, "step": 8611 }, { "epoch": 0.2, "learning_rate": 9.263470617535015e-06, "loss": 0.863, "step": 8612 }, { "epoch": 0.2, "learning_rate": 9.263274406943522e-06, "loss": 1.26, "step": 8613 }, { "epoch": 0.2, "learning_rate": 9.263078172298925e-06, "loss": 1.1197, "step": 8614 }, { "epoch": 0.2, "learning_rate": 9.262881913602331e-06, "loss": 0.9966, "step": 8615 }, { "epoch": 0.2, "learning_rate": 9.262685630854846e-06, "loss": 1.2628, "step": 8616 }, { "epoch": 0.2, "learning_rate": 9.26248932405758e-06, "loss": 0.827, "step": 8617 }, { "epoch": 0.2, "learning_rate": 9.262292993211638e-06, "loss": 0.8086, "step": 8618 }, { "epoch": 0.2, "learning_rate": 9.26209663831813e-06, "loss": 1.1538, "step": 8619 }, { "epoch": 0.2, "learning_rate": 9.26190025937816e-06, "loss": 0.9385, "step": 8620 }, { "epoch": 0.2, "learning_rate": 9.261703856392842e-06, "loss": 0.9223, "step": 8621 }, { "epoch": 0.2, "learning_rate": 9.26150742936328e-06, "loss": 1.1122, "step": 8622 }, { "epoch": 0.2, "learning_rate": 9.26131097829058e-06, "loss": 1.0898, "step": 8623 }, { "epoch": 0.2, "learning_rate": 9.261114503175857e-06, "loss": 1.0215, "step": 8624 }, { "epoch": 0.2, "learning_rate": 9.260918004020214e-06, "loss": 1.0312, "step": 8625 }, { "epoch": 0.2, "learning_rate": 9.260721480824763e-06, "loss": 1.0305, "step": 8626 }, { "epoch": 0.2, "learning_rate": 9.260524933590608e-06, "loss": 1.0443, "step": 8627 }, { "epoch": 0.2, "learning_rate": 9.260328362318865e-06, "loss": 1.1267, "step": 8628 }, { "epoch": 0.2, "learning_rate": 9.260131767010637e-06, "loss": 0.9305, "step": 8629 }, { "epoch": 0.2, "learning_rate": 9.259935147667037e-06, "loss": 1.0137, "step": 8630 }, { "epoch": 0.2, "learning_rate": 9.25973850428917e-06, "loss": 0.9908, "step": 8631 }, { "epoch": 0.2, "learning_rate": 9.25954183687815e-06, "loss": 1.2124, "step": 8632 }, { "epoch": 0.2, "learning_rate": 9.259345145435084e-06, "loss": 0.8639, "step": 8633 }, { "epoch": 0.2, "learning_rate": 9.259148429961082e-06, "loss": 1.017, "step": 8634 }, { "epoch": 0.2, "learning_rate": 9.258951690457257e-06, "loss": 1.1784, "step": 8635 }, { "epoch": 0.2, "learning_rate": 9.258754926924713e-06, "loss": 1.2677, "step": 8636 }, { "epoch": 0.2, "learning_rate": 9.258558139364563e-06, "loss": 0.9388, "step": 8637 }, { "epoch": 0.2, "learning_rate": 9.258361327777921e-06, "loss": 1.0608, "step": 8638 }, { "epoch": 0.2, "learning_rate": 9.25816449216589e-06, "loss": 1.0374, "step": 8639 }, { "epoch": 0.2, "learning_rate": 9.257967632529588e-06, "loss": 1.0769, "step": 8640 }, { "epoch": 0.2, "learning_rate": 9.25777074887012e-06, "loss": 1.093, "step": 8641 }, { "epoch": 0.2, "learning_rate": 9.257573841188602e-06, "loss": 0.9679, "step": 8642 }, { "epoch": 0.2, "learning_rate": 9.25737690948614e-06, "loss": 0.9456, "step": 8643 }, { "epoch": 0.2, "learning_rate": 9.257179953763846e-06, "loss": 0.9089, "step": 8644 }, { "epoch": 0.2, "learning_rate": 9.256982974022834e-06, "loss": 1.1831, "step": 8645 }, { "epoch": 0.2, "learning_rate": 9.256785970264213e-06, "loss": 1.0703, "step": 8646 }, { "epoch": 0.2, "learning_rate": 9.256588942489096e-06, "loss": 1.1513, "step": 8647 }, { "epoch": 0.2, "learning_rate": 9.256391890698592e-06, "loss": 1.0611, "step": 8648 }, { "epoch": 0.2, "learning_rate": 9.256194814893815e-06, "loss": 1.2413, "step": 8649 }, { "epoch": 0.2, "learning_rate": 9.255997715075877e-06, "loss": 0.9986, "step": 8650 }, { "epoch": 0.2, "learning_rate": 9.255800591245889e-06, "loss": 1.254, "step": 8651 }, { "epoch": 0.2, "learning_rate": 9.255603443404963e-06, "loss": 1.0352, "step": 8652 }, { "epoch": 0.2, "learning_rate": 9.255406271554214e-06, "loss": 0.785, "step": 8653 }, { "epoch": 0.2, "learning_rate": 9.25520907569475e-06, "loss": 1.089, "step": 8654 }, { "epoch": 0.2, "learning_rate": 9.255011855827687e-06, "loss": 1.0663, "step": 8655 }, { "epoch": 0.2, "learning_rate": 9.254814611954137e-06, "loss": 0.7287, "step": 8656 }, { "epoch": 0.2, "learning_rate": 9.254617344075211e-06, "loss": 0.7964, "step": 8657 }, { "epoch": 0.2, "learning_rate": 9.254420052192024e-06, "loss": 0.8562, "step": 8658 }, { "epoch": 0.2, "learning_rate": 9.254222736305687e-06, "loss": 0.9079, "step": 8659 }, { "epoch": 0.2, "learning_rate": 9.254025396417316e-06, "loss": 1.0207, "step": 8660 }, { "epoch": 0.2, "learning_rate": 9.253828032528023e-06, "loss": 0.8401, "step": 8661 }, { "epoch": 0.2, "learning_rate": 9.253630644638922e-06, "loss": 1.0363, "step": 8662 }, { "epoch": 0.2, "learning_rate": 9.253433232751126e-06, "loss": 0.9792, "step": 8663 }, { "epoch": 0.2, "learning_rate": 9.25323579686575e-06, "loss": 0.957, "step": 8664 }, { "epoch": 0.2, "learning_rate": 9.253038336983904e-06, "loss": 1.0332, "step": 8665 }, { "epoch": 0.2, "learning_rate": 9.252840853106709e-06, "loss": 0.9252, "step": 8666 }, { "epoch": 0.2, "learning_rate": 9.252643345235272e-06, "loss": 1.0552, "step": 8667 }, { "epoch": 0.2, "learning_rate": 9.252445813370712e-06, "loss": 0.9931, "step": 8668 }, { "epoch": 0.2, "learning_rate": 9.25224825751414e-06, "loss": 0.8469, "step": 8669 }, { "epoch": 0.2, "learning_rate": 9.252050677666676e-06, "loss": 0.9419, "step": 8670 }, { "epoch": 0.2, "learning_rate": 9.251853073829428e-06, "loss": 0.8676, "step": 8671 }, { "epoch": 0.2, "learning_rate": 9.251655446003516e-06, "loss": 0.9302, "step": 8672 }, { "epoch": 0.2, "learning_rate": 9.251457794190053e-06, "loss": 1.1521, "step": 8673 }, { "epoch": 0.2, "learning_rate": 9.251260118390154e-06, "loss": 0.9922, "step": 8674 }, { "epoch": 0.2, "learning_rate": 9.251062418604934e-06, "loss": 0.9522, "step": 8675 }, { "epoch": 0.2, "learning_rate": 9.250864694835509e-06, "loss": 0.8313, "step": 8676 }, { "epoch": 0.2, "learning_rate": 9.250666947082996e-06, "loss": 0.9737, "step": 8677 }, { "epoch": 0.2, "learning_rate": 9.25046917534851e-06, "loss": 1.2137, "step": 8678 }, { "epoch": 0.2, "learning_rate": 9.250271379633163e-06, "loss": 1.0032, "step": 8679 }, { "epoch": 0.2, "learning_rate": 9.250073559938075e-06, "loss": 0.9317, "step": 8680 }, { "epoch": 0.2, "learning_rate": 9.249875716264361e-06, "loss": 0.966, "step": 8681 }, { "epoch": 0.2, "learning_rate": 9.249677848613137e-06, "loss": 1.1369, "step": 8682 }, { "epoch": 0.2, "learning_rate": 9.249479956985521e-06, "loss": 0.919, "step": 8683 }, { "epoch": 0.2, "learning_rate": 9.249282041382629e-06, "loss": 1.1045, "step": 8684 }, { "epoch": 0.2, "learning_rate": 9.249084101805575e-06, "loss": 0.8694, "step": 8685 }, { "epoch": 0.2, "learning_rate": 9.248886138255478e-06, "loss": 0.9447, "step": 8686 }, { "epoch": 0.2, "learning_rate": 9.248688150733454e-06, "loss": 1.1355, "step": 8687 }, { "epoch": 0.2, "learning_rate": 9.24849013924062e-06, "loss": 1.1315, "step": 8688 }, { "epoch": 0.2, "learning_rate": 9.248292103778095e-06, "loss": 1.133, "step": 8689 }, { "epoch": 0.2, "learning_rate": 9.248094044346993e-06, "loss": 1.0105, "step": 8690 }, { "epoch": 0.2, "learning_rate": 9.247895960948434e-06, "loss": 1.0298, "step": 8691 }, { "epoch": 0.2, "learning_rate": 9.247697853583536e-06, "loss": 1.0676, "step": 8692 }, { "epoch": 0.2, "learning_rate": 9.247499722253415e-06, "loss": 1.0911, "step": 8693 }, { "epoch": 0.2, "learning_rate": 9.24730156695919e-06, "loss": 1.0303, "step": 8694 }, { "epoch": 0.2, "learning_rate": 9.247103387701977e-06, "loss": 1.1271, "step": 8695 }, { "epoch": 0.2, "learning_rate": 9.246905184482897e-06, "loss": 0.8832, "step": 8696 }, { "epoch": 0.2, "learning_rate": 9.246706957303066e-06, "loss": 0.9199, "step": 8697 }, { "epoch": 0.2, "learning_rate": 9.246508706163603e-06, "loss": 1.0436, "step": 8698 }, { "epoch": 0.2, "learning_rate": 9.246310431065628e-06, "loss": 0.82, "step": 8699 }, { "epoch": 0.2, "learning_rate": 9.246112132010258e-06, "loss": 0.867, "step": 8700 }, { "epoch": 0.2, "learning_rate": 9.245913808998613e-06, "loss": 0.8731, "step": 8701 }, { "epoch": 0.2, "learning_rate": 9.24571546203181e-06, "loss": 0.9794, "step": 8702 }, { "epoch": 0.2, "learning_rate": 9.24551709111097e-06, "loss": 1.0197, "step": 8703 }, { "epoch": 0.2, "learning_rate": 9.245318696237208e-06, "loss": 1.0878, "step": 8704 }, { "epoch": 0.2, "learning_rate": 9.24512027741165e-06, "loss": 0.8098, "step": 8705 }, { "epoch": 0.2, "learning_rate": 9.244921834635412e-06, "loss": 1.1095, "step": 8706 }, { "epoch": 0.2, "learning_rate": 9.244723367909612e-06, "loss": 1.0232, "step": 8707 }, { "epoch": 0.2, "learning_rate": 9.244524877235374e-06, "loss": 0.7183, "step": 8708 }, { "epoch": 0.2, "learning_rate": 9.244326362613814e-06, "loss": 1.0246, "step": 8709 }, { "epoch": 0.2, "learning_rate": 9.244127824046053e-06, "loss": 0.9812, "step": 8710 }, { "epoch": 0.2, "learning_rate": 9.24392926153321e-06, "loss": 0.9514, "step": 8711 }, { "epoch": 0.2, "learning_rate": 9.24373067507641e-06, "loss": 1.0619, "step": 8712 }, { "epoch": 0.2, "learning_rate": 9.24353206467677e-06, "loss": 1.0611, "step": 8713 }, { "epoch": 0.2, "learning_rate": 9.243333430335408e-06, "loss": 0.7999, "step": 8714 }, { "epoch": 0.2, "learning_rate": 9.243134772053451e-06, "loss": 0.9817, "step": 8715 }, { "epoch": 0.2, "learning_rate": 9.242936089832013e-06, "loss": 1.1018, "step": 8716 }, { "epoch": 0.2, "learning_rate": 9.24273738367222e-06, "loss": 0.9604, "step": 8717 }, { "epoch": 0.2, "learning_rate": 9.24253865357519e-06, "loss": 1.0454, "step": 8718 }, { "epoch": 0.2, "learning_rate": 9.242339899542046e-06, "loss": 0.9873, "step": 8719 }, { "epoch": 0.2, "learning_rate": 9.242141121573908e-06, "loss": 1.1096, "step": 8720 }, { "epoch": 0.2, "learning_rate": 9.2419423196719e-06, "loss": 1.299, "step": 8721 }, { "epoch": 0.2, "learning_rate": 9.241743493837141e-06, "loss": 0.783, "step": 8722 }, { "epoch": 0.2, "learning_rate": 9.241544644070754e-06, "loss": 0.9662, "step": 8723 }, { "epoch": 0.2, "learning_rate": 9.241345770373862e-06, "loss": 1.1554, "step": 8724 }, { "epoch": 0.2, "learning_rate": 9.241146872747585e-06, "loss": 0.9409, "step": 8725 }, { "epoch": 0.2, "learning_rate": 9.240947951193045e-06, "loss": 1.0014, "step": 8726 }, { "epoch": 0.2, "learning_rate": 9.240749005711365e-06, "loss": 1.0444, "step": 8727 }, { "epoch": 0.2, "learning_rate": 9.240550036303667e-06, "loss": 0.9606, "step": 8728 }, { "epoch": 0.2, "learning_rate": 9.240351042971076e-06, "loss": 1.63, "step": 8729 }, { "epoch": 0.2, "learning_rate": 9.240152025714711e-06, "loss": 1.0707, "step": 8730 }, { "epoch": 0.2, "learning_rate": 9.239952984535697e-06, "loss": 1.1402, "step": 8731 }, { "epoch": 0.2, "learning_rate": 9.239753919435158e-06, "loss": 1.0593, "step": 8732 }, { "epoch": 0.2, "learning_rate": 9.239554830414215e-06, "loss": 1.0848, "step": 8733 }, { "epoch": 0.2, "learning_rate": 9.239355717473993e-06, "loss": 1.032, "step": 8734 }, { "epoch": 0.2, "learning_rate": 9.239156580615611e-06, "loss": 0.9392, "step": 8735 }, { "epoch": 0.2, "learning_rate": 9.238957419840198e-06, "loss": 1.0436, "step": 8736 }, { "epoch": 0.2, "learning_rate": 9.238758235148878e-06, "loss": 0.9747, "step": 8737 }, { "epoch": 0.2, "learning_rate": 9.23855902654277e-06, "loss": 1.2198, "step": 8738 }, { "epoch": 0.2, "learning_rate": 9.238359794023e-06, "loss": 0.8818, "step": 8739 }, { "epoch": 0.2, "learning_rate": 9.238160537590693e-06, "loss": 1.1105, "step": 8740 }, { "epoch": 0.2, "learning_rate": 9.237961257246973e-06, "loss": 1.0766, "step": 8741 }, { "epoch": 0.2, "learning_rate": 9.237761952992962e-06, "loss": 0.9333, "step": 8742 }, { "epoch": 0.2, "learning_rate": 9.237562624829788e-06, "loss": 1.1153, "step": 8743 }, { "epoch": 0.2, "learning_rate": 9.237363272758573e-06, "loss": 1.0272, "step": 8744 }, { "epoch": 0.2, "learning_rate": 9.237163896780443e-06, "loss": 0.8042, "step": 8745 }, { "epoch": 0.2, "learning_rate": 9.236964496896523e-06, "loss": 0.9509, "step": 8746 }, { "epoch": 0.2, "learning_rate": 9.236765073107937e-06, "loss": 0.9829, "step": 8747 }, { "epoch": 0.2, "learning_rate": 9.236565625415811e-06, "loss": 1.0555, "step": 8748 }, { "epoch": 0.2, "learning_rate": 9.23636615382127e-06, "loss": 1.1195, "step": 8749 }, { "epoch": 0.2, "learning_rate": 9.236166658325438e-06, "loss": 0.9542, "step": 8750 }, { "epoch": 0.2, "learning_rate": 9.235967138929444e-06, "loss": 1.0191, "step": 8751 }, { "epoch": 0.2, "learning_rate": 9.235767595634409e-06, "loss": 1.1233, "step": 8752 }, { "epoch": 0.2, "learning_rate": 9.235568028441463e-06, "loss": 1.0971, "step": 8753 }, { "epoch": 0.2, "learning_rate": 9.23536843735173e-06, "loss": 1.0442, "step": 8754 }, { "epoch": 0.2, "learning_rate": 9.235168822366337e-06, "loss": 0.87, "step": 8755 }, { "epoch": 0.2, "learning_rate": 9.234969183486409e-06, "loss": 0.9385, "step": 8756 }, { "epoch": 0.2, "learning_rate": 9.234769520713073e-06, "loss": 1.1883, "step": 8757 }, { "epoch": 0.2, "learning_rate": 9.234569834047456e-06, "loss": 0.8661, "step": 8758 }, { "epoch": 0.2, "learning_rate": 9.234370123490682e-06, "loss": 1.017, "step": 8759 }, { "epoch": 0.2, "learning_rate": 9.234170389043881e-06, "loss": 1.0707, "step": 8760 }, { "epoch": 0.2, "learning_rate": 9.23397063070818e-06, "loss": 1.3161, "step": 8761 }, { "epoch": 0.2, "learning_rate": 9.233770848484702e-06, "loss": 0.8853, "step": 8762 }, { "epoch": 0.2, "learning_rate": 9.233571042374578e-06, "loss": 0.7523, "step": 8763 }, { "epoch": 0.2, "learning_rate": 9.233371212378935e-06, "loss": 0.7882, "step": 8764 }, { "epoch": 0.2, "learning_rate": 9.2331713584989e-06, "loss": 1.1084, "step": 8765 }, { "epoch": 0.2, "learning_rate": 9.2329714807356e-06, "loss": 1.1549, "step": 8766 }, { "epoch": 0.2, "learning_rate": 9.232771579090161e-06, "loss": 1.0816, "step": 8767 }, { "epoch": 0.2, "learning_rate": 9.232571653563713e-06, "loss": 0.8756, "step": 8768 }, { "epoch": 0.2, "learning_rate": 9.232371704157385e-06, "loss": 1.2157, "step": 8769 }, { "epoch": 0.2, "learning_rate": 9.232171730872304e-06, "loss": 0.9232, "step": 8770 }, { "epoch": 0.2, "learning_rate": 9.231971733709596e-06, "loss": 0.9337, "step": 8771 }, { "epoch": 0.2, "learning_rate": 9.231771712670392e-06, "loss": 1.0133, "step": 8772 }, { "epoch": 0.2, "learning_rate": 9.23157166775582e-06, "loss": 1.0779, "step": 8773 }, { "epoch": 0.2, "learning_rate": 9.23137159896701e-06, "loss": 0.9408, "step": 8774 }, { "epoch": 0.2, "learning_rate": 9.231171506305087e-06, "loss": 1.2001, "step": 8775 }, { "epoch": 0.2, "learning_rate": 9.230971389771183e-06, "loss": 1.1896, "step": 8776 }, { "epoch": 0.2, "learning_rate": 9.230771249366427e-06, "loss": 1.0649, "step": 8777 }, { "epoch": 0.2, "learning_rate": 9.230571085091946e-06, "loss": 0.9362, "step": 8778 }, { "epoch": 0.2, "learning_rate": 9.230370896948872e-06, "loss": 0.8628, "step": 8779 }, { "epoch": 0.2, "learning_rate": 9.230170684938334e-06, "loss": 0.8784, "step": 8780 }, { "epoch": 0.2, "learning_rate": 9.229970449061459e-06, "loss": 1.1947, "step": 8781 }, { "epoch": 0.2, "learning_rate": 9.229770189319377e-06, "loss": 0.6924, "step": 8782 }, { "epoch": 0.2, "learning_rate": 9.229569905713222e-06, "loss": 1.0448, "step": 8783 }, { "epoch": 0.2, "learning_rate": 9.22936959824412e-06, "loss": 0.9757, "step": 8784 }, { "epoch": 0.2, "learning_rate": 9.229169266913202e-06, "loss": 0.9538, "step": 8785 }, { "epoch": 0.2, "learning_rate": 9.2289689117216e-06, "loss": 1.2209, "step": 8786 }, { "epoch": 0.2, "learning_rate": 9.228768532670443e-06, "loss": 0.6676, "step": 8787 }, { "epoch": 0.2, "learning_rate": 9.22856812976086e-06, "loss": 1.127, "step": 8788 }, { "epoch": 0.2, "learning_rate": 9.228367702993986e-06, "loss": 1.0768, "step": 8789 }, { "epoch": 0.2, "learning_rate": 9.228167252370946e-06, "loss": 1.2284, "step": 8790 }, { "epoch": 0.2, "learning_rate": 9.227966777892876e-06, "loss": 0.8986, "step": 8791 }, { "epoch": 0.2, "learning_rate": 9.227766279560904e-06, "loss": 1.208, "step": 8792 }, { "epoch": 0.2, "learning_rate": 9.227565757376162e-06, "loss": 1.0707, "step": 8793 }, { "epoch": 0.2, "learning_rate": 9.227365211339782e-06, "loss": 1.4003, "step": 8794 }, { "epoch": 0.2, "learning_rate": 9.227164641452896e-06, "loss": 0.9503, "step": 8795 }, { "epoch": 0.2, "learning_rate": 9.226964047716634e-06, "loss": 1.0126, "step": 8796 }, { "epoch": 0.2, "learning_rate": 9.226763430132128e-06, "loss": 0.9672, "step": 8797 }, { "epoch": 0.2, "learning_rate": 9.22656278870051e-06, "loss": 0.8823, "step": 8798 }, { "epoch": 0.2, "learning_rate": 9.226362123422914e-06, "loss": 0.9185, "step": 8799 }, { "epoch": 0.2, "learning_rate": 9.226161434300467e-06, "loss": 0.7484, "step": 8800 }, { "epoch": 0.2, "learning_rate": 9.225960721334307e-06, "loss": 0.9952, "step": 8801 }, { "epoch": 0.2, "learning_rate": 9.225759984525565e-06, "loss": 1.0012, "step": 8802 }, { "epoch": 0.2, "learning_rate": 9.22555922387537e-06, "loss": 0.8515, "step": 8803 }, { "epoch": 0.2, "learning_rate": 9.22535843938486e-06, "loss": 0.8182, "step": 8804 }, { "epoch": 0.2, "learning_rate": 9.225157631055163e-06, "loss": 1.0646, "step": 8805 }, { "epoch": 0.2, "learning_rate": 9.224956798887415e-06, "loss": 0.8951, "step": 8806 }, { "epoch": 0.2, "learning_rate": 9.224755942882745e-06, "loss": 1.2194, "step": 8807 }, { "epoch": 0.2, "learning_rate": 9.224555063042294e-06, "loss": 0.7869, "step": 8808 }, { "epoch": 0.2, "learning_rate": 9.224354159367187e-06, "loss": 1.134, "step": 8809 }, { "epoch": 0.2, "learning_rate": 9.224153231858566e-06, "loss": 1.0361, "step": 8810 }, { "epoch": 0.2, "learning_rate": 9.223952280517556e-06, "loss": 1.1302, "step": 8811 }, { "epoch": 0.2, "learning_rate": 9.223751305345295e-06, "loss": 1.0322, "step": 8812 }, { "epoch": 0.2, "learning_rate": 9.223550306342917e-06, "loss": 1.0122, "step": 8813 }, { "epoch": 0.2, "learning_rate": 9.223349283511556e-06, "loss": 1.1232, "step": 8814 }, { "epoch": 0.2, "learning_rate": 9.223148236852345e-06, "loss": 0.9122, "step": 8815 }, { "epoch": 0.2, "learning_rate": 9.222947166366418e-06, "loss": 1.0729, "step": 8816 }, { "epoch": 0.2, "learning_rate": 9.22274607205491e-06, "loss": 1.1625, "step": 8817 }, { "epoch": 0.2, "learning_rate": 9.222544953918958e-06, "loss": 1.0948, "step": 8818 }, { "epoch": 0.2, "learning_rate": 9.222343811959694e-06, "loss": 0.767, "step": 8819 }, { "epoch": 0.2, "learning_rate": 9.222142646178253e-06, "loss": 0.8898, "step": 8820 }, { "epoch": 0.2, "learning_rate": 9.221941456575771e-06, "loss": 1.0375, "step": 8821 }, { "epoch": 0.2, "learning_rate": 9.22174024315338e-06, "loss": 0.8908, "step": 8822 }, { "epoch": 0.2, "learning_rate": 9.221539005912222e-06, "loss": 0.8241, "step": 8823 }, { "epoch": 0.2, "learning_rate": 9.221337744853425e-06, "loss": 1.0533, "step": 8824 }, { "epoch": 0.2, "learning_rate": 9.221136459978129e-06, "loss": 1.1262, "step": 8825 }, { "epoch": 0.2, "learning_rate": 9.220935151287466e-06, "loss": 1.2748, "step": 8826 }, { "epoch": 0.2, "learning_rate": 9.220733818782574e-06, "loss": 0.9683, "step": 8827 }, { "epoch": 0.2, "learning_rate": 9.22053246246459e-06, "loss": 1.0967, "step": 8828 }, { "epoch": 0.2, "learning_rate": 9.22033108233465e-06, "loss": 0.9763, "step": 8829 }, { "epoch": 0.2, "learning_rate": 9.22012967839389e-06, "loss": 0.9283, "step": 8830 }, { "epoch": 0.2, "learning_rate": 9.219928250643444e-06, "loss": 1.0872, "step": 8831 }, { "epoch": 0.2, "learning_rate": 9.219726799084449e-06, "loss": 1.1725, "step": 8832 }, { "epoch": 0.2, "learning_rate": 9.219525323718043e-06, "loss": 0.9532, "step": 8833 }, { "epoch": 0.2, "learning_rate": 9.219323824545362e-06, "loss": 0.8733, "step": 8834 }, { "epoch": 0.2, "learning_rate": 9.219122301567542e-06, "loss": 1.0925, "step": 8835 }, { "epoch": 0.2, "learning_rate": 9.218920754785723e-06, "loss": 1.0335, "step": 8836 }, { "epoch": 0.2, "learning_rate": 9.218719184201039e-06, "loss": 1.4022, "step": 8837 }, { "epoch": 0.2, "learning_rate": 9.218517589814628e-06, "loss": 1.2228, "step": 8838 }, { "epoch": 0.2, "learning_rate": 9.21831597162763e-06, "loss": 1.0857, "step": 8839 }, { "epoch": 0.21, "learning_rate": 9.218114329641177e-06, "loss": 0.9287, "step": 8840 }, { "epoch": 0.21, "learning_rate": 9.217912663856412e-06, "loss": 1.104, "step": 8841 }, { "epoch": 0.21, "learning_rate": 9.21771097427447e-06, "loss": 0.9424, "step": 8842 }, { "epoch": 0.21, "learning_rate": 9.217509260896489e-06, "loss": 0.8076, "step": 8843 }, { "epoch": 0.21, "learning_rate": 9.217307523723609e-06, "loss": 1.0301, "step": 8844 }, { "epoch": 0.21, "learning_rate": 9.217105762756966e-06, "loss": 0.8194, "step": 8845 }, { "epoch": 0.21, "learning_rate": 9.216903977997698e-06, "loss": 1.0267, "step": 8846 }, { "epoch": 0.21, "learning_rate": 9.216702169446947e-06, "loss": 1.0158, "step": 8847 }, { "epoch": 0.21, "learning_rate": 9.216500337105847e-06, "loss": 0.8446, "step": 8848 }, { "epoch": 0.21, "learning_rate": 9.216298480975541e-06, "loss": 0.9986, "step": 8849 }, { "epoch": 0.21, "learning_rate": 9.216096601057163e-06, "loss": 0.9908, "step": 8850 }, { "epoch": 0.21, "learning_rate": 9.215894697351857e-06, "loss": 1.0123, "step": 8851 }, { "epoch": 0.21, "learning_rate": 9.215692769860758e-06, "loss": 0.7278, "step": 8852 }, { "epoch": 0.21, "learning_rate": 9.21549081858501e-06, "loss": 1.1472, "step": 8853 }, { "epoch": 0.21, "learning_rate": 9.215288843525747e-06, "loss": 0.8247, "step": 8854 }, { "epoch": 0.21, "learning_rate": 9.215086844684112e-06, "loss": 1.0106, "step": 8855 }, { "epoch": 0.21, "learning_rate": 9.214884822061244e-06, "loss": 0.8538, "step": 8856 }, { "epoch": 0.21, "learning_rate": 9.214682775658283e-06, "loss": 0.875, "step": 8857 }, { "epoch": 0.21, "learning_rate": 9.214480705476367e-06, "loss": 1.1186, "step": 8858 }, { "epoch": 0.21, "learning_rate": 9.214278611516638e-06, "loss": 0.8488, "step": 8859 }, { "epoch": 0.21, "learning_rate": 9.214076493780235e-06, "loss": 1.0036, "step": 8860 }, { "epoch": 0.21, "learning_rate": 9.213874352268301e-06, "loss": 0.9645, "step": 8861 }, { "epoch": 0.21, "learning_rate": 9.213672186981974e-06, "loss": 0.9777, "step": 8862 }, { "epoch": 0.21, "learning_rate": 9.213469997922395e-06, "loss": 0.7171, "step": 8863 }, { "epoch": 0.21, "learning_rate": 9.213267785090704e-06, "loss": 0.9546, "step": 8864 }, { "epoch": 0.21, "learning_rate": 9.213065548488042e-06, "loss": 0.957, "step": 8865 }, { "epoch": 0.21, "learning_rate": 9.212863288115552e-06, "loss": 0.7293, "step": 8866 }, { "epoch": 0.21, "learning_rate": 9.212661003974374e-06, "loss": 0.9689, "step": 8867 }, { "epoch": 0.21, "learning_rate": 9.212458696065649e-06, "loss": 0.9045, "step": 8868 }, { "epoch": 0.21, "learning_rate": 9.212256364390519e-06, "loss": 1.0803, "step": 8869 }, { "epoch": 0.21, "learning_rate": 9.212054008950125e-06, "loss": 0.8793, "step": 8870 }, { "epoch": 0.21, "learning_rate": 9.21185162974561e-06, "loss": 1.2089, "step": 8871 }, { "epoch": 0.21, "learning_rate": 9.211649226778112e-06, "loss": 1.1666, "step": 8872 }, { "epoch": 0.21, "learning_rate": 9.211446800048777e-06, "loss": 0.7336, "step": 8873 }, { "epoch": 0.21, "learning_rate": 9.211244349558745e-06, "loss": 0.9713, "step": 8874 }, { "epoch": 0.21, "learning_rate": 9.21104187530916e-06, "loss": 0.9653, "step": 8875 }, { "epoch": 0.21, "learning_rate": 9.210839377301162e-06, "loss": 0.9369, "step": 8876 }, { "epoch": 0.21, "learning_rate": 9.210636855535896e-06, "loss": 1.0551, "step": 8877 }, { "epoch": 0.21, "learning_rate": 9.210434310014501e-06, "loss": 1.0174, "step": 8878 }, { "epoch": 0.21, "learning_rate": 9.210231740738122e-06, "loss": 1.0578, "step": 8879 }, { "epoch": 0.21, "learning_rate": 9.210029147707903e-06, "loss": 0.9764, "step": 8880 }, { "epoch": 0.21, "learning_rate": 9.209826530924989e-06, "loss": 0.702, "step": 8881 }, { "epoch": 0.21, "learning_rate": 9.209623890390516e-06, "loss": 1.1814, "step": 8882 }, { "epoch": 0.21, "learning_rate": 9.209421226105633e-06, "loss": 0.9961, "step": 8883 }, { "epoch": 0.21, "learning_rate": 9.20921853807148e-06, "loss": 1.3079, "step": 8884 }, { "epoch": 0.21, "learning_rate": 9.209015826289204e-06, "loss": 1.0825, "step": 8885 }, { "epoch": 0.21, "learning_rate": 9.208813090759946e-06, "loss": 0.7936, "step": 8886 }, { "epoch": 0.21, "learning_rate": 9.208610331484852e-06, "loss": 1.0026, "step": 8887 }, { "epoch": 0.21, "learning_rate": 9.208407548465064e-06, "loss": 0.8217, "step": 8888 }, { "epoch": 0.21, "learning_rate": 9.208204741701727e-06, "loss": 1.1381, "step": 8889 }, { "epoch": 0.21, "learning_rate": 9.208001911195984e-06, "loss": 1.2213, "step": 8890 }, { "epoch": 0.21, "learning_rate": 9.207799056948982e-06, "loss": 0.8421, "step": 8891 }, { "epoch": 0.21, "learning_rate": 9.207596178961864e-06, "loss": 1.2361, "step": 8892 }, { "epoch": 0.21, "learning_rate": 9.207393277235774e-06, "loss": 0.9947, "step": 8893 }, { "epoch": 0.21, "learning_rate": 9.207190351771858e-06, "loss": 1.0826, "step": 8894 }, { "epoch": 0.21, "learning_rate": 9.20698740257126e-06, "loss": 0.7871, "step": 8895 }, { "epoch": 0.21, "learning_rate": 9.206784429635124e-06, "loss": 1.0388, "step": 8896 }, { "epoch": 0.21, "learning_rate": 9.206581432964597e-06, "loss": 1.5848, "step": 8897 }, { "epoch": 0.21, "learning_rate": 9.206378412560823e-06, "loss": 0.7941, "step": 8898 }, { "epoch": 0.21, "learning_rate": 9.20617536842495e-06, "loss": 0.9632, "step": 8899 }, { "epoch": 0.21, "learning_rate": 9.205972300558121e-06, "loss": 1.3138, "step": 8900 }, { "epoch": 0.21, "learning_rate": 9.20576920896148e-06, "loss": 1.0169, "step": 8901 }, { "epoch": 0.21, "learning_rate": 9.20556609363618e-06, "loss": 0.8878, "step": 8902 }, { "epoch": 0.21, "learning_rate": 9.20536295458336e-06, "loss": 0.9241, "step": 8903 }, { "epoch": 0.21, "learning_rate": 9.205159791804165e-06, "loss": 0.7645, "step": 8904 }, { "epoch": 0.21, "learning_rate": 9.204956605299748e-06, "loss": 0.9002, "step": 8905 }, { "epoch": 0.21, "learning_rate": 9.20475339507125e-06, "loss": 0.8722, "step": 8906 }, { "epoch": 0.21, "learning_rate": 9.204550161119824e-06, "loss": 0.9862, "step": 8907 }, { "epoch": 0.21, "learning_rate": 9.204346903446605e-06, "loss": 0.9588, "step": 8908 }, { "epoch": 0.21, "learning_rate": 9.204143622052753e-06, "loss": 1.099, "step": 8909 }, { "epoch": 0.21, "learning_rate": 9.203940316939405e-06, "loss": 1.0039, "step": 8910 }, { "epoch": 0.21, "learning_rate": 9.203736988107713e-06, "loss": 0.9765, "step": 8911 }, { "epoch": 0.21, "learning_rate": 9.203533635558822e-06, "loss": 0.9195, "step": 8912 }, { "epoch": 0.21, "learning_rate": 9.203330259293879e-06, "loss": 0.9194, "step": 8913 }, { "epoch": 0.21, "learning_rate": 9.203126859314035e-06, "loss": 1.1099, "step": 8914 }, { "epoch": 0.21, "learning_rate": 9.202923435620435e-06, "loss": 1.1943, "step": 8915 }, { "epoch": 0.21, "learning_rate": 9.202719988214227e-06, "loss": 0.9866, "step": 8916 }, { "epoch": 0.21, "learning_rate": 9.202516517096556e-06, "loss": 0.9715, "step": 8917 }, { "epoch": 0.21, "learning_rate": 9.202313022268575e-06, "loss": 0.9851, "step": 8918 }, { "epoch": 0.21, "learning_rate": 9.20210950373143e-06, "loss": 0.8424, "step": 8919 }, { "epoch": 0.21, "learning_rate": 9.201905961486266e-06, "loss": 1.1197, "step": 8920 }, { "epoch": 0.21, "learning_rate": 9.201702395534238e-06, "loss": 1.0521, "step": 8921 }, { "epoch": 0.21, "learning_rate": 9.20149880587649e-06, "loss": 0.8478, "step": 8922 }, { "epoch": 0.21, "learning_rate": 9.20129519251417e-06, "loss": 1.143, "step": 8923 }, { "epoch": 0.21, "learning_rate": 9.20109155544843e-06, "loss": 0.9708, "step": 8924 }, { "epoch": 0.21, "learning_rate": 9.200887894680415e-06, "loss": 1.1477, "step": 8925 }, { "epoch": 0.21, "learning_rate": 9.20068421021128e-06, "loss": 1.0818, "step": 8926 }, { "epoch": 0.21, "learning_rate": 9.200480502042165e-06, "loss": 1.1724, "step": 8927 }, { "epoch": 0.21, "learning_rate": 9.20027677017423e-06, "loss": 1.1287, "step": 8928 }, { "epoch": 0.21, "learning_rate": 9.200073014608618e-06, "loss": 0.8353, "step": 8929 }, { "epoch": 0.21, "learning_rate": 9.199869235346476e-06, "loss": 0.8992, "step": 8930 }, { "epoch": 0.21, "learning_rate": 9.199665432388963e-06, "loss": 0.9579, "step": 8931 }, { "epoch": 0.21, "learning_rate": 9.199461605737219e-06, "loss": 1.1548, "step": 8932 }, { "epoch": 0.21, "learning_rate": 9.1992577553924e-06, "loss": 1.2351, "step": 8933 }, { "epoch": 0.21, "learning_rate": 9.199053881355654e-06, "loss": 0.8133, "step": 8934 }, { "epoch": 0.21, "learning_rate": 9.198849983628131e-06, "loss": 0.9526, "step": 8935 }, { "epoch": 0.21, "learning_rate": 9.198646062210985e-06, "loss": 1.1237, "step": 8936 }, { "epoch": 0.21, "learning_rate": 9.198442117105359e-06, "loss": 1.1284, "step": 8937 }, { "epoch": 0.21, "learning_rate": 9.198238148312411e-06, "loss": 0.7976, "step": 8938 }, { "epoch": 0.21, "learning_rate": 9.198034155833288e-06, "loss": 1.2567, "step": 8939 }, { "epoch": 0.21, "learning_rate": 9.197830139669144e-06, "loss": 1.0737, "step": 8940 }, { "epoch": 0.21, "learning_rate": 9.197626099821126e-06, "loss": 1.0758, "step": 8941 }, { "epoch": 0.21, "learning_rate": 9.197422036290386e-06, "loss": 1.0415, "step": 8942 }, { "epoch": 0.21, "learning_rate": 9.197217949078078e-06, "loss": 1.2695, "step": 8943 }, { "epoch": 0.21, "learning_rate": 9.197013838185352e-06, "loss": 0.9699, "step": 8944 }, { "epoch": 0.21, "learning_rate": 9.196809703613358e-06, "loss": 1.1982, "step": 8945 }, { "epoch": 0.21, "learning_rate": 9.19660554536325e-06, "loss": 1.1142, "step": 8946 }, { "epoch": 0.21, "learning_rate": 9.196401363436181e-06, "loss": 0.9482, "step": 8947 }, { "epoch": 0.21, "learning_rate": 9.196197157833297e-06, "loss": 1.0269, "step": 8948 }, { "epoch": 0.21, "learning_rate": 9.195992928555756e-06, "loss": 1.1995, "step": 8949 }, { "epoch": 0.21, "learning_rate": 9.195788675604708e-06, "loss": 0.8452, "step": 8950 }, { "epoch": 0.21, "learning_rate": 9.195584398981307e-06, "loss": 0.7947, "step": 8951 }, { "epoch": 0.21, "learning_rate": 9.195380098686703e-06, "loss": 1.0224, "step": 8952 }, { "epoch": 0.21, "learning_rate": 9.195175774722049e-06, "loss": 1.0325, "step": 8953 }, { "epoch": 0.21, "learning_rate": 9.194971427088501e-06, "loss": 0.8162, "step": 8954 }, { "epoch": 0.21, "learning_rate": 9.194767055787208e-06, "loss": 1.1268, "step": 8955 }, { "epoch": 0.21, "learning_rate": 9.194562660819324e-06, "loss": 1.1275, "step": 8956 }, { "epoch": 0.21, "learning_rate": 9.194358242186003e-06, "loss": 1.0742, "step": 8957 }, { "epoch": 0.21, "learning_rate": 9.194153799888398e-06, "loss": 1.1194, "step": 8958 }, { "epoch": 0.21, "learning_rate": 9.193949333927665e-06, "loss": 1.1178, "step": 8959 }, { "epoch": 0.21, "learning_rate": 9.193744844304952e-06, "loss": 0.917, "step": 8960 }, { "epoch": 0.21, "learning_rate": 9.193540331021418e-06, "loss": 0.9454, "step": 8961 }, { "epoch": 0.21, "learning_rate": 9.193335794078214e-06, "loss": 1.0112, "step": 8962 }, { "epoch": 0.21, "learning_rate": 9.193131233476495e-06, "loss": 0.914, "step": 8963 }, { "epoch": 0.21, "learning_rate": 9.192926649217414e-06, "loss": 1.0259, "step": 8964 }, { "epoch": 0.21, "learning_rate": 9.192722041302127e-06, "loss": 1.0816, "step": 8965 }, { "epoch": 0.21, "learning_rate": 9.192517409731787e-06, "loss": 1.1215, "step": 8966 }, { "epoch": 0.21, "learning_rate": 9.192312754507548e-06, "loss": 0.7409, "step": 8967 }, { "epoch": 0.21, "learning_rate": 9.192108075630565e-06, "loss": 0.969, "step": 8968 }, { "epoch": 0.21, "learning_rate": 9.191903373101995e-06, "loss": 0.9803, "step": 8969 }, { "epoch": 0.21, "learning_rate": 9.191698646922992e-06, "loss": 0.9914, "step": 8970 }, { "epoch": 0.21, "learning_rate": 9.19149389709471e-06, "loss": 0.8997, "step": 8971 }, { "epoch": 0.21, "learning_rate": 9.191289123618304e-06, "loss": 0.8755, "step": 8972 }, { "epoch": 0.21, "learning_rate": 9.19108432649493e-06, "loss": 0.9483, "step": 8973 }, { "epoch": 0.21, "learning_rate": 9.190879505725742e-06, "loss": 0.8416, "step": 8974 }, { "epoch": 0.21, "learning_rate": 9.190674661311899e-06, "loss": 0.969, "step": 8975 }, { "epoch": 0.21, "learning_rate": 9.190469793254554e-06, "loss": 1.0314, "step": 8976 }, { "epoch": 0.21, "learning_rate": 9.190264901554863e-06, "loss": 1.1432, "step": 8977 }, { "epoch": 0.21, "learning_rate": 9.190059986213982e-06, "loss": 1.0788, "step": 8978 }, { "epoch": 0.21, "learning_rate": 9.189855047233068e-06, "loss": 1.1056, "step": 8979 }, { "epoch": 0.21, "learning_rate": 9.189650084613278e-06, "loss": 1.1405, "step": 8980 }, { "epoch": 0.21, "learning_rate": 9.189445098355765e-06, "loss": 0.8744, "step": 8981 }, { "epoch": 0.21, "learning_rate": 9.18924008846169e-06, "loss": 0.9296, "step": 8982 }, { "epoch": 0.21, "learning_rate": 9.189035054932205e-06, "loss": 0.9511, "step": 8983 }, { "epoch": 0.21, "learning_rate": 9.188829997768471e-06, "loss": 0.7349, "step": 8984 }, { "epoch": 0.21, "learning_rate": 9.188624916971642e-06, "loss": 1.0181, "step": 8985 }, { "epoch": 0.21, "learning_rate": 9.188419812542877e-06, "loss": 0.9886, "step": 8986 }, { "epoch": 0.21, "learning_rate": 9.188214684483331e-06, "loss": 0.8766, "step": 8987 }, { "epoch": 0.21, "learning_rate": 9.188009532794165e-06, "loss": 0.8784, "step": 8988 }, { "epoch": 0.21, "learning_rate": 9.187804357476531e-06, "loss": 1.146, "step": 8989 }, { "epoch": 0.21, "learning_rate": 9.187599158531593e-06, "loss": 1.0059, "step": 8990 }, { "epoch": 0.21, "learning_rate": 9.187393935960502e-06, "loss": 0.8499, "step": 8991 }, { "epoch": 0.21, "learning_rate": 9.18718868976442e-06, "loss": 0.9821, "step": 8992 }, { "epoch": 0.21, "learning_rate": 9.186983419944506e-06, "loss": 1.1603, "step": 8993 }, { "epoch": 0.21, "learning_rate": 9.186778126501916e-06, "loss": 1.0468, "step": 8994 }, { "epoch": 0.21, "learning_rate": 9.186572809437808e-06, "loss": 1.0122, "step": 8995 }, { "epoch": 0.21, "learning_rate": 9.186367468753341e-06, "loss": 1.1107, "step": 8996 }, { "epoch": 0.21, "learning_rate": 9.186162104449674e-06, "loss": 1.3481, "step": 8997 }, { "epoch": 0.21, "learning_rate": 9.185956716527965e-06, "loss": 1.0424, "step": 8998 }, { "epoch": 0.21, "learning_rate": 9.185751304989372e-06, "loss": 0.9029, "step": 8999 }, { "epoch": 0.21, "learning_rate": 9.185545869835056e-06, "loss": 1.2179, "step": 9000 }, { "epoch": 0.21, "learning_rate": 9.185340411066175e-06, "loss": 1.0201, "step": 9001 }, { "epoch": 0.21, "learning_rate": 9.185134928683887e-06, "loss": 0.8106, "step": 9002 }, { "epoch": 0.21, "learning_rate": 9.184929422689353e-06, "loss": 1.0613, "step": 9003 }, { "epoch": 0.21, "learning_rate": 9.184723893083733e-06, "loss": 0.8276, "step": 9004 }, { "epoch": 0.21, "learning_rate": 9.184518339868183e-06, "loss": 1.1318, "step": 9005 }, { "epoch": 0.21, "learning_rate": 9.184312763043866e-06, "loss": 1.0124, "step": 9006 }, { "epoch": 0.21, "learning_rate": 9.184107162611942e-06, "loss": 1.058, "step": 9007 }, { "epoch": 0.21, "learning_rate": 9.18390153857357e-06, "loss": 1.0562, "step": 9008 }, { "epoch": 0.21, "learning_rate": 9.18369589092991e-06, "loss": 1.1256, "step": 9009 }, { "epoch": 0.21, "learning_rate": 9.18349021968212e-06, "loss": 1.2122, "step": 9010 }, { "epoch": 0.21, "learning_rate": 9.183284524831367e-06, "loss": 1.1077, "step": 9011 }, { "epoch": 0.21, "learning_rate": 9.183078806378803e-06, "loss": 0.7673, "step": 9012 }, { "epoch": 0.21, "learning_rate": 9.182873064325596e-06, "loss": 0.8753, "step": 9013 }, { "epoch": 0.21, "learning_rate": 9.182667298672902e-06, "loss": 1.1128, "step": 9014 }, { "epoch": 0.21, "learning_rate": 9.182461509421883e-06, "loss": 0.8765, "step": 9015 }, { "epoch": 0.21, "learning_rate": 9.182255696573703e-06, "loss": 1.0232, "step": 9016 }, { "epoch": 0.21, "learning_rate": 9.182049860129518e-06, "loss": 0.8933, "step": 9017 }, { "epoch": 0.21, "learning_rate": 9.181844000090495e-06, "loss": 0.9052, "step": 9018 }, { "epoch": 0.21, "learning_rate": 9.181638116457792e-06, "loss": 1.0648, "step": 9019 }, { "epoch": 0.21, "learning_rate": 9.18143220923257e-06, "loss": 0.8131, "step": 9020 }, { "epoch": 0.21, "learning_rate": 9.181226278415992e-06, "loss": 0.9747, "step": 9021 }, { "epoch": 0.21, "learning_rate": 9.18102032400922e-06, "loss": 1.0242, "step": 9022 }, { "epoch": 0.21, "learning_rate": 9.180814346013417e-06, "loss": 0.7888, "step": 9023 }, { "epoch": 0.21, "learning_rate": 9.180608344429741e-06, "loss": 1.1523, "step": 9024 }, { "epoch": 0.21, "learning_rate": 9.180402319259359e-06, "loss": 0.9874, "step": 9025 }, { "epoch": 0.21, "learning_rate": 9.180196270503432e-06, "loss": 1.1917, "step": 9026 }, { "epoch": 0.21, "learning_rate": 9.17999019816312e-06, "loss": 0.9242, "step": 9027 }, { "epoch": 0.21, "learning_rate": 9.17978410223959e-06, "loss": 0.6418, "step": 9028 }, { "epoch": 0.21, "learning_rate": 9.179577982734e-06, "loss": 0.9538, "step": 9029 }, { "epoch": 0.21, "learning_rate": 9.179371839647517e-06, "loss": 1.0375, "step": 9030 }, { "epoch": 0.21, "learning_rate": 9.179165672981301e-06, "loss": 1.0819, "step": 9031 }, { "epoch": 0.21, "learning_rate": 9.178959482736519e-06, "loss": 1.0513, "step": 9032 }, { "epoch": 0.21, "learning_rate": 9.17875326891433e-06, "loss": 1.0585, "step": 9033 }, { "epoch": 0.21, "learning_rate": 9.1785470315159e-06, "loss": 1.228, "step": 9034 }, { "epoch": 0.21, "learning_rate": 9.178340770542392e-06, "loss": 1.0872, "step": 9035 }, { "epoch": 0.21, "learning_rate": 9.178134485994968e-06, "loss": 1.1577, "step": 9036 }, { "epoch": 0.21, "learning_rate": 9.177928177874795e-06, "loss": 1.1062, "step": 9037 }, { "epoch": 0.21, "learning_rate": 9.177721846183034e-06, "loss": 1.0946, "step": 9038 }, { "epoch": 0.21, "learning_rate": 9.177515490920853e-06, "loss": 1.0572, "step": 9039 }, { "epoch": 0.21, "learning_rate": 9.177309112089412e-06, "loss": 0.8249, "step": 9040 }, { "epoch": 0.21, "learning_rate": 9.177102709689876e-06, "loss": 0.9344, "step": 9041 }, { "epoch": 0.21, "learning_rate": 9.176896283723414e-06, "loss": 0.8974, "step": 9042 }, { "epoch": 0.21, "learning_rate": 9.176689834191184e-06, "loss": 0.9349, "step": 9043 }, { "epoch": 0.21, "learning_rate": 9.176483361094355e-06, "loss": 1.2562, "step": 9044 }, { "epoch": 0.21, "learning_rate": 9.176276864434092e-06, "loss": 0.9417, "step": 9045 }, { "epoch": 0.21, "learning_rate": 9.176070344211558e-06, "loss": 1.2389, "step": 9046 }, { "epoch": 0.21, "learning_rate": 9.175863800427919e-06, "loss": 1.028, "step": 9047 }, { "epoch": 0.21, "learning_rate": 9.175657233084341e-06, "loss": 1.1366, "step": 9048 }, { "epoch": 0.21, "learning_rate": 9.175450642181988e-06, "loss": 0.8789, "step": 9049 }, { "epoch": 0.21, "learning_rate": 9.175244027722028e-06, "loss": 1.0977, "step": 9050 }, { "epoch": 0.21, "learning_rate": 9.175037389705624e-06, "loss": 1.0273, "step": 9051 }, { "epoch": 0.21, "learning_rate": 9.174830728133942e-06, "loss": 1.0357, "step": 9052 }, { "epoch": 0.21, "learning_rate": 9.174624043008153e-06, "loss": 1.1851, "step": 9053 }, { "epoch": 0.21, "learning_rate": 9.174417334329416e-06, "loss": 1.065, "step": 9054 }, { "epoch": 0.21, "learning_rate": 9.174210602098902e-06, "loss": 1.0319, "step": 9055 }, { "epoch": 0.21, "learning_rate": 9.174003846317774e-06, "loss": 0.9807, "step": 9056 }, { "epoch": 0.21, "learning_rate": 9.173797066987201e-06, "loss": 1.1394, "step": 9057 }, { "epoch": 0.21, "learning_rate": 9.173590264108348e-06, "loss": 0.8625, "step": 9058 }, { "epoch": 0.21, "learning_rate": 9.173383437682384e-06, "loss": 0.9863, "step": 9059 }, { "epoch": 0.21, "learning_rate": 9.173176587710475e-06, "loss": 1.1782, "step": 9060 }, { "epoch": 0.21, "learning_rate": 9.172969714193785e-06, "loss": 0.7631, "step": 9061 }, { "epoch": 0.21, "learning_rate": 9.172762817133486e-06, "loss": 0.9414, "step": 9062 }, { "epoch": 0.21, "learning_rate": 9.172555896530742e-06, "loss": 1.1519, "step": 9063 }, { "epoch": 0.21, "learning_rate": 9.172348952386722e-06, "loss": 1.4884, "step": 9064 }, { "epoch": 0.21, "learning_rate": 9.172141984702591e-06, "loss": 0.8662, "step": 9065 }, { "epoch": 0.21, "learning_rate": 9.17193499347952e-06, "loss": 0.807, "step": 9066 }, { "epoch": 0.21, "learning_rate": 9.171727978718677e-06, "loss": 1.1039, "step": 9067 }, { "epoch": 0.21, "learning_rate": 9.171520940421228e-06, "loss": 1.0823, "step": 9068 }, { "epoch": 0.21, "learning_rate": 9.171313878588342e-06, "loss": 1.0287, "step": 9069 }, { "epoch": 0.21, "learning_rate": 9.171106793221185e-06, "loss": 0.8853, "step": 9070 }, { "epoch": 0.21, "learning_rate": 9.170899684320928e-06, "loss": 0.8875, "step": 9071 }, { "epoch": 0.21, "learning_rate": 9.17069255188874e-06, "loss": 1.2038, "step": 9072 }, { "epoch": 0.21, "learning_rate": 9.170485395925785e-06, "loss": 1.0229, "step": 9073 }, { "epoch": 0.21, "learning_rate": 9.170278216433238e-06, "loss": 1.029, "step": 9074 }, { "epoch": 0.21, "learning_rate": 9.170071013412263e-06, "loss": 1.1305, "step": 9075 }, { "epoch": 0.21, "learning_rate": 9.169863786864034e-06, "loss": 1.1258, "step": 9076 }, { "epoch": 0.21, "learning_rate": 9.169656536789715e-06, "loss": 1.0457, "step": 9077 }, { "epoch": 0.21, "learning_rate": 9.169449263190477e-06, "loss": 1.1389, "step": 9078 }, { "epoch": 0.21, "learning_rate": 9.169241966067491e-06, "loss": 0.9861, "step": 9079 }, { "epoch": 0.21, "learning_rate": 9.169034645421924e-06, "loss": 0.9386, "step": 9080 }, { "epoch": 0.21, "learning_rate": 9.168827301254948e-06, "loss": 0.8946, "step": 9081 }, { "epoch": 0.21, "learning_rate": 9.168619933567733e-06, "loss": 0.913, "step": 9082 }, { "epoch": 0.21, "learning_rate": 9.168412542361447e-06, "loss": 1.1002, "step": 9083 }, { "epoch": 0.21, "learning_rate": 9.16820512763726e-06, "loss": 0.6726, "step": 9084 }, { "epoch": 0.21, "learning_rate": 9.167997689396344e-06, "loss": 0.9327, "step": 9085 }, { "epoch": 0.21, "learning_rate": 9.167790227639869e-06, "loss": 1.3334, "step": 9086 }, { "epoch": 0.21, "learning_rate": 9.167582742369005e-06, "loss": 1.0665, "step": 9087 }, { "epoch": 0.21, "learning_rate": 9.167375233584922e-06, "loss": 1.1264, "step": 9088 }, { "epoch": 0.21, "learning_rate": 9.167167701288791e-06, "loss": 1.0519, "step": 9089 }, { "epoch": 0.21, "learning_rate": 9.166960145481784e-06, "loss": 0.9782, "step": 9090 }, { "epoch": 0.21, "learning_rate": 9.16675256616507e-06, "loss": 0.4997, "step": 9091 }, { "epoch": 0.21, "learning_rate": 9.166544963339825e-06, "loss": 1.1692, "step": 9092 }, { "epoch": 0.21, "learning_rate": 9.166337337007213e-06, "loss": 0.7461, "step": 9093 }, { "epoch": 0.21, "learning_rate": 9.166129687168412e-06, "loss": 0.6608, "step": 9094 }, { "epoch": 0.21, "learning_rate": 9.165922013824589e-06, "loss": 1.0187, "step": 9095 }, { "epoch": 0.21, "learning_rate": 9.165714316976916e-06, "loss": 0.7988, "step": 9096 }, { "epoch": 0.21, "learning_rate": 9.16550659662657e-06, "loss": 0.7934, "step": 9097 }, { "epoch": 0.21, "learning_rate": 9.165298852774716e-06, "loss": 1.1005, "step": 9098 }, { "epoch": 0.21, "learning_rate": 9.16509108542253e-06, "loss": 0.9819, "step": 9099 }, { "epoch": 0.21, "learning_rate": 9.164883294571182e-06, "loss": 1.1731, "step": 9100 }, { "epoch": 0.21, "learning_rate": 9.16467548022185e-06, "loss": 1.1801, "step": 9101 }, { "epoch": 0.21, "learning_rate": 9.1644676423757e-06, "loss": 1.3033, "step": 9102 }, { "epoch": 0.21, "learning_rate": 9.164259781033904e-06, "loss": 0.9994, "step": 9103 }, { "epoch": 0.21, "learning_rate": 9.164051896197642e-06, "loss": 1.3402, "step": 9104 }, { "epoch": 0.21, "learning_rate": 9.16384398786808e-06, "loss": 0.8614, "step": 9105 }, { "epoch": 0.21, "learning_rate": 9.163636056046393e-06, "loss": 1.1135, "step": 9106 }, { "epoch": 0.21, "learning_rate": 9.163428100733755e-06, "loss": 0.8069, "step": 9107 }, { "epoch": 0.21, "learning_rate": 9.16322012193134e-06, "loss": 1.0396, "step": 9108 }, { "epoch": 0.21, "learning_rate": 9.163012119640319e-06, "loss": 0.8323, "step": 9109 }, { "epoch": 0.21, "learning_rate": 9.162804093861868e-06, "loss": 1.0093, "step": 9110 }, { "epoch": 0.21, "learning_rate": 9.162596044597159e-06, "loss": 1.2095, "step": 9111 }, { "epoch": 0.21, "learning_rate": 9.162387971847364e-06, "loss": 0.8777, "step": 9112 }, { "epoch": 0.21, "learning_rate": 9.162179875613661e-06, "loss": 0.8965, "step": 9113 }, { "epoch": 0.21, "learning_rate": 9.161971755897224e-06, "loss": 0.8799, "step": 9114 }, { "epoch": 0.21, "learning_rate": 9.161763612699224e-06, "loss": 0.9565, "step": 9115 }, { "epoch": 0.21, "learning_rate": 9.161555446020835e-06, "loss": 0.9064, "step": 9116 }, { "epoch": 0.21, "learning_rate": 9.161347255863236e-06, "loss": 1.0245, "step": 9117 }, { "epoch": 0.21, "learning_rate": 9.161139042227599e-06, "loss": 0.9118, "step": 9118 }, { "epoch": 0.21, "learning_rate": 9.160930805115095e-06, "loss": 1.0241, "step": 9119 }, { "epoch": 0.21, "learning_rate": 9.160722544526906e-06, "loss": 0.8584, "step": 9120 }, { "epoch": 0.21, "learning_rate": 9.160514260464201e-06, "loss": 0.9019, "step": 9121 }, { "epoch": 0.21, "learning_rate": 9.160305952928159e-06, "loss": 0.9025, "step": 9122 }, { "epoch": 0.21, "learning_rate": 9.160097621919953e-06, "loss": 0.9699, "step": 9123 }, { "epoch": 0.21, "learning_rate": 9.15988926744076e-06, "loss": 0.7148, "step": 9124 }, { "epoch": 0.21, "learning_rate": 9.159680889491756e-06, "loss": 1.0743, "step": 9125 }, { "epoch": 0.21, "learning_rate": 9.159472488074112e-06, "loss": 1.0419, "step": 9126 }, { "epoch": 0.21, "learning_rate": 9.159264063189009e-06, "loss": 1.0885, "step": 9127 }, { "epoch": 0.21, "learning_rate": 9.15905561483762e-06, "loss": 0.9227, "step": 9128 }, { "epoch": 0.21, "learning_rate": 9.158847143021123e-06, "loss": 1.0365, "step": 9129 }, { "epoch": 0.21, "learning_rate": 9.158638647740694e-06, "loss": 1.1664, "step": 9130 }, { "epoch": 0.21, "learning_rate": 9.158430128997508e-06, "loss": 1.1265, "step": 9131 }, { "epoch": 0.21, "learning_rate": 9.158221586792742e-06, "loss": 1.0951, "step": 9132 }, { "epoch": 0.21, "learning_rate": 9.158013021127575e-06, "loss": 1.0925, "step": 9133 }, { "epoch": 0.21, "learning_rate": 9.157804432003178e-06, "loss": 0.8382, "step": 9134 }, { "epoch": 0.21, "learning_rate": 9.157595819420732e-06, "loss": 1.1725, "step": 9135 }, { "epoch": 0.21, "learning_rate": 9.157387183381414e-06, "loss": 1.2906, "step": 9136 }, { "epoch": 0.21, "learning_rate": 9.157178523886399e-06, "loss": 1.0674, "step": 9137 }, { "epoch": 0.21, "learning_rate": 9.156969840936867e-06, "loss": 1.2405, "step": 9138 }, { "epoch": 0.21, "learning_rate": 9.156761134533992e-06, "loss": 1.0161, "step": 9139 }, { "epoch": 0.21, "learning_rate": 9.156552404678956e-06, "loss": 0.9052, "step": 9140 }, { "epoch": 0.21, "learning_rate": 9.156343651372932e-06, "loss": 0.7656, "step": 9141 }, { "epoch": 0.21, "learning_rate": 9.1561348746171e-06, "loss": 1.1365, "step": 9142 }, { "epoch": 0.21, "learning_rate": 9.155926074412638e-06, "loss": 0.9148, "step": 9143 }, { "epoch": 0.21, "learning_rate": 9.155717250760725e-06, "loss": 0.8179, "step": 9144 }, { "epoch": 0.21, "learning_rate": 9.155508403662536e-06, "loss": 1.0951, "step": 9145 }, { "epoch": 0.21, "learning_rate": 9.155299533119253e-06, "loss": 0.8419, "step": 9146 }, { "epoch": 0.21, "learning_rate": 9.155090639132052e-06, "loss": 0.7049, "step": 9147 }, { "epoch": 0.21, "learning_rate": 9.154881721702113e-06, "loss": 0.8649, "step": 9148 }, { "epoch": 0.21, "learning_rate": 9.154672780830613e-06, "loss": 1.0679, "step": 9149 }, { "epoch": 0.21, "learning_rate": 9.15446381651873e-06, "loss": 1.0058, "step": 9150 }, { "epoch": 0.21, "learning_rate": 9.154254828767648e-06, "loss": 1.0062, "step": 9151 }, { "epoch": 0.21, "learning_rate": 9.154045817578541e-06, "loss": 0.9712, "step": 9152 }, { "epoch": 0.21, "learning_rate": 9.153836782952591e-06, "loss": 1.1558, "step": 9153 }, { "epoch": 0.21, "learning_rate": 9.153627724890976e-06, "loss": 0.9693, "step": 9154 }, { "epoch": 0.21, "learning_rate": 9.153418643394875e-06, "loss": 0.9596, "step": 9155 }, { "epoch": 0.21, "learning_rate": 9.15320953846547e-06, "loss": 0.9405, "step": 9156 }, { "epoch": 0.21, "learning_rate": 9.153000410103938e-06, "loss": 1.0363, "step": 9157 }, { "epoch": 0.21, "learning_rate": 9.152791258311463e-06, "loss": 1.0424, "step": 9158 }, { "epoch": 0.21, "learning_rate": 9.15258208308922e-06, "loss": 1.13, "step": 9159 }, { "epoch": 0.21, "learning_rate": 9.15237288443839e-06, "loss": 1.0243, "step": 9160 }, { "epoch": 0.21, "learning_rate": 9.152163662360157e-06, "loss": 1.3677, "step": 9161 }, { "epoch": 0.21, "learning_rate": 9.151954416855697e-06, "loss": 1.1424, "step": 9162 }, { "epoch": 0.21, "learning_rate": 9.151745147926194e-06, "loss": 1.0416, "step": 9163 }, { "epoch": 0.21, "learning_rate": 9.151535855572826e-06, "loss": 0.8621, "step": 9164 }, { "epoch": 0.21, "learning_rate": 9.151326539796777e-06, "loss": 0.9597, "step": 9165 }, { "epoch": 0.21, "learning_rate": 9.151117200599224e-06, "loss": 1.0331, "step": 9166 }, { "epoch": 0.21, "learning_rate": 9.150907837981351e-06, "loss": 1.0118, "step": 9167 }, { "epoch": 0.21, "learning_rate": 9.150698451944339e-06, "loss": 1.1123, "step": 9168 }, { "epoch": 0.21, "learning_rate": 9.150489042489368e-06, "loss": 0.9101, "step": 9169 }, { "epoch": 0.21, "learning_rate": 9.15027960961762e-06, "loss": 1.0249, "step": 9170 }, { "epoch": 0.21, "learning_rate": 9.150070153330277e-06, "loss": 1.2266, "step": 9171 }, { "epoch": 0.21, "learning_rate": 9.14986067362852e-06, "loss": 0.99, "step": 9172 }, { "epoch": 0.21, "learning_rate": 9.149651170513534e-06, "loss": 1.345, "step": 9173 }, { "epoch": 0.21, "learning_rate": 9.149441643986495e-06, "loss": 0.6364, "step": 9174 }, { "epoch": 0.21, "learning_rate": 9.14923209404859e-06, "loss": 0.8865, "step": 9175 }, { "epoch": 0.21, "learning_rate": 9.149022520700999e-06, "loss": 1.0569, "step": 9176 }, { "epoch": 0.21, "learning_rate": 9.148812923944905e-06, "loss": 1.1862, "step": 9177 }, { "epoch": 0.21, "learning_rate": 9.148603303781493e-06, "loss": 1.2473, "step": 9178 }, { "epoch": 0.21, "learning_rate": 9.148393660211941e-06, "loss": 1.0511, "step": 9179 }, { "epoch": 0.21, "learning_rate": 9.148183993237436e-06, "loss": 1.0091, "step": 9180 }, { "epoch": 0.21, "learning_rate": 9.147974302859158e-06, "loss": 0.8396, "step": 9181 }, { "epoch": 0.21, "learning_rate": 9.14776458907829e-06, "loss": 1.0105, "step": 9182 }, { "epoch": 0.21, "learning_rate": 9.147554851896017e-06, "loss": 1.0366, "step": 9183 }, { "epoch": 0.21, "learning_rate": 9.147345091313522e-06, "loss": 1.088, "step": 9184 }, { "epoch": 0.21, "learning_rate": 9.147135307331988e-06, "loss": 0.7981, "step": 9185 }, { "epoch": 0.21, "learning_rate": 9.146925499952599e-06, "loss": 0.9902, "step": 9186 }, { "epoch": 0.21, "learning_rate": 9.146715669176538e-06, "loss": 1.1698, "step": 9187 }, { "epoch": 0.21, "learning_rate": 9.146505815004988e-06, "loss": 0.9495, "step": 9188 }, { "epoch": 0.21, "learning_rate": 9.146295937439137e-06, "loss": 1.0573, "step": 9189 }, { "epoch": 0.21, "learning_rate": 9.146086036480164e-06, "loss": 1.0217, "step": 9190 }, { "epoch": 0.21, "learning_rate": 9.145876112129257e-06, "loss": 0.9871, "step": 9191 }, { "epoch": 0.21, "learning_rate": 9.145666164387599e-06, "loss": 0.9156, "step": 9192 }, { "epoch": 0.21, "learning_rate": 9.145456193256375e-06, "loss": 1.0123, "step": 9193 }, { "epoch": 0.21, "learning_rate": 9.145246198736768e-06, "loss": 0.946, "step": 9194 }, { "epoch": 0.21, "learning_rate": 9.145036180829964e-06, "loss": 1.0252, "step": 9195 }, { "epoch": 0.21, "learning_rate": 9.144826139537147e-06, "loss": 0.926, "step": 9196 }, { "epoch": 0.21, "learning_rate": 9.144616074859504e-06, "loss": 1.1591, "step": 9197 }, { "epoch": 0.21, "learning_rate": 9.144405986798219e-06, "loss": 1.1763, "step": 9198 }, { "epoch": 0.21, "learning_rate": 9.144195875354477e-06, "loss": 1.0177, "step": 9199 }, { "epoch": 0.21, "learning_rate": 9.143985740529464e-06, "loss": 0.9261, "step": 9200 }, { "epoch": 0.21, "learning_rate": 9.143775582324366e-06, "loss": 1.2197, "step": 9201 }, { "epoch": 0.21, "learning_rate": 9.143565400740367e-06, "loss": 0.9037, "step": 9202 }, { "epoch": 0.21, "learning_rate": 9.143355195778653e-06, "loss": 1.1353, "step": 9203 }, { "epoch": 0.21, "learning_rate": 9.143144967440413e-06, "loss": 1.0108, "step": 9204 }, { "epoch": 0.21, "learning_rate": 9.14293471572683e-06, "loss": 0.9614, "step": 9205 }, { "epoch": 0.21, "learning_rate": 9.142724440639091e-06, "loss": 0.8612, "step": 9206 }, { "epoch": 0.21, "learning_rate": 9.142514142178383e-06, "loss": 0.9898, "step": 9207 }, { "epoch": 0.21, "learning_rate": 9.14230382034589e-06, "loss": 1.0072, "step": 9208 }, { "epoch": 0.21, "learning_rate": 9.1420934751428e-06, "loss": 0.8971, "step": 9209 }, { "epoch": 0.21, "learning_rate": 9.141883106570304e-06, "loss": 0.8672, "step": 9210 }, { "epoch": 0.21, "learning_rate": 9.141672714629584e-06, "loss": 1.0624, "step": 9211 }, { "epoch": 0.21, "learning_rate": 9.141462299321828e-06, "loss": 0.9487, "step": 9212 }, { "epoch": 0.21, "learning_rate": 9.141251860648224e-06, "loss": 1.0737, "step": 9213 }, { "epoch": 0.21, "learning_rate": 9.141041398609958e-06, "loss": 1.3635, "step": 9214 }, { "epoch": 0.21, "learning_rate": 9.140830913208217e-06, "loss": 1.0352, "step": 9215 }, { "epoch": 0.21, "learning_rate": 9.140620404444192e-06, "loss": 1.2062, "step": 9216 }, { "epoch": 0.21, "learning_rate": 9.140409872319067e-06, "loss": 1.1632, "step": 9217 }, { "epoch": 0.21, "learning_rate": 9.14019931683403e-06, "loss": 0.876, "step": 9218 }, { "epoch": 0.21, "learning_rate": 9.139988737990272e-06, "loss": 1.0371, "step": 9219 }, { "epoch": 0.21, "learning_rate": 9.139778135788978e-06, "loss": 0.9266, "step": 9220 }, { "epoch": 0.21, "learning_rate": 9.139567510231337e-06, "loss": 0.821, "step": 9221 }, { "epoch": 0.21, "learning_rate": 9.13935686131854e-06, "loss": 0.9877, "step": 9222 }, { "epoch": 0.21, "learning_rate": 9.139146189051772e-06, "loss": 0.926, "step": 9223 }, { "epoch": 0.21, "learning_rate": 9.138935493432222e-06, "loss": 1.0016, "step": 9224 }, { "epoch": 0.21, "learning_rate": 9.138724774461079e-06, "loss": 0.9179, "step": 9225 }, { "epoch": 0.21, "learning_rate": 9.138514032139534e-06, "loss": 0.9811, "step": 9226 }, { "epoch": 0.21, "learning_rate": 9.138303266468773e-06, "loss": 1.0799, "step": 9227 }, { "epoch": 0.21, "learning_rate": 9.138092477449987e-06, "loss": 1.4307, "step": 9228 }, { "epoch": 0.21, "learning_rate": 9.137881665084365e-06, "loss": 0.8412, "step": 9229 }, { "epoch": 0.21, "learning_rate": 9.137670829373095e-06, "loss": 0.7818, "step": 9230 }, { "epoch": 0.21, "learning_rate": 9.137459970317368e-06, "loss": 0.9355, "step": 9231 }, { "epoch": 0.21, "learning_rate": 9.137249087918375e-06, "loss": 0.8927, "step": 9232 }, { "epoch": 0.21, "learning_rate": 9.137038182177303e-06, "loss": 1.0184, "step": 9233 }, { "epoch": 0.21, "learning_rate": 9.136827253095341e-06, "loss": 0.8957, "step": 9234 }, { "epoch": 0.21, "learning_rate": 9.136616300673684e-06, "loss": 0.9089, "step": 9235 }, { "epoch": 0.21, "learning_rate": 9.136405324913517e-06, "loss": 0.9191, "step": 9236 }, { "epoch": 0.21, "learning_rate": 9.136194325816035e-06, "loss": 0.8884, "step": 9237 }, { "epoch": 0.21, "learning_rate": 9.135983303382423e-06, "loss": 1.1938, "step": 9238 }, { "epoch": 0.21, "learning_rate": 9.135772257613878e-06, "loss": 1.1784, "step": 9239 }, { "epoch": 0.21, "learning_rate": 9.135561188511583e-06, "loss": 1.021, "step": 9240 }, { "epoch": 0.21, "learning_rate": 9.135350096076735e-06, "loss": 0.885, "step": 9241 }, { "epoch": 0.21, "learning_rate": 9.135138980310524e-06, "loss": 1.0871, "step": 9242 }, { "epoch": 0.21, "learning_rate": 9.134927841214141e-06, "loss": 0.6939, "step": 9243 }, { "epoch": 0.21, "learning_rate": 9.134716678788773e-06, "loss": 1.2216, "step": 9244 }, { "epoch": 0.21, "learning_rate": 9.134505493035618e-06, "loss": 1.2621, "step": 9245 }, { "epoch": 0.21, "learning_rate": 9.134294283955863e-06, "loss": 1.149, "step": 9246 }, { "epoch": 0.21, "learning_rate": 9.1340830515507e-06, "loss": 1.0468, "step": 9247 }, { "epoch": 0.21, "learning_rate": 9.133871795821323e-06, "loss": 1.3379, "step": 9248 }, { "epoch": 0.21, "learning_rate": 9.13366051676892e-06, "loss": 0.9247, "step": 9249 }, { "epoch": 0.21, "learning_rate": 9.133449214394688e-06, "loss": 0.8953, "step": 9250 }, { "epoch": 0.21, "learning_rate": 9.133237888699816e-06, "loss": 1.0619, "step": 9251 }, { "epoch": 0.21, "learning_rate": 9.133026539685497e-06, "loss": 1.2378, "step": 9252 }, { "epoch": 0.21, "learning_rate": 9.132815167352924e-06, "loss": 0.8659, "step": 9253 }, { "epoch": 0.21, "learning_rate": 9.132603771703288e-06, "loss": 1.0307, "step": 9254 }, { "epoch": 0.21, "learning_rate": 9.132392352737783e-06, "loss": 0.7667, "step": 9255 }, { "epoch": 0.21, "learning_rate": 9.132180910457603e-06, "loss": 0.9923, "step": 9256 }, { "epoch": 0.21, "learning_rate": 9.131969444863937e-06, "loss": 0.876, "step": 9257 }, { "epoch": 0.21, "learning_rate": 9.131757955957981e-06, "loss": 1.0119, "step": 9258 }, { "epoch": 0.21, "learning_rate": 9.131546443740927e-06, "loss": 1.0646, "step": 9259 }, { "epoch": 0.21, "learning_rate": 9.13133490821397e-06, "loss": 0.9181, "step": 9260 }, { "epoch": 0.21, "learning_rate": 9.131123349378303e-06, "loss": 0.9916, "step": 9261 }, { "epoch": 0.21, "learning_rate": 9.130911767235118e-06, "loss": 0.9972, "step": 9262 }, { "epoch": 0.21, "learning_rate": 9.130700161785611e-06, "loss": 0.9283, "step": 9263 }, { "epoch": 0.21, "learning_rate": 9.130488533030973e-06, "loss": 1.1828, "step": 9264 }, { "epoch": 0.21, "learning_rate": 9.130276880972401e-06, "loss": 1.0757, "step": 9265 }, { "epoch": 0.21, "learning_rate": 9.130065205611087e-06, "loss": 0.9209, "step": 9266 }, { "epoch": 0.21, "learning_rate": 9.129853506948226e-06, "loss": 1.0945, "step": 9267 }, { "epoch": 0.21, "learning_rate": 9.129641784985013e-06, "loss": 0.7974, "step": 9268 }, { "epoch": 0.21, "learning_rate": 9.129430039722642e-06, "loss": 1.2118, "step": 9269 }, { "epoch": 0.21, "learning_rate": 9.129218271162307e-06, "loss": 0.8909, "step": 9270 }, { "epoch": 0.22, "learning_rate": 9.129006479305204e-06, "loss": 1.2373, "step": 9271 }, { "epoch": 0.22, "learning_rate": 9.128794664152527e-06, "loss": 1.0807, "step": 9272 }, { "epoch": 0.22, "learning_rate": 9.128582825705473e-06, "loss": 1.1232, "step": 9273 }, { "epoch": 0.22, "learning_rate": 9.128370963965233e-06, "loss": 0.9689, "step": 9274 }, { "epoch": 0.22, "learning_rate": 9.128159078933006e-06, "loss": 0.8886, "step": 9275 }, { "epoch": 0.22, "learning_rate": 9.127947170609986e-06, "loss": 0.8573, "step": 9276 }, { "epoch": 0.22, "learning_rate": 9.127735238997368e-06, "loss": 0.8229, "step": 9277 }, { "epoch": 0.22, "learning_rate": 9.12752328409635e-06, "loss": 1.2682, "step": 9278 }, { "epoch": 0.22, "learning_rate": 9.127311305908124e-06, "loss": 1.1257, "step": 9279 }, { "epoch": 0.22, "learning_rate": 9.12709930443389e-06, "loss": 0.8005, "step": 9280 }, { "epoch": 0.22, "learning_rate": 9.126887279674843e-06, "loss": 1.0281, "step": 9281 }, { "epoch": 0.22, "learning_rate": 9.126675231632178e-06, "loss": 1.1911, "step": 9282 }, { "epoch": 0.22, "learning_rate": 9.126463160307093e-06, "loss": 1.0822, "step": 9283 }, { "epoch": 0.22, "learning_rate": 9.126251065700783e-06, "loss": 1.0402, "step": 9284 }, { "epoch": 0.22, "learning_rate": 9.126038947814445e-06, "loss": 0.8665, "step": 9285 }, { "epoch": 0.22, "learning_rate": 9.125826806649275e-06, "loss": 0.8512, "step": 9286 }, { "epoch": 0.22, "learning_rate": 9.125614642206473e-06, "loss": 1.0523, "step": 9287 }, { "epoch": 0.22, "learning_rate": 9.125402454487232e-06, "loss": 0.849, "step": 9288 }, { "epoch": 0.22, "learning_rate": 9.125190243492753e-06, "loss": 1.2583, "step": 9289 }, { "epoch": 0.22, "learning_rate": 9.124978009224227e-06, "loss": 1.1414, "step": 9290 }, { "epoch": 0.22, "learning_rate": 9.12476575168286e-06, "loss": 1.0313, "step": 9291 }, { "epoch": 0.22, "learning_rate": 9.124553470869844e-06, "loss": 0.999, "step": 9292 }, { "epoch": 0.22, "learning_rate": 9.124341166786377e-06, "loss": 0.8945, "step": 9293 }, { "epoch": 0.22, "learning_rate": 9.124128839433657e-06, "loss": 0.7629, "step": 9294 }, { "epoch": 0.22, "learning_rate": 9.123916488812884e-06, "loss": 1.0041, "step": 9295 }, { "epoch": 0.22, "learning_rate": 9.123704114925255e-06, "loss": 1.1276, "step": 9296 }, { "epoch": 0.22, "learning_rate": 9.123491717771966e-06, "loss": 1.0182, "step": 9297 }, { "epoch": 0.22, "learning_rate": 9.12327929735422e-06, "loss": 1.0355, "step": 9298 }, { "epoch": 0.22, "learning_rate": 9.12306685367321e-06, "loss": 0.7685, "step": 9299 }, { "epoch": 0.22, "learning_rate": 9.122854386730139e-06, "loss": 1.2932, "step": 9300 }, { "epoch": 0.22, "learning_rate": 9.122641896526202e-06, "loss": 0.8761, "step": 9301 }, { "epoch": 0.22, "learning_rate": 9.122429383062604e-06, "loss": 0.7634, "step": 9302 }, { "epoch": 0.22, "learning_rate": 9.122216846340536e-06, "loss": 0.7061, "step": 9303 }, { "epoch": 0.22, "learning_rate": 9.122004286361202e-06, "loss": 0.9074, "step": 9304 }, { "epoch": 0.22, "learning_rate": 9.1217917031258e-06, "loss": 1.0116, "step": 9305 }, { "epoch": 0.22, "learning_rate": 9.12157909663553e-06, "loss": 1.1293, "step": 9306 }, { "epoch": 0.22, "learning_rate": 9.12136646689159e-06, "loss": 0.7801, "step": 9307 }, { "epoch": 0.22, "learning_rate": 9.121153813895183e-06, "loss": 0.9518, "step": 9308 }, { "epoch": 0.22, "learning_rate": 9.120941137647506e-06, "loss": 0.6549, "step": 9309 }, { "epoch": 0.22, "learning_rate": 9.120728438149758e-06, "loss": 1.1128, "step": 9310 }, { "epoch": 0.22, "learning_rate": 9.120515715403139e-06, "loss": 0.9693, "step": 9311 }, { "epoch": 0.22, "learning_rate": 9.120302969408854e-06, "loss": 1.4327, "step": 9312 }, { "epoch": 0.22, "learning_rate": 9.120090200168097e-06, "loss": 0.8454, "step": 9313 }, { "epoch": 0.22, "learning_rate": 9.119877407682075e-06, "loss": 0.7679, "step": 9314 }, { "epoch": 0.22, "learning_rate": 9.119664591951982e-06, "loss": 1.124, "step": 9315 }, { "epoch": 0.22, "learning_rate": 9.119451752979021e-06, "loss": 0.8277, "step": 9316 }, { "epoch": 0.22, "learning_rate": 9.119238890764394e-06, "loss": 0.8869, "step": 9317 }, { "epoch": 0.22, "learning_rate": 9.119026005309304e-06, "loss": 1.0582, "step": 9318 }, { "epoch": 0.22, "learning_rate": 9.118813096614947e-06, "loss": 0.9851, "step": 9319 }, { "epoch": 0.22, "learning_rate": 9.118600164682527e-06, "loss": 1.0182, "step": 9320 }, { "epoch": 0.22, "learning_rate": 9.118387209513246e-06, "loss": 0.9947, "step": 9321 }, { "epoch": 0.22, "learning_rate": 9.118174231108304e-06, "loss": 1.0261, "step": 9322 }, { "epoch": 0.22, "learning_rate": 9.117961229468903e-06, "loss": 1.012, "step": 9323 }, { "epoch": 0.22, "learning_rate": 9.117748204596243e-06, "loss": 1.0241, "step": 9324 }, { "epoch": 0.22, "learning_rate": 9.11753515649153e-06, "loss": 1.1538, "step": 9325 }, { "epoch": 0.22, "learning_rate": 9.117322085155964e-06, "loss": 0.9984, "step": 9326 }, { "epoch": 0.22, "learning_rate": 9.117108990590745e-06, "loss": 0.967, "step": 9327 }, { "epoch": 0.22, "learning_rate": 9.116895872797078e-06, "loss": 1.0544, "step": 9328 }, { "epoch": 0.22, "learning_rate": 9.116682731776166e-06, "loss": 0.9033, "step": 9329 }, { "epoch": 0.22, "learning_rate": 9.116469567529209e-06, "loss": 0.8316, "step": 9330 }, { "epoch": 0.22, "learning_rate": 9.11625638005741e-06, "loss": 1.1019, "step": 9331 }, { "epoch": 0.22, "learning_rate": 9.116043169361973e-06, "loss": 1.3506, "step": 9332 }, { "epoch": 0.22, "learning_rate": 9.115829935444101e-06, "loss": 1.2498, "step": 9333 }, { "epoch": 0.22, "learning_rate": 9.115616678304996e-06, "loss": 1.1, "step": 9334 }, { "epoch": 0.22, "learning_rate": 9.115403397945861e-06, "loss": 0.891, "step": 9335 }, { "epoch": 0.22, "learning_rate": 9.1151900943679e-06, "loss": 1.0073, "step": 9336 }, { "epoch": 0.22, "learning_rate": 9.114976767572317e-06, "loss": 1.0022, "step": 9337 }, { "epoch": 0.22, "learning_rate": 9.114763417560314e-06, "loss": 0.9943, "step": 9338 }, { "epoch": 0.22, "learning_rate": 9.114550044333097e-06, "loss": 0.8524, "step": 9339 }, { "epoch": 0.22, "learning_rate": 9.114336647891868e-06, "loss": 0.9781, "step": 9340 }, { "epoch": 0.22, "learning_rate": 9.11412322823783e-06, "loss": 0.8939, "step": 9341 }, { "epoch": 0.22, "learning_rate": 9.11390978537219e-06, "loss": 1.125, "step": 9342 }, { "epoch": 0.22, "learning_rate": 9.113696319296152e-06, "loss": 0.8503, "step": 9343 }, { "epoch": 0.22, "learning_rate": 9.113482830010918e-06, "loss": 1.14, "step": 9344 }, { "epoch": 0.22, "learning_rate": 9.113269317517693e-06, "loss": 1.0576, "step": 9345 }, { "epoch": 0.22, "learning_rate": 9.113055781817683e-06, "loss": 0.7865, "step": 9346 }, { "epoch": 0.22, "learning_rate": 9.112842222912092e-06, "loss": 1.0188, "step": 9347 }, { "epoch": 0.22, "learning_rate": 9.112628640802125e-06, "loss": 0.972, "step": 9348 }, { "epoch": 0.22, "learning_rate": 9.112415035488987e-06, "loss": 1.0394, "step": 9349 }, { "epoch": 0.22, "learning_rate": 9.112201406973883e-06, "loss": 0.81, "step": 9350 }, { "epoch": 0.22, "learning_rate": 9.111987755258018e-06, "loss": 0.9999, "step": 9351 }, { "epoch": 0.22, "learning_rate": 9.111774080342598e-06, "loss": 1.2354, "step": 9352 }, { "epoch": 0.22, "learning_rate": 9.111560382228828e-06, "loss": 0.8239, "step": 9353 }, { "epoch": 0.22, "learning_rate": 9.111346660917916e-06, "loss": 1.0509, "step": 9354 }, { "epoch": 0.22, "learning_rate": 9.111132916411064e-06, "loss": 0.8379, "step": 9355 }, { "epoch": 0.22, "learning_rate": 9.11091914870948e-06, "loss": 1.1556, "step": 9356 }, { "epoch": 0.22, "learning_rate": 9.11070535781437e-06, "loss": 1.2714, "step": 9357 }, { "epoch": 0.22, "learning_rate": 9.11049154372694e-06, "loss": 1.0593, "step": 9358 }, { "epoch": 0.22, "learning_rate": 9.110277706448396e-06, "loss": 0.882, "step": 9359 }, { "epoch": 0.22, "learning_rate": 9.110063845979945e-06, "loss": 0.9035, "step": 9360 }, { "epoch": 0.22, "learning_rate": 9.109849962322793e-06, "loss": 0.9871, "step": 9361 }, { "epoch": 0.22, "learning_rate": 9.109636055478148e-06, "loss": 0.8809, "step": 9362 }, { "epoch": 0.22, "learning_rate": 9.109422125447214e-06, "loss": 1.1059, "step": 9363 }, { "epoch": 0.22, "learning_rate": 9.109208172231201e-06, "loss": 0.9636, "step": 9364 }, { "epoch": 0.22, "learning_rate": 9.108994195831316e-06, "loss": 1.0667, "step": 9365 }, { "epoch": 0.22, "learning_rate": 9.108780196248764e-06, "loss": 1.1349, "step": 9366 }, { "epoch": 0.22, "learning_rate": 9.108566173484755e-06, "loss": 0.8041, "step": 9367 }, { "epoch": 0.22, "learning_rate": 9.108352127540493e-06, "loss": 0.908, "step": 9368 }, { "epoch": 0.22, "learning_rate": 9.108138058417188e-06, "loss": 1.1976, "step": 9369 }, { "epoch": 0.22, "learning_rate": 9.10792396611605e-06, "loss": 1.038, "step": 9370 }, { "epoch": 0.22, "learning_rate": 9.107709850638283e-06, "loss": 1.1078, "step": 9371 }, { "epoch": 0.22, "learning_rate": 9.107495711985094e-06, "loss": 1.1722, "step": 9372 }, { "epoch": 0.22, "learning_rate": 9.107281550157696e-06, "loss": 0.8818, "step": 9373 }, { "epoch": 0.22, "learning_rate": 9.107067365157295e-06, "loss": 0.8004, "step": 9374 }, { "epoch": 0.22, "learning_rate": 9.106853156985098e-06, "loss": 0.9742, "step": 9375 }, { "epoch": 0.22, "learning_rate": 9.106638925642317e-06, "loss": 0.9701, "step": 9376 }, { "epoch": 0.22, "learning_rate": 9.106424671130158e-06, "loss": 1.2796, "step": 9377 }, { "epoch": 0.22, "learning_rate": 9.106210393449828e-06, "loss": 1.3182, "step": 9378 }, { "epoch": 0.22, "learning_rate": 9.10599609260254e-06, "loss": 1.1905, "step": 9379 }, { "epoch": 0.22, "learning_rate": 9.105781768589502e-06, "loss": 1.0352, "step": 9380 }, { "epoch": 0.22, "learning_rate": 9.10556742141192e-06, "loss": 0.7711, "step": 9381 }, { "epoch": 0.22, "learning_rate": 9.105353051071009e-06, "loss": 1.0539, "step": 9382 }, { "epoch": 0.22, "learning_rate": 9.105138657567973e-06, "loss": 0.9523, "step": 9383 }, { "epoch": 0.22, "learning_rate": 9.104924240904024e-06, "loss": 0.831, "step": 9384 }, { "epoch": 0.22, "learning_rate": 9.104709801080374e-06, "loss": 0.9271, "step": 9385 }, { "epoch": 0.22, "learning_rate": 9.10449533809823e-06, "loss": 0.9422, "step": 9386 }, { "epoch": 0.22, "learning_rate": 9.1042808519588e-06, "loss": 0.9086, "step": 9387 }, { "epoch": 0.22, "learning_rate": 9.104066342663298e-06, "loss": 0.8201, "step": 9388 }, { "epoch": 0.22, "learning_rate": 9.103851810212934e-06, "loss": 0.8399, "step": 9389 }, { "epoch": 0.22, "learning_rate": 9.103637254608915e-06, "loss": 0.9284, "step": 9390 }, { "epoch": 0.22, "learning_rate": 9.103422675852456e-06, "loss": 0.9829, "step": 9391 }, { "epoch": 0.22, "learning_rate": 9.103208073944763e-06, "loss": 0.9759, "step": 9392 }, { "epoch": 0.22, "learning_rate": 9.102993448887052e-06, "loss": 0.8469, "step": 9393 }, { "epoch": 0.22, "learning_rate": 9.10277880068053e-06, "loss": 1.1174, "step": 9394 }, { "epoch": 0.22, "learning_rate": 9.102564129326408e-06, "loss": 0.8476, "step": 9395 }, { "epoch": 0.22, "learning_rate": 9.102349434825898e-06, "loss": 1.1058, "step": 9396 }, { "epoch": 0.22, "learning_rate": 9.102134717180213e-06, "loss": 1.1318, "step": 9397 }, { "epoch": 0.22, "learning_rate": 9.101919976390562e-06, "loss": 0.9744, "step": 9398 }, { "epoch": 0.22, "learning_rate": 9.101705212458159e-06, "loss": 1.1586, "step": 9399 }, { "epoch": 0.22, "learning_rate": 9.101490425384212e-06, "loss": 1.0431, "step": 9400 }, { "epoch": 0.22, "learning_rate": 9.101275615169935e-06, "loss": 0.853, "step": 9401 }, { "epoch": 0.22, "learning_rate": 9.101060781816542e-06, "loss": 1.021, "step": 9402 }, { "epoch": 0.22, "learning_rate": 9.100845925325242e-06, "loss": 0.907, "step": 9403 }, { "epoch": 0.22, "learning_rate": 9.100631045697248e-06, "loss": 1.1688, "step": 9404 }, { "epoch": 0.22, "learning_rate": 9.100416142933773e-06, "loss": 1.0553, "step": 9405 }, { "epoch": 0.22, "learning_rate": 9.100201217036029e-06, "loss": 1.0485, "step": 9406 }, { "epoch": 0.22, "learning_rate": 9.099986268005227e-06, "loss": 0.6032, "step": 9407 }, { "epoch": 0.22, "learning_rate": 9.099771295842584e-06, "loss": 0.8512, "step": 9408 }, { "epoch": 0.22, "learning_rate": 9.099556300549309e-06, "loss": 0.8852, "step": 9409 }, { "epoch": 0.22, "learning_rate": 9.099341282126615e-06, "loss": 1.0551, "step": 9410 }, { "epoch": 0.22, "learning_rate": 9.099126240575719e-06, "loss": 1.3033, "step": 9411 }, { "epoch": 0.22, "learning_rate": 9.098911175897828e-06, "loss": 1.0379, "step": 9412 }, { "epoch": 0.22, "learning_rate": 9.098696088094163e-06, "loss": 0.9821, "step": 9413 }, { "epoch": 0.22, "learning_rate": 9.09848097716593e-06, "loss": 0.9932, "step": 9414 }, { "epoch": 0.22, "learning_rate": 9.098265843114349e-06, "loss": 0.8627, "step": 9415 }, { "epoch": 0.22, "learning_rate": 9.09805068594063e-06, "loss": 1.1951, "step": 9416 }, { "epoch": 0.22, "learning_rate": 9.097835505645986e-06, "loss": 0.8343, "step": 9417 }, { "epoch": 0.22, "learning_rate": 9.097620302231634e-06, "loss": 0.8193, "step": 9418 }, { "epoch": 0.22, "learning_rate": 9.097405075698788e-06, "loss": 1.0317, "step": 9419 }, { "epoch": 0.22, "learning_rate": 9.09718982604866e-06, "loss": 1.3381, "step": 9420 }, { "epoch": 0.22, "learning_rate": 9.096974553282467e-06, "loss": 0.8494, "step": 9421 }, { "epoch": 0.22, "learning_rate": 9.09675925740142e-06, "loss": 0.9098, "step": 9422 }, { "epoch": 0.22, "learning_rate": 9.096543938406738e-06, "loss": 1.0191, "step": 9423 }, { "epoch": 0.22, "learning_rate": 9.096328596299632e-06, "loss": 0.9603, "step": 9424 }, { "epoch": 0.22, "learning_rate": 9.09611323108132e-06, "loss": 0.9933, "step": 9425 }, { "epoch": 0.22, "learning_rate": 9.095897842753016e-06, "loss": 0.8612, "step": 9426 }, { "epoch": 0.22, "learning_rate": 9.095682431315933e-06, "loss": 1.1635, "step": 9427 }, { "epoch": 0.22, "learning_rate": 9.095466996771291e-06, "loss": 0.9893, "step": 9428 }, { "epoch": 0.22, "learning_rate": 9.095251539120303e-06, "loss": 0.97, "step": 9429 }, { "epoch": 0.22, "learning_rate": 9.095036058364182e-06, "loss": 0.8677, "step": 9430 }, { "epoch": 0.22, "learning_rate": 9.094820554504147e-06, "loss": 0.8495, "step": 9431 }, { "epoch": 0.22, "learning_rate": 9.094605027541411e-06, "loss": 0.992, "step": 9432 }, { "epoch": 0.22, "learning_rate": 9.094389477477194e-06, "loss": 0.9143, "step": 9433 }, { "epoch": 0.22, "learning_rate": 9.094173904312711e-06, "loss": 1.0704, "step": 9434 }, { "epoch": 0.22, "learning_rate": 9.093958308049176e-06, "loss": 0.8339, "step": 9435 }, { "epoch": 0.22, "learning_rate": 9.093742688687807e-06, "loss": 0.8574, "step": 9436 }, { "epoch": 0.22, "learning_rate": 9.09352704622982e-06, "loss": 1.1058, "step": 9437 }, { "epoch": 0.22, "learning_rate": 9.093311380676432e-06, "loss": 1.041, "step": 9438 }, { "epoch": 0.22, "learning_rate": 9.09309569202886e-06, "loss": 1.1126, "step": 9439 }, { "epoch": 0.22, "learning_rate": 9.092879980288321e-06, "loss": 0.995, "step": 9440 }, { "epoch": 0.22, "learning_rate": 9.09266424545603e-06, "loss": 1.0437, "step": 9441 }, { "epoch": 0.22, "learning_rate": 9.092448487533207e-06, "loss": 0.9956, "step": 9442 }, { "epoch": 0.22, "learning_rate": 9.092232706521067e-06, "loss": 1.2699, "step": 9443 }, { "epoch": 0.22, "learning_rate": 9.092016902420829e-06, "loss": 0.9625, "step": 9444 }, { "epoch": 0.22, "learning_rate": 9.09180107523371e-06, "loss": 0.8523, "step": 9445 }, { "epoch": 0.22, "learning_rate": 9.091585224960928e-06, "loss": 1.2662, "step": 9446 }, { "epoch": 0.22, "learning_rate": 9.091369351603698e-06, "loss": 0.7305, "step": 9447 }, { "epoch": 0.22, "learning_rate": 9.091153455163244e-06, "loss": 1.3025, "step": 9448 }, { "epoch": 0.22, "learning_rate": 9.090937535640779e-06, "loss": 0.9604, "step": 9449 }, { "epoch": 0.22, "learning_rate": 9.090721593037521e-06, "loss": 1.1791, "step": 9450 }, { "epoch": 0.22, "learning_rate": 9.090505627354692e-06, "loss": 1.2547, "step": 9451 }, { "epoch": 0.22, "learning_rate": 9.090289638593507e-06, "loss": 0.9201, "step": 9452 }, { "epoch": 0.22, "learning_rate": 9.09007362675519e-06, "loss": 1.1015, "step": 9453 }, { "epoch": 0.22, "learning_rate": 9.089857591840951e-06, "loss": 0.9861, "step": 9454 }, { "epoch": 0.22, "learning_rate": 9.089641533852016e-06, "loss": 1.1064, "step": 9455 }, { "epoch": 0.22, "learning_rate": 9.089425452789602e-06, "loss": 0.805, "step": 9456 }, { "epoch": 0.22, "learning_rate": 9.089209348654926e-06, "loss": 0.9935, "step": 9457 }, { "epoch": 0.22, "learning_rate": 9.08899322144921e-06, "loss": 0.8853, "step": 9458 }, { "epoch": 0.22, "learning_rate": 9.088777071173674e-06, "loss": 0.9144, "step": 9459 }, { "epoch": 0.22, "learning_rate": 9.088560897829532e-06, "loss": 0.9361, "step": 9460 }, { "epoch": 0.22, "learning_rate": 9.08834470141801e-06, "loss": 1.2629, "step": 9461 }, { "epoch": 0.22, "learning_rate": 9.088128481940326e-06, "loss": 1.1144, "step": 9462 }, { "epoch": 0.22, "learning_rate": 9.087912239397699e-06, "loss": 0.8091, "step": 9463 }, { "epoch": 0.22, "learning_rate": 9.087695973791349e-06, "loss": 0.796, "step": 9464 }, { "epoch": 0.22, "learning_rate": 9.087479685122494e-06, "loss": 1.2855, "step": 9465 }, { "epoch": 0.22, "learning_rate": 9.08726337339236e-06, "loss": 1.0864, "step": 9466 }, { "epoch": 0.22, "learning_rate": 9.087047038602161e-06, "loss": 1.0975, "step": 9467 }, { "epoch": 0.22, "learning_rate": 9.086830680753122e-06, "loss": 0.9264, "step": 9468 }, { "epoch": 0.22, "learning_rate": 9.086614299846464e-06, "loss": 0.9112, "step": 9469 }, { "epoch": 0.22, "learning_rate": 9.086397895883402e-06, "loss": 1.2455, "step": 9470 }, { "epoch": 0.22, "learning_rate": 9.086181468865165e-06, "loss": 1.0292, "step": 9471 }, { "epoch": 0.22, "learning_rate": 9.085965018792968e-06, "loss": 0.9621, "step": 9472 }, { "epoch": 0.22, "learning_rate": 9.085748545668037e-06, "loss": 1.2426, "step": 9473 }, { "epoch": 0.22, "learning_rate": 9.085532049491588e-06, "loss": 1.0217, "step": 9474 }, { "epoch": 0.22, "learning_rate": 9.085315530264845e-06, "loss": 0.9429, "step": 9475 }, { "epoch": 0.22, "learning_rate": 9.08509898798903e-06, "loss": 1.2271, "step": 9476 }, { "epoch": 0.22, "learning_rate": 9.084882422665364e-06, "loss": 0.988, "step": 9477 }, { "epoch": 0.22, "learning_rate": 9.08466583429507e-06, "loss": 0.9878, "step": 9478 }, { "epoch": 0.22, "learning_rate": 9.08444922287937e-06, "loss": 1.1919, "step": 9479 }, { "epoch": 0.22, "learning_rate": 9.084232588419483e-06, "loss": 1.1792, "step": 9480 }, { "epoch": 0.22, "learning_rate": 9.084015930916637e-06, "loss": 0.8336, "step": 9481 }, { "epoch": 0.22, "learning_rate": 9.083799250372048e-06, "loss": 1.1296, "step": 9482 }, { "epoch": 0.22, "learning_rate": 9.083582546786942e-06, "loss": 1.0583, "step": 9483 }, { "epoch": 0.22, "learning_rate": 9.083365820162542e-06, "loss": 1.0808, "step": 9484 }, { "epoch": 0.22, "learning_rate": 9.083149070500069e-06, "loss": 1.0864, "step": 9485 }, { "epoch": 0.22, "learning_rate": 9.082932297800746e-06, "loss": 1.1213, "step": 9486 }, { "epoch": 0.22, "learning_rate": 9.082715502065798e-06, "loss": 0.9457, "step": 9487 }, { "epoch": 0.22, "learning_rate": 9.082498683296445e-06, "loss": 1.0001, "step": 9488 }, { "epoch": 0.22, "learning_rate": 9.082281841493915e-06, "loss": 1.0925, "step": 9489 }, { "epoch": 0.22, "learning_rate": 9.082064976659428e-06, "loss": 0.9204, "step": 9490 }, { "epoch": 0.22, "learning_rate": 9.081848088794206e-06, "loss": 0.9576, "step": 9491 }, { "epoch": 0.22, "learning_rate": 9.081631177899476e-06, "loss": 1.1457, "step": 9492 }, { "epoch": 0.22, "learning_rate": 9.08141424397646e-06, "loss": 1.144, "step": 9493 }, { "epoch": 0.22, "learning_rate": 9.081197287026383e-06, "loss": 0.7771, "step": 9494 }, { "epoch": 0.22, "learning_rate": 9.080980307050469e-06, "loss": 0.8408, "step": 9495 }, { "epoch": 0.22, "learning_rate": 9.08076330404994e-06, "loss": 0.9248, "step": 9496 }, { "epoch": 0.22, "learning_rate": 9.080546278026023e-06, "loss": 0.8819, "step": 9497 }, { "epoch": 0.22, "learning_rate": 9.080329228979942e-06, "loss": 1.3996, "step": 9498 }, { "epoch": 0.22, "learning_rate": 9.08011215691292e-06, "loss": 0.9872, "step": 9499 }, { "epoch": 0.22, "learning_rate": 9.079895061826182e-06, "loss": 0.9543, "step": 9500 }, { "epoch": 0.22, "learning_rate": 9.079677943720958e-06, "loss": 1.0953, "step": 9501 }, { "epoch": 0.22, "learning_rate": 9.079460802598463e-06, "loss": 0.9078, "step": 9502 }, { "epoch": 0.22, "learning_rate": 9.07924363845993e-06, "loss": 1.2032, "step": 9503 }, { "epoch": 0.22, "learning_rate": 9.079026451306583e-06, "loss": 1.3027, "step": 9504 }, { "epoch": 0.22, "learning_rate": 9.078809241139645e-06, "loss": 0.8923, "step": 9505 }, { "epoch": 0.22, "learning_rate": 9.078592007960342e-06, "loss": 1.1519, "step": 9506 }, { "epoch": 0.22, "learning_rate": 9.078374751769901e-06, "loss": 0.9547, "step": 9507 }, { "epoch": 0.22, "learning_rate": 9.078157472569547e-06, "loss": 1.0712, "step": 9508 }, { "epoch": 0.22, "learning_rate": 9.077940170360507e-06, "loss": 0.8659, "step": 9509 }, { "epoch": 0.22, "learning_rate": 9.077722845144004e-06, "loss": 1.0845, "step": 9510 }, { "epoch": 0.22, "learning_rate": 9.077505496921266e-06, "loss": 1.2045, "step": 9511 }, { "epoch": 0.22, "learning_rate": 9.077288125693522e-06, "loss": 0.864, "step": 9512 }, { "epoch": 0.22, "learning_rate": 9.077070731461994e-06, "loss": 1.0635, "step": 9513 }, { "epoch": 0.22, "learning_rate": 9.07685331422791e-06, "loss": 1.2617, "step": 9514 }, { "epoch": 0.22, "learning_rate": 9.076635873992498e-06, "loss": 1.0673, "step": 9515 }, { "epoch": 0.22, "learning_rate": 9.076418410756984e-06, "loss": 0.84, "step": 9516 }, { "epoch": 0.22, "learning_rate": 9.076200924522592e-06, "loss": 0.9723, "step": 9517 }, { "epoch": 0.22, "learning_rate": 9.075983415290555e-06, "loss": 0.9252, "step": 9518 }, { "epoch": 0.22, "learning_rate": 9.075765883062093e-06, "loss": 0.7536, "step": 9519 }, { "epoch": 0.22, "learning_rate": 9.07554832783844e-06, "loss": 0.8766, "step": 9520 }, { "epoch": 0.22, "learning_rate": 9.075330749620819e-06, "loss": 1.1579, "step": 9521 }, { "epoch": 0.22, "learning_rate": 9.07511314841046e-06, "loss": 1.073, "step": 9522 }, { "epoch": 0.22, "learning_rate": 9.07489552420859e-06, "loss": 0.9806, "step": 9523 }, { "epoch": 0.22, "learning_rate": 9.074677877016436e-06, "loss": 1.0472, "step": 9524 }, { "epoch": 0.22, "learning_rate": 9.074460206835227e-06, "loss": 0.9827, "step": 9525 }, { "epoch": 0.22, "learning_rate": 9.074242513666192e-06, "loss": 1.0928, "step": 9526 }, { "epoch": 0.22, "learning_rate": 9.074024797510557e-06, "loss": 0.9485, "step": 9527 }, { "epoch": 0.22, "learning_rate": 9.07380705836955e-06, "loss": 0.9876, "step": 9528 }, { "epoch": 0.22, "learning_rate": 9.0735892962444e-06, "loss": 1.284, "step": 9529 }, { "epoch": 0.22, "learning_rate": 9.073371511136337e-06, "loss": 0.9358, "step": 9530 }, { "epoch": 0.22, "learning_rate": 9.07315370304659e-06, "loss": 1.141, "step": 9531 }, { "epoch": 0.22, "learning_rate": 9.072935871976387e-06, "loss": 0.8957, "step": 9532 }, { "epoch": 0.22, "learning_rate": 9.072718017926957e-06, "loss": 1.0459, "step": 9533 }, { "epoch": 0.22, "learning_rate": 9.072500140899528e-06, "loss": 1.1884, "step": 9534 }, { "epoch": 0.22, "learning_rate": 9.07228224089533e-06, "loss": 1.0954, "step": 9535 }, { "epoch": 0.22, "learning_rate": 9.072064317915593e-06, "loss": 1.2003, "step": 9536 }, { "epoch": 0.22, "learning_rate": 9.071846371961547e-06, "loss": 1.0171, "step": 9537 }, { "epoch": 0.22, "learning_rate": 9.07162840303442e-06, "loss": 1.3258, "step": 9538 }, { "epoch": 0.22, "learning_rate": 9.071410411135442e-06, "loss": 0.9908, "step": 9539 }, { "epoch": 0.22, "learning_rate": 9.071192396265845e-06, "loss": 0.8502, "step": 9540 }, { "epoch": 0.22, "learning_rate": 9.070974358426854e-06, "loss": 1.2542, "step": 9541 }, { "epoch": 0.22, "learning_rate": 9.070756297619706e-06, "loss": 1.2058, "step": 9542 }, { "epoch": 0.22, "learning_rate": 9.070538213845627e-06, "loss": 1.192, "step": 9543 }, { "epoch": 0.22, "learning_rate": 9.070320107105847e-06, "loss": 1.0073, "step": 9544 }, { "epoch": 0.22, "learning_rate": 9.0701019774016e-06, "loss": 0.8306, "step": 9545 }, { "epoch": 0.22, "learning_rate": 9.069883824734113e-06, "loss": 0.8013, "step": 9546 }, { "epoch": 0.22, "learning_rate": 9.069665649104617e-06, "loss": 0.9991, "step": 9547 }, { "epoch": 0.22, "learning_rate": 9.069447450514346e-06, "loss": 0.9535, "step": 9548 }, { "epoch": 0.22, "learning_rate": 9.069229228964531e-06, "loss": 1.091, "step": 9549 }, { "epoch": 0.22, "learning_rate": 9.069010984456399e-06, "loss": 1.1855, "step": 9550 }, { "epoch": 0.22, "learning_rate": 9.068792716991184e-06, "loss": 1.1423, "step": 9551 }, { "epoch": 0.22, "learning_rate": 9.068574426570118e-06, "loss": 1.0483, "step": 9552 }, { "epoch": 0.22, "learning_rate": 9.068356113194431e-06, "loss": 0.9203, "step": 9553 }, { "epoch": 0.22, "learning_rate": 9.068137776865356e-06, "loss": 1.1496, "step": 9554 }, { "epoch": 0.22, "learning_rate": 9.067919417584125e-06, "loss": 1.1435, "step": 9555 }, { "epoch": 0.22, "learning_rate": 9.067701035351968e-06, "loss": 0.9498, "step": 9556 }, { "epoch": 0.22, "learning_rate": 9.067482630170119e-06, "loss": 0.7571, "step": 9557 }, { "epoch": 0.22, "learning_rate": 9.067264202039811e-06, "loss": 1.1481, "step": 9558 }, { "epoch": 0.22, "learning_rate": 9.067045750962273e-06, "loss": 1.1033, "step": 9559 }, { "epoch": 0.22, "learning_rate": 9.066827276938742e-06, "loss": 1.0493, "step": 9560 }, { "epoch": 0.22, "learning_rate": 9.066608779970444e-06, "loss": 1.0607, "step": 9561 }, { "epoch": 0.22, "learning_rate": 9.06639026005862e-06, "loss": 1.0673, "step": 9562 }, { "epoch": 0.22, "learning_rate": 9.066171717204498e-06, "loss": 1.0198, "step": 9563 }, { "epoch": 0.22, "learning_rate": 9.06595315140931e-06, "loss": 0.9935, "step": 9564 }, { "epoch": 0.22, "learning_rate": 9.065734562674292e-06, "loss": 0.9886, "step": 9565 }, { "epoch": 0.22, "learning_rate": 9.065515951000676e-06, "loss": 0.8589, "step": 9566 }, { "epoch": 0.22, "learning_rate": 9.065297316389696e-06, "loss": 1.1213, "step": 9567 }, { "epoch": 0.22, "learning_rate": 9.065078658842583e-06, "loss": 1.0501, "step": 9568 }, { "epoch": 0.22, "learning_rate": 9.064859978360574e-06, "loss": 0.993, "step": 9569 }, { "epoch": 0.22, "learning_rate": 9.064641274944903e-06, "loss": 1.0133, "step": 9570 }, { "epoch": 0.22, "learning_rate": 9.0644225485968e-06, "loss": 0.9569, "step": 9571 }, { "epoch": 0.22, "learning_rate": 9.064203799317503e-06, "loss": 0.8248, "step": 9572 }, { "epoch": 0.22, "learning_rate": 9.063985027108245e-06, "loss": 0.9216, "step": 9573 }, { "epoch": 0.22, "learning_rate": 9.063766231970257e-06, "loss": 1.3372, "step": 9574 }, { "epoch": 0.22, "learning_rate": 9.06354741390478e-06, "loss": 1.1913, "step": 9575 }, { "epoch": 0.22, "learning_rate": 9.063328572913043e-06, "loss": 1.2958, "step": 9576 }, { "epoch": 0.22, "learning_rate": 9.063109708996283e-06, "loss": 0.8858, "step": 9577 }, { "epoch": 0.22, "learning_rate": 9.062890822155734e-06, "loss": 0.9102, "step": 9578 }, { "epoch": 0.22, "learning_rate": 9.062671912392631e-06, "loss": 0.8478, "step": 9579 }, { "epoch": 0.22, "learning_rate": 9.062452979708211e-06, "loss": 1.1367, "step": 9580 }, { "epoch": 0.22, "learning_rate": 9.062234024103707e-06, "loss": 1.1765, "step": 9581 }, { "epoch": 0.22, "learning_rate": 9.062015045580354e-06, "loss": 0.9293, "step": 9582 }, { "epoch": 0.22, "learning_rate": 9.06179604413939e-06, "loss": 0.9867, "step": 9583 }, { "epoch": 0.22, "learning_rate": 9.061577019782048e-06, "loss": 1.1037, "step": 9584 }, { "epoch": 0.22, "learning_rate": 9.061357972509564e-06, "loss": 0.9841, "step": 9585 }, { "epoch": 0.22, "learning_rate": 9.061138902323175e-06, "loss": 1.1669, "step": 9586 }, { "epoch": 0.22, "learning_rate": 9.060919809224117e-06, "loss": 0.7535, "step": 9587 }, { "epoch": 0.22, "learning_rate": 9.060700693213627e-06, "loss": 0.8049, "step": 9588 }, { "epoch": 0.22, "learning_rate": 9.060481554292937e-06, "loss": 0.8184, "step": 9589 }, { "epoch": 0.22, "learning_rate": 9.060262392463288e-06, "loss": 0.8215, "step": 9590 }, { "epoch": 0.22, "learning_rate": 9.060043207725915e-06, "loss": 0.9, "step": 9591 }, { "epoch": 0.22, "learning_rate": 9.059824000082054e-06, "loss": 1.195, "step": 9592 }, { "epoch": 0.22, "learning_rate": 9.05960476953294e-06, "loss": 0.9633, "step": 9593 }, { "epoch": 0.22, "learning_rate": 9.059385516079816e-06, "loss": 1.2976, "step": 9594 }, { "epoch": 0.22, "learning_rate": 9.059166239723914e-06, "loss": 0.9252, "step": 9595 }, { "epoch": 0.22, "learning_rate": 9.05894694046647e-06, "loss": 1.1854, "step": 9596 }, { "epoch": 0.22, "learning_rate": 9.058727618308724e-06, "loss": 0.8583, "step": 9597 }, { "epoch": 0.22, "learning_rate": 9.058508273251914e-06, "loss": 1.0401, "step": 9598 }, { "epoch": 0.22, "learning_rate": 9.058288905297277e-06, "loss": 1.0306, "step": 9599 }, { "epoch": 0.22, "learning_rate": 9.058069514446049e-06, "loss": 0.7623, "step": 9600 }, { "epoch": 0.22, "learning_rate": 9.057850100699468e-06, "loss": 0.7637, "step": 9601 }, { "epoch": 0.22, "learning_rate": 9.057630664058774e-06, "loss": 0.8806, "step": 9602 }, { "epoch": 0.22, "learning_rate": 9.057411204525203e-06, "loss": 0.992, "step": 9603 }, { "epoch": 0.22, "learning_rate": 9.057191722099994e-06, "loss": 1.2409, "step": 9604 }, { "epoch": 0.22, "learning_rate": 9.056972216784386e-06, "loss": 0.9366, "step": 9605 }, { "epoch": 0.22, "learning_rate": 9.056752688579617e-06, "loss": 0.9069, "step": 9606 }, { "epoch": 0.22, "learning_rate": 9.056533137486924e-06, "loss": 0.8333, "step": 9607 }, { "epoch": 0.22, "learning_rate": 9.056313563507547e-06, "loss": 1.2855, "step": 9608 }, { "epoch": 0.22, "learning_rate": 9.056093966642724e-06, "loss": 0.8823, "step": 9609 }, { "epoch": 0.22, "learning_rate": 9.055874346893698e-06, "loss": 1.0675, "step": 9610 }, { "epoch": 0.22, "learning_rate": 9.055654704261703e-06, "loss": 1.2765, "step": 9611 }, { "epoch": 0.22, "learning_rate": 9.05543503874798e-06, "loss": 0.9126, "step": 9612 }, { "epoch": 0.22, "learning_rate": 9.055215350353768e-06, "loss": 1.2768, "step": 9613 }, { "epoch": 0.22, "learning_rate": 9.054995639080306e-06, "loss": 1.1912, "step": 9614 }, { "epoch": 0.22, "learning_rate": 9.054775904928837e-06, "loss": 0.8984, "step": 9615 }, { "epoch": 0.22, "learning_rate": 9.054556147900597e-06, "loss": 1.2969, "step": 9616 }, { "epoch": 0.22, "learning_rate": 9.054336367996826e-06, "loss": 1.028, "step": 9617 }, { "epoch": 0.22, "learning_rate": 9.054116565218766e-06, "loss": 0.8078, "step": 9618 }, { "epoch": 0.22, "learning_rate": 9.053896739567655e-06, "loss": 1.0363, "step": 9619 }, { "epoch": 0.22, "learning_rate": 9.053676891044736e-06, "loss": 0.9039, "step": 9620 }, { "epoch": 0.22, "learning_rate": 9.053457019651245e-06, "loss": 0.9576, "step": 9621 }, { "epoch": 0.22, "learning_rate": 9.053237125388428e-06, "loss": 1.0175, "step": 9622 }, { "epoch": 0.22, "learning_rate": 9.053017208257522e-06, "loss": 0.8663, "step": 9623 }, { "epoch": 0.22, "learning_rate": 9.05279726825977e-06, "loss": 1.0894, "step": 9624 }, { "epoch": 0.22, "learning_rate": 9.052577305396409e-06, "loss": 0.8046, "step": 9625 }, { "epoch": 0.22, "learning_rate": 9.052357319668683e-06, "loss": 0.9178, "step": 9626 }, { "epoch": 0.22, "learning_rate": 9.052137311077833e-06, "loss": 0.9593, "step": 9627 }, { "epoch": 0.22, "learning_rate": 9.0519172796251e-06, "loss": 0.8644, "step": 9628 }, { "epoch": 0.22, "learning_rate": 9.051697225311726e-06, "loss": 1.0879, "step": 9629 }, { "epoch": 0.22, "learning_rate": 9.051477148138953e-06, "loss": 1.0875, "step": 9630 }, { "epoch": 0.22, "learning_rate": 9.051257048108017e-06, "loss": 1.1066, "step": 9631 }, { "epoch": 0.22, "learning_rate": 9.051036925220167e-06, "loss": 1.0224, "step": 9632 }, { "epoch": 0.22, "learning_rate": 9.050816779476644e-06, "loss": 1.0063, "step": 9633 }, { "epoch": 0.22, "learning_rate": 9.050596610878686e-06, "loss": 1.2504, "step": 9634 }, { "epoch": 0.22, "learning_rate": 9.050376419427537e-06, "loss": 0.9895, "step": 9635 }, { "epoch": 0.22, "learning_rate": 9.05015620512444e-06, "loss": 1.0127, "step": 9636 }, { "epoch": 0.22, "learning_rate": 9.04993596797064e-06, "loss": 0.89, "step": 9637 }, { "epoch": 0.22, "learning_rate": 9.049715707967373e-06, "loss": 0.9882, "step": 9638 }, { "epoch": 0.22, "learning_rate": 9.049495425115889e-06, "loss": 0.9601, "step": 9639 }, { "epoch": 0.22, "learning_rate": 9.049275119417424e-06, "loss": 0.8782, "step": 9640 }, { "epoch": 0.22, "learning_rate": 9.049054790873227e-06, "loss": 1.1297, "step": 9641 }, { "epoch": 0.22, "learning_rate": 9.048834439484536e-06, "loss": 1.145, "step": 9642 }, { "epoch": 0.22, "learning_rate": 9.048614065252596e-06, "loss": 0.8423, "step": 9643 }, { "epoch": 0.22, "learning_rate": 9.048393668178653e-06, "loss": 0.7841, "step": 9644 }, { "epoch": 0.22, "learning_rate": 9.048173248263948e-06, "loss": 1.0978, "step": 9645 }, { "epoch": 0.22, "learning_rate": 9.047952805509723e-06, "loss": 1.1069, "step": 9646 }, { "epoch": 0.22, "learning_rate": 9.047732339917226e-06, "loss": 1.2043, "step": 9647 }, { "epoch": 0.22, "learning_rate": 9.047511851487696e-06, "loss": 0.978, "step": 9648 }, { "epoch": 0.22, "learning_rate": 9.047291340222382e-06, "loss": 1.0637, "step": 9649 }, { "epoch": 0.22, "learning_rate": 9.047070806122525e-06, "loss": 1.0518, "step": 9650 }, { "epoch": 0.22, "learning_rate": 9.046850249189368e-06, "loss": 1.3205, "step": 9651 }, { "epoch": 0.22, "learning_rate": 9.046629669424158e-06, "loss": 0.9414, "step": 9652 }, { "epoch": 0.22, "learning_rate": 9.04640906682814e-06, "loss": 1.0073, "step": 9653 }, { "epoch": 0.22, "learning_rate": 9.046188441402557e-06, "loss": 0.946, "step": 9654 }, { "epoch": 0.22, "learning_rate": 9.045967793148654e-06, "loss": 1.0458, "step": 9655 }, { "epoch": 0.22, "learning_rate": 9.045747122067674e-06, "loss": 1.1017, "step": 9656 }, { "epoch": 0.22, "learning_rate": 9.045526428160865e-06, "loss": 1.0922, "step": 9657 }, { "epoch": 0.22, "learning_rate": 9.04530571142947e-06, "loss": 1.031, "step": 9658 }, { "epoch": 0.22, "learning_rate": 9.045084971874738e-06, "loss": 0.9628, "step": 9659 }, { "epoch": 0.22, "learning_rate": 9.04486420949791e-06, "loss": 0.8482, "step": 9660 }, { "epoch": 0.22, "learning_rate": 9.044643424300234e-06, "loss": 1.1629, "step": 9661 }, { "epoch": 0.22, "learning_rate": 9.044422616282956e-06, "loss": 1.0483, "step": 9662 }, { "epoch": 0.22, "learning_rate": 9.044201785447318e-06, "loss": 1.0623, "step": 9663 }, { "epoch": 0.22, "learning_rate": 9.043980931794569e-06, "loss": 1.1023, "step": 9664 }, { "epoch": 0.22, "learning_rate": 9.043760055325956e-06, "loss": 0.8954, "step": 9665 }, { "epoch": 0.22, "learning_rate": 9.043539156042723e-06, "loss": 0.9405, "step": 9666 }, { "epoch": 0.22, "learning_rate": 9.043318233946117e-06, "loss": 1.0856, "step": 9667 }, { "epoch": 0.22, "learning_rate": 9.043097289037386e-06, "loss": 1.0504, "step": 9668 }, { "epoch": 0.22, "learning_rate": 9.042876321317773e-06, "loss": 0.8628, "step": 9669 }, { "epoch": 0.22, "learning_rate": 9.042655330788529e-06, "loss": 1.0097, "step": 9670 }, { "epoch": 0.22, "learning_rate": 9.042434317450896e-06, "loss": 1.0681, "step": 9671 }, { "epoch": 0.22, "learning_rate": 9.042213281306127e-06, "loss": 0.9769, "step": 9672 }, { "epoch": 0.22, "learning_rate": 9.041992222355462e-06, "loss": 0.8595, "step": 9673 }, { "epoch": 0.22, "learning_rate": 9.041771140600155e-06, "loss": 1.0784, "step": 9674 }, { "epoch": 0.22, "learning_rate": 9.041550036041448e-06, "loss": 0.8314, "step": 9675 }, { "epoch": 0.22, "learning_rate": 9.04132890868059e-06, "loss": 1.0285, "step": 9676 }, { "epoch": 0.22, "learning_rate": 9.041107758518832e-06, "loss": 0.8703, "step": 9677 }, { "epoch": 0.22, "learning_rate": 9.040886585557417e-06, "loss": 1.1521, "step": 9678 }, { "epoch": 0.22, "learning_rate": 9.040665389797595e-06, "loss": 0.9796, "step": 9679 }, { "epoch": 0.22, "learning_rate": 9.040444171240615e-06, "loss": 1.3492, "step": 9680 }, { "epoch": 0.22, "learning_rate": 9.04022292988772e-06, "loss": 1.1554, "step": 9681 }, { "epoch": 0.22, "learning_rate": 9.040001665740166e-06, "loss": 1.0246, "step": 9682 }, { "epoch": 0.22, "learning_rate": 9.039780378799197e-06, "loss": 0.9084, "step": 9683 }, { "epoch": 0.22, "learning_rate": 9.039559069066059e-06, "loss": 1.0927, "step": 9684 }, { "epoch": 0.22, "learning_rate": 9.039337736542007e-06, "loss": 0.9118, "step": 9685 }, { "epoch": 0.22, "learning_rate": 9.039116381228284e-06, "loss": 0.9402, "step": 9686 }, { "epoch": 0.22, "learning_rate": 9.038895003126143e-06, "loss": 0.9468, "step": 9687 }, { "epoch": 0.22, "learning_rate": 9.038673602236829e-06, "loss": 0.8975, "step": 9688 }, { "epoch": 0.22, "learning_rate": 9.038452178561595e-06, "loss": 0.9869, "step": 9689 }, { "epoch": 0.22, "learning_rate": 9.038230732101687e-06, "loss": 1.0729, "step": 9690 }, { "epoch": 0.22, "learning_rate": 9.038009262858356e-06, "loss": 0.7924, "step": 9691 }, { "epoch": 0.22, "learning_rate": 9.037787770832853e-06, "loss": 1.3256, "step": 9692 }, { "epoch": 0.22, "learning_rate": 9.037566256026425e-06, "loss": 0.9582, "step": 9693 }, { "epoch": 0.22, "learning_rate": 9.037344718440321e-06, "loss": 1.1074, "step": 9694 }, { "epoch": 0.22, "learning_rate": 9.037123158075796e-06, "loss": 1.1481, "step": 9695 }, { "epoch": 0.22, "learning_rate": 9.036901574934097e-06, "loss": 0.9866, "step": 9696 }, { "epoch": 0.22, "learning_rate": 9.036679969016471e-06, "loss": 1.0099, "step": 9697 }, { "epoch": 0.22, "learning_rate": 9.036458340324173e-06, "loss": 0.7145, "step": 9698 }, { "epoch": 0.22, "learning_rate": 9.03623668885845e-06, "loss": 0.7717, "step": 9699 }, { "epoch": 0.22, "learning_rate": 9.036015014620557e-06, "loss": 0.7609, "step": 9700 }, { "epoch": 0.22, "learning_rate": 9.03579331761174e-06, "loss": 0.7048, "step": 9701 }, { "epoch": 0.23, "learning_rate": 9.03557159783325e-06, "loss": 0.8932, "step": 9702 }, { "epoch": 0.23, "learning_rate": 9.035349855286342e-06, "loss": 0.856, "step": 9703 }, { "epoch": 0.23, "learning_rate": 9.035128089972262e-06, "loss": 1.2339, "step": 9704 }, { "epoch": 0.23, "learning_rate": 9.034906301892265e-06, "loss": 1.0987, "step": 9705 }, { "epoch": 0.23, "learning_rate": 9.034684491047603e-06, "loss": 1.0608, "step": 9706 }, { "epoch": 0.23, "learning_rate": 9.034462657439524e-06, "loss": 1.1213, "step": 9707 }, { "epoch": 0.23, "learning_rate": 9.03424080106928e-06, "loss": 0.9636, "step": 9708 }, { "epoch": 0.23, "learning_rate": 9.034018921938125e-06, "loss": 0.8866, "step": 9709 }, { "epoch": 0.23, "learning_rate": 9.033797020047311e-06, "loss": 0.9441, "step": 9710 }, { "epoch": 0.23, "learning_rate": 9.033575095398088e-06, "loss": 1.0002, "step": 9711 }, { "epoch": 0.23, "learning_rate": 9.033353147991708e-06, "loss": 1.0627, "step": 9712 }, { "epoch": 0.23, "learning_rate": 9.033131177829424e-06, "loss": 0.5857, "step": 9713 }, { "epoch": 0.23, "learning_rate": 9.032909184912487e-06, "loss": 0.8946, "step": 9714 }, { "epoch": 0.23, "learning_rate": 9.032687169242152e-06, "loss": 1.0209, "step": 9715 }, { "epoch": 0.23, "learning_rate": 9.03246513081967e-06, "loss": 0.6937, "step": 9716 }, { "epoch": 0.23, "learning_rate": 9.032243069646295e-06, "loss": 1.0309, "step": 9717 }, { "epoch": 0.23, "learning_rate": 9.032020985723278e-06, "loss": 0.8126, "step": 9718 }, { "epoch": 0.23, "learning_rate": 9.031798879051872e-06, "loss": 0.8731, "step": 9719 }, { "epoch": 0.23, "learning_rate": 9.031576749633333e-06, "loss": 0.8785, "step": 9720 }, { "epoch": 0.23, "learning_rate": 9.031354597468911e-06, "loss": 1.035, "step": 9721 }, { "epoch": 0.23, "learning_rate": 9.03113242255986e-06, "loss": 0.8814, "step": 9722 }, { "epoch": 0.23, "learning_rate": 9.030910224907435e-06, "loss": 0.9317, "step": 9723 }, { "epoch": 0.23, "learning_rate": 9.030688004512889e-06, "loss": 0.9853, "step": 9724 }, { "epoch": 0.23, "learning_rate": 9.030465761377474e-06, "loss": 1.0435, "step": 9725 }, { "epoch": 0.23, "learning_rate": 9.030243495502446e-06, "loss": 0.9996, "step": 9726 }, { "epoch": 0.23, "learning_rate": 9.030021206889058e-06, "loss": 0.9308, "step": 9727 }, { "epoch": 0.23, "learning_rate": 9.029798895538566e-06, "loss": 0.8863, "step": 9728 }, { "epoch": 0.23, "learning_rate": 9.029576561452221e-06, "loss": 1.1238, "step": 9729 }, { "epoch": 0.23, "learning_rate": 9.029354204631279e-06, "loss": 1.2189, "step": 9730 }, { "epoch": 0.23, "learning_rate": 9.029131825076997e-06, "loss": 0.9926, "step": 9731 }, { "epoch": 0.23, "learning_rate": 9.028909422790626e-06, "loss": 1.2052, "step": 9732 }, { "epoch": 0.23, "learning_rate": 9.028686997773421e-06, "loss": 0.9153, "step": 9733 }, { "epoch": 0.23, "learning_rate": 9.02846455002664e-06, "loss": 0.8082, "step": 9734 }, { "epoch": 0.23, "learning_rate": 9.028242079551535e-06, "loss": 1.0119, "step": 9735 }, { "epoch": 0.23, "learning_rate": 9.028019586349362e-06, "loss": 0.8864, "step": 9736 }, { "epoch": 0.23, "learning_rate": 9.027797070421376e-06, "loss": 1.0861, "step": 9737 }, { "epoch": 0.23, "learning_rate": 9.027574531768833e-06, "loss": 0.8789, "step": 9738 }, { "epoch": 0.23, "learning_rate": 9.02735197039299e-06, "loss": 0.901, "step": 9739 }, { "epoch": 0.23, "learning_rate": 9.0271293862951e-06, "loss": 1.0981, "step": 9740 }, { "epoch": 0.23, "learning_rate": 9.026906779476418e-06, "loss": 1.0848, "step": 9741 }, { "epoch": 0.23, "learning_rate": 9.026684149938205e-06, "loss": 0.681, "step": 9742 }, { "epoch": 0.23, "learning_rate": 9.026461497681714e-06, "loss": 0.7118, "step": 9743 }, { "epoch": 0.23, "learning_rate": 9.026238822708198e-06, "loss": 0.9026, "step": 9744 }, { "epoch": 0.23, "learning_rate": 9.026016125018919e-06, "loss": 1.0138, "step": 9745 }, { "epoch": 0.23, "learning_rate": 9.02579340461513e-06, "loss": 0.7268, "step": 9746 }, { "epoch": 0.23, "learning_rate": 9.025570661498088e-06, "loss": 0.9666, "step": 9747 }, { "epoch": 0.23, "learning_rate": 9.025347895669052e-06, "loss": 0.7606, "step": 9748 }, { "epoch": 0.23, "learning_rate": 9.025125107129276e-06, "loss": 0.9506, "step": 9749 }, { "epoch": 0.23, "learning_rate": 9.024902295880016e-06, "loss": 1.0478, "step": 9750 }, { "epoch": 0.23, "learning_rate": 9.024679461922532e-06, "loss": 0.9781, "step": 9751 }, { "epoch": 0.23, "learning_rate": 9.024456605258083e-06, "loss": 0.9147, "step": 9752 }, { "epoch": 0.23, "learning_rate": 9.024233725887921e-06, "loss": 1.0423, "step": 9753 }, { "epoch": 0.23, "learning_rate": 9.024010823813307e-06, "loss": 0.9842, "step": 9754 }, { "epoch": 0.23, "learning_rate": 9.023787899035496e-06, "loss": 0.7956, "step": 9755 }, { "epoch": 0.23, "learning_rate": 9.02356495155575e-06, "loss": 1.0924, "step": 9756 }, { "epoch": 0.23, "learning_rate": 9.023341981375321e-06, "loss": 0.7812, "step": 9757 }, { "epoch": 0.23, "learning_rate": 9.023118988495474e-06, "loss": 1.1099, "step": 9758 }, { "epoch": 0.23, "learning_rate": 9.02289597291746e-06, "loss": 0.8438, "step": 9759 }, { "epoch": 0.23, "learning_rate": 9.022672934642542e-06, "loss": 0.9377, "step": 9760 }, { "epoch": 0.23, "learning_rate": 9.022449873671977e-06, "loss": 0.8633, "step": 9761 }, { "epoch": 0.23, "learning_rate": 9.022226790007023e-06, "loss": 1.1212, "step": 9762 }, { "epoch": 0.23, "learning_rate": 9.022003683648939e-06, "loss": 1.0696, "step": 9763 }, { "epoch": 0.23, "learning_rate": 9.021780554598984e-06, "loss": 1.1289, "step": 9764 }, { "epoch": 0.23, "learning_rate": 9.021557402858417e-06, "loss": 1.1774, "step": 9765 }, { "epoch": 0.23, "learning_rate": 9.021334228428497e-06, "loss": 1.19, "step": 9766 }, { "epoch": 0.23, "learning_rate": 9.021111031310482e-06, "loss": 1.0198, "step": 9767 }, { "epoch": 0.23, "learning_rate": 9.020887811505632e-06, "loss": 1.072, "step": 9768 }, { "epoch": 0.23, "learning_rate": 9.020664569015207e-06, "loss": 0.7778, "step": 9769 }, { "epoch": 0.23, "learning_rate": 9.020441303840466e-06, "loss": 0.944, "step": 9770 }, { "epoch": 0.23, "learning_rate": 9.02021801598267e-06, "loss": 1.1178, "step": 9771 }, { "epoch": 0.23, "learning_rate": 9.019994705443074e-06, "loss": 0.9809, "step": 9772 }, { "epoch": 0.23, "learning_rate": 9.019771372222944e-06, "loss": 0.6566, "step": 9773 }, { "epoch": 0.23, "learning_rate": 9.019548016323536e-06, "loss": 1.1747, "step": 9774 }, { "epoch": 0.23, "learning_rate": 9.019324637746111e-06, "loss": 1.1056, "step": 9775 }, { "epoch": 0.23, "learning_rate": 9.019101236491932e-06, "loss": 1.0662, "step": 9776 }, { "epoch": 0.23, "learning_rate": 9.018877812562255e-06, "loss": 1.0484, "step": 9777 }, { "epoch": 0.23, "learning_rate": 9.018654365958343e-06, "loss": 0.7434, "step": 9778 }, { "epoch": 0.23, "learning_rate": 9.018430896681459e-06, "loss": 1.1302, "step": 9779 }, { "epoch": 0.23, "learning_rate": 9.01820740473286e-06, "loss": 1.216, "step": 9780 }, { "epoch": 0.23, "learning_rate": 9.017983890113806e-06, "loss": 0.8927, "step": 9781 }, { "epoch": 0.23, "learning_rate": 9.017760352825561e-06, "loss": 0.6629, "step": 9782 }, { "epoch": 0.23, "learning_rate": 9.017536792869386e-06, "loss": 0.9547, "step": 9783 }, { "epoch": 0.23, "learning_rate": 9.017313210246544e-06, "loss": 1.0738, "step": 9784 }, { "epoch": 0.23, "learning_rate": 9.017089604958292e-06, "loss": 1.0742, "step": 9785 }, { "epoch": 0.23, "learning_rate": 9.016865977005893e-06, "loss": 1.1214, "step": 9786 }, { "epoch": 0.23, "learning_rate": 9.01664232639061e-06, "loss": 0.7812, "step": 9787 }, { "epoch": 0.23, "learning_rate": 9.016418653113704e-06, "loss": 1.0914, "step": 9788 }, { "epoch": 0.23, "learning_rate": 9.016194957176437e-06, "loss": 1.2043, "step": 9789 }, { "epoch": 0.23, "learning_rate": 9.01597123858007e-06, "loss": 1.0142, "step": 9790 }, { "epoch": 0.23, "learning_rate": 9.01574749732587e-06, "loss": 0.8293, "step": 9791 }, { "epoch": 0.23, "learning_rate": 9.015523733415093e-06, "loss": 0.9739, "step": 9792 }, { "epoch": 0.23, "learning_rate": 9.015299946849006e-06, "loss": 1.0474, "step": 9793 }, { "epoch": 0.23, "learning_rate": 9.015076137628868e-06, "loss": 1.0208, "step": 9794 }, { "epoch": 0.23, "learning_rate": 9.014852305755944e-06, "loss": 1.0261, "step": 9795 }, { "epoch": 0.23, "learning_rate": 9.014628451231497e-06, "loss": 1.0708, "step": 9796 }, { "epoch": 0.23, "learning_rate": 9.01440457405679e-06, "loss": 0.7563, "step": 9797 }, { "epoch": 0.23, "learning_rate": 9.014180674233084e-06, "loss": 1.0956, "step": 9798 }, { "epoch": 0.23, "learning_rate": 9.013956751761643e-06, "loss": 0.9468, "step": 9799 }, { "epoch": 0.23, "learning_rate": 9.013732806643734e-06, "loss": 1.009, "step": 9800 }, { "epoch": 0.23, "learning_rate": 9.013508838880616e-06, "loss": 0.8562, "step": 9801 }, { "epoch": 0.23, "learning_rate": 9.013284848473554e-06, "loss": 0.882, "step": 9802 }, { "epoch": 0.23, "learning_rate": 9.013060835423811e-06, "loss": 1.0407, "step": 9803 }, { "epoch": 0.23, "learning_rate": 9.012836799732652e-06, "loss": 1.1019, "step": 9804 }, { "epoch": 0.23, "learning_rate": 9.01261274140134e-06, "loss": 1.0245, "step": 9805 }, { "epoch": 0.23, "learning_rate": 9.012388660431143e-06, "loss": 1.0133, "step": 9806 }, { "epoch": 0.23, "learning_rate": 9.01216455682332e-06, "loss": 1.1441, "step": 9807 }, { "epoch": 0.23, "learning_rate": 9.011940430579138e-06, "loss": 1.078, "step": 9808 }, { "epoch": 0.23, "learning_rate": 9.01171628169986e-06, "loss": 0.8274, "step": 9809 }, { "epoch": 0.23, "learning_rate": 9.011492110186752e-06, "loss": 0.8983, "step": 9810 }, { "epoch": 0.23, "learning_rate": 9.011267916041078e-06, "loss": 1.0321, "step": 9811 }, { "epoch": 0.23, "learning_rate": 9.011043699264104e-06, "loss": 0.762, "step": 9812 }, { "epoch": 0.23, "learning_rate": 9.010819459857095e-06, "loss": 1.0433, "step": 9813 }, { "epoch": 0.23, "learning_rate": 9.010595197821315e-06, "loss": 0.9733, "step": 9814 }, { "epoch": 0.23, "learning_rate": 9.010370913158028e-06, "loss": 1.0479, "step": 9815 }, { "epoch": 0.23, "learning_rate": 9.010146605868504e-06, "loss": 0.9923, "step": 9816 }, { "epoch": 0.23, "learning_rate": 9.009922275954003e-06, "loss": 1.1281, "step": 9817 }, { "epoch": 0.23, "learning_rate": 9.009697923415795e-06, "loss": 0.9436, "step": 9818 }, { "epoch": 0.23, "learning_rate": 9.009473548255143e-06, "loss": 1.2579, "step": 9819 }, { "epoch": 0.23, "learning_rate": 9.009249150473315e-06, "loss": 0.9865, "step": 9820 }, { "epoch": 0.23, "learning_rate": 9.009024730071575e-06, "loss": 0.9698, "step": 9821 }, { "epoch": 0.23, "learning_rate": 9.008800287051191e-06, "loss": 0.8597, "step": 9822 }, { "epoch": 0.23, "learning_rate": 9.008575821413428e-06, "loss": 1.1206, "step": 9823 }, { "epoch": 0.23, "learning_rate": 9.008351333159553e-06, "loss": 1.0458, "step": 9824 }, { "epoch": 0.23, "learning_rate": 9.00812682229083e-06, "loss": 1.0821, "step": 9825 }, { "epoch": 0.23, "learning_rate": 9.007902288808532e-06, "loss": 1.0191, "step": 9826 }, { "epoch": 0.23, "learning_rate": 9.00767773271392e-06, "loss": 0.7821, "step": 9827 }, { "epoch": 0.23, "learning_rate": 9.007453154008263e-06, "loss": 1.0438, "step": 9828 }, { "epoch": 0.23, "learning_rate": 9.007228552692829e-06, "loss": 0.984, "step": 9829 }, { "epoch": 0.23, "learning_rate": 9.007003928768882e-06, "loss": 1.1367, "step": 9830 }, { "epoch": 0.23, "learning_rate": 9.006779282237693e-06, "loss": 0.9194, "step": 9831 }, { "epoch": 0.23, "learning_rate": 9.006554613100527e-06, "loss": 0.884, "step": 9832 }, { "epoch": 0.23, "learning_rate": 9.006329921358653e-06, "loss": 1.0961, "step": 9833 }, { "epoch": 0.23, "learning_rate": 9.006105207013338e-06, "loss": 0.8946, "step": 9834 }, { "epoch": 0.23, "learning_rate": 9.00588047006585e-06, "loss": 0.9322, "step": 9835 }, { "epoch": 0.23, "learning_rate": 9.005655710517456e-06, "loss": 0.9049, "step": 9836 }, { "epoch": 0.23, "learning_rate": 9.005430928369426e-06, "loss": 0.9926, "step": 9837 }, { "epoch": 0.23, "learning_rate": 9.005206123623027e-06, "loss": 0.8394, "step": 9838 }, { "epoch": 0.23, "learning_rate": 9.004981296279527e-06, "loss": 1.0121, "step": 9839 }, { "epoch": 0.23, "learning_rate": 9.004756446340195e-06, "loss": 1.2229, "step": 9840 }, { "epoch": 0.23, "learning_rate": 9.004531573806298e-06, "loss": 0.8827, "step": 9841 }, { "epoch": 0.23, "learning_rate": 9.004306678679109e-06, "loss": 0.8624, "step": 9842 }, { "epoch": 0.23, "learning_rate": 9.004081760959892e-06, "loss": 0.9981, "step": 9843 }, { "epoch": 0.23, "learning_rate": 9.00385682064992e-06, "loss": 1.2489, "step": 9844 }, { "epoch": 0.23, "learning_rate": 9.00363185775046e-06, "loss": 1.0388, "step": 9845 }, { "epoch": 0.23, "learning_rate": 9.003406872262781e-06, "loss": 0.6024, "step": 9846 }, { "epoch": 0.23, "learning_rate": 9.003181864188151e-06, "loss": 1.1066, "step": 9847 }, { "epoch": 0.23, "learning_rate": 9.002956833527843e-06, "loss": 0.9519, "step": 9848 }, { "epoch": 0.23, "learning_rate": 9.002731780283125e-06, "loss": 0.8677, "step": 9849 }, { "epoch": 0.23, "learning_rate": 9.002506704455264e-06, "loss": 1.0812, "step": 9850 }, { "epoch": 0.23, "learning_rate": 9.002281606045535e-06, "loss": 1.1044, "step": 9851 }, { "epoch": 0.23, "learning_rate": 9.002056485055206e-06, "loss": 1.1316, "step": 9852 }, { "epoch": 0.23, "learning_rate": 9.001831341485545e-06, "loss": 0.7441, "step": 9853 }, { "epoch": 0.23, "learning_rate": 9.001606175337824e-06, "loss": 1.2256, "step": 9854 }, { "epoch": 0.23, "learning_rate": 9.001380986613313e-06, "loss": 1.2299, "step": 9855 }, { "epoch": 0.23, "learning_rate": 9.001155775313283e-06, "loss": 1.031, "step": 9856 }, { "epoch": 0.23, "learning_rate": 9.000930541439004e-06, "loss": 1.0233, "step": 9857 }, { "epoch": 0.23, "learning_rate": 9.000705284991747e-06, "loss": 1.0397, "step": 9858 }, { "epoch": 0.23, "learning_rate": 9.000480005972783e-06, "loss": 1.1875, "step": 9859 }, { "epoch": 0.23, "learning_rate": 9.000254704383385e-06, "loss": 0.8307, "step": 9860 }, { "epoch": 0.23, "learning_rate": 9.000029380224819e-06, "loss": 1.252, "step": 9861 }, { "epoch": 0.23, "learning_rate": 8.99980403349836e-06, "loss": 0.9156, "step": 9862 }, { "epoch": 0.23, "learning_rate": 8.99957866420528e-06, "loss": 0.8428, "step": 9863 }, { "epoch": 0.23, "learning_rate": 8.999353272346848e-06, "loss": 0.8968, "step": 9864 }, { "epoch": 0.23, "learning_rate": 8.999127857924336e-06, "loss": 0.648, "step": 9865 }, { "epoch": 0.23, "learning_rate": 8.99890242093902e-06, "loss": 1.0393, "step": 9866 }, { "epoch": 0.23, "learning_rate": 8.998676961392165e-06, "loss": 1.084, "step": 9867 }, { "epoch": 0.23, "learning_rate": 8.998451479285048e-06, "loss": 1.3249, "step": 9868 }, { "epoch": 0.23, "learning_rate": 8.99822597461894e-06, "loss": 1.0638, "step": 9869 }, { "epoch": 0.23, "learning_rate": 8.998000447395113e-06, "loss": 1.0783, "step": 9870 }, { "epoch": 0.23, "learning_rate": 8.997774897614839e-06, "loss": 0.9531, "step": 9871 }, { "epoch": 0.23, "learning_rate": 8.99754932527939e-06, "loss": 1.0861, "step": 9872 }, { "epoch": 0.23, "learning_rate": 8.997323730390041e-06, "loss": 0.905, "step": 9873 }, { "epoch": 0.23, "learning_rate": 8.997098112948064e-06, "loss": 1.2574, "step": 9874 }, { "epoch": 0.23, "learning_rate": 8.99687247295473e-06, "loss": 1.0628, "step": 9875 }, { "epoch": 0.23, "learning_rate": 8.996646810411314e-06, "loss": 1.1663, "step": 9876 }, { "epoch": 0.23, "learning_rate": 8.996421125319089e-06, "loss": 0.9524, "step": 9877 }, { "epoch": 0.23, "learning_rate": 8.996195417679327e-06, "loss": 1.0397, "step": 9878 }, { "epoch": 0.23, "learning_rate": 8.995969687493302e-06, "loss": 1.413, "step": 9879 }, { "epoch": 0.23, "learning_rate": 8.99574393476229e-06, "loss": 0.801, "step": 9880 }, { "epoch": 0.23, "learning_rate": 8.995518159487559e-06, "loss": 1.0426, "step": 9881 }, { "epoch": 0.23, "learning_rate": 8.995292361670388e-06, "loss": 0.9616, "step": 9882 }, { "epoch": 0.23, "learning_rate": 8.99506654131205e-06, "loss": 1.0234, "step": 9883 }, { "epoch": 0.23, "learning_rate": 8.994840698413819e-06, "loss": 1.1132, "step": 9884 }, { "epoch": 0.23, "learning_rate": 8.994614832976966e-06, "loss": 1.0065, "step": 9885 }, { "epoch": 0.23, "learning_rate": 8.99438894500277e-06, "loss": 1.1342, "step": 9886 }, { "epoch": 0.23, "learning_rate": 8.994163034492503e-06, "loss": 1.0601, "step": 9887 }, { "epoch": 0.23, "learning_rate": 8.993937101447439e-06, "loss": 1.0122, "step": 9888 }, { "epoch": 0.23, "learning_rate": 8.993711145868853e-06, "loss": 0.8779, "step": 9889 }, { "epoch": 0.23, "learning_rate": 8.99348516775802e-06, "loss": 1.0863, "step": 9890 }, { "epoch": 0.23, "learning_rate": 8.993259167116218e-06, "loss": 0.9546, "step": 9891 }, { "epoch": 0.23, "learning_rate": 8.993033143944717e-06, "loss": 0.9304, "step": 9892 }, { "epoch": 0.23, "learning_rate": 8.992807098244796e-06, "loss": 0.9754, "step": 9893 }, { "epoch": 0.23, "learning_rate": 8.992581030017729e-06, "loss": 0.9323, "step": 9894 }, { "epoch": 0.23, "learning_rate": 8.992354939264789e-06, "loss": 0.9843, "step": 9895 }, { "epoch": 0.23, "learning_rate": 8.992128825987256e-06, "loss": 0.8142, "step": 9896 }, { "epoch": 0.23, "learning_rate": 8.991902690186404e-06, "loss": 0.9896, "step": 9897 }, { "epoch": 0.23, "learning_rate": 8.991676531863507e-06, "loss": 0.8911, "step": 9898 }, { "epoch": 0.23, "learning_rate": 8.991450351019845e-06, "loss": 0.9423, "step": 9899 }, { "epoch": 0.23, "learning_rate": 8.99122414765669e-06, "loss": 0.814, "step": 9900 }, { "epoch": 0.23, "learning_rate": 8.99099792177532e-06, "loss": 1.3301, "step": 9901 }, { "epoch": 0.23, "learning_rate": 8.990771673377011e-06, "loss": 0.8559, "step": 9902 }, { "epoch": 0.23, "learning_rate": 8.99054540246304e-06, "loss": 1.0291, "step": 9903 }, { "epoch": 0.23, "learning_rate": 8.990319109034683e-06, "loss": 1.0348, "step": 9904 }, { "epoch": 0.23, "learning_rate": 8.990092793093217e-06, "loss": 0.9181, "step": 9905 }, { "epoch": 0.23, "learning_rate": 8.989866454639919e-06, "loss": 0.9688, "step": 9906 }, { "epoch": 0.23, "learning_rate": 8.989640093676066e-06, "loss": 0.855, "step": 9907 }, { "epoch": 0.23, "learning_rate": 8.989413710202936e-06, "loss": 1.1478, "step": 9908 }, { "epoch": 0.23, "learning_rate": 8.989187304221803e-06, "loss": 0.8098, "step": 9909 }, { "epoch": 0.23, "learning_rate": 8.988960875733948e-06, "loss": 0.887, "step": 9910 }, { "epoch": 0.23, "learning_rate": 8.988734424740647e-06, "loss": 0.8975, "step": 9911 }, { "epoch": 0.23, "learning_rate": 8.988507951243177e-06, "loss": 1.0359, "step": 9912 }, { "epoch": 0.23, "learning_rate": 8.988281455242817e-06, "loss": 1.0228, "step": 9913 }, { "epoch": 0.23, "learning_rate": 8.988054936740845e-06, "loss": 0.9188, "step": 9914 }, { "epoch": 0.23, "learning_rate": 8.987828395738535e-06, "loss": 1.0903, "step": 9915 }, { "epoch": 0.23, "learning_rate": 8.987601832237173e-06, "loss": 1.0994, "step": 9916 }, { "epoch": 0.23, "learning_rate": 8.98737524623803e-06, "loss": 1.129, "step": 9917 }, { "epoch": 0.23, "learning_rate": 8.987148637742389e-06, "loss": 0.7568, "step": 9918 }, { "epoch": 0.23, "learning_rate": 8.986922006751524e-06, "loss": 0.9198, "step": 9919 }, { "epoch": 0.23, "learning_rate": 8.986695353266718e-06, "loss": 0.9929, "step": 9920 }, { "epoch": 0.23, "learning_rate": 8.986468677289249e-06, "loss": 1.0604, "step": 9921 }, { "epoch": 0.23, "learning_rate": 8.986241978820392e-06, "loss": 1.0059, "step": 9922 }, { "epoch": 0.23, "learning_rate": 8.98601525786143e-06, "loss": 1.0832, "step": 9923 }, { "epoch": 0.23, "learning_rate": 8.985788514413641e-06, "loss": 1.0317, "step": 9924 }, { "epoch": 0.23, "learning_rate": 8.985561748478305e-06, "loss": 0.9906, "step": 9925 }, { "epoch": 0.23, "learning_rate": 8.9853349600567e-06, "loss": 0.889, "step": 9926 }, { "epoch": 0.23, "learning_rate": 8.985108149150106e-06, "loss": 0.9254, "step": 9927 }, { "epoch": 0.23, "learning_rate": 8.984881315759804e-06, "loss": 1.007, "step": 9928 }, { "epoch": 0.23, "learning_rate": 8.984654459887072e-06, "loss": 0.771, "step": 9929 }, { "epoch": 0.23, "learning_rate": 8.984427581533191e-06, "loss": 1.2624, "step": 9930 }, { "epoch": 0.23, "learning_rate": 8.984200680699442e-06, "loss": 0.8579, "step": 9931 }, { "epoch": 0.23, "learning_rate": 8.9839737573871e-06, "loss": 0.8859, "step": 9932 }, { "epoch": 0.23, "learning_rate": 8.983746811597452e-06, "loss": 0.8288, "step": 9933 }, { "epoch": 0.23, "learning_rate": 8.983519843331776e-06, "loss": 1.0048, "step": 9934 }, { "epoch": 0.23, "learning_rate": 8.98329285259135e-06, "loss": 0.8936, "step": 9935 }, { "epoch": 0.23, "learning_rate": 8.983065839377458e-06, "loss": 0.866, "step": 9936 }, { "epoch": 0.23, "learning_rate": 8.982838803691378e-06, "loss": 0.9613, "step": 9937 }, { "epoch": 0.23, "learning_rate": 8.982611745534393e-06, "loss": 1.0876, "step": 9938 }, { "epoch": 0.23, "learning_rate": 8.982384664907784e-06, "loss": 0.9576, "step": 9939 }, { "epoch": 0.23, "learning_rate": 8.98215756181283e-06, "loss": 0.9477, "step": 9940 }, { "epoch": 0.23, "learning_rate": 8.981930436250816e-06, "loss": 0.9179, "step": 9941 }, { "epoch": 0.23, "learning_rate": 8.98170328822302e-06, "loss": 0.9055, "step": 9942 }, { "epoch": 0.23, "learning_rate": 8.981476117730725e-06, "loss": 0.9693, "step": 9943 }, { "epoch": 0.23, "learning_rate": 8.981248924775213e-06, "loss": 0.7931, "step": 9944 }, { "epoch": 0.23, "learning_rate": 8.981021709357765e-06, "loss": 1.0215, "step": 9945 }, { "epoch": 0.23, "learning_rate": 8.980794471479664e-06, "loss": 0.972, "step": 9946 }, { "epoch": 0.23, "learning_rate": 8.980567211142191e-06, "loss": 0.9735, "step": 9947 }, { "epoch": 0.23, "learning_rate": 8.980339928346629e-06, "loss": 0.8692, "step": 9948 }, { "epoch": 0.23, "learning_rate": 8.98011262309426e-06, "loss": 1.0549, "step": 9949 }, { "epoch": 0.23, "learning_rate": 8.979885295386365e-06, "loss": 0.9895, "step": 9950 }, { "epoch": 0.23, "learning_rate": 8.979657945224229e-06, "loss": 1.0004, "step": 9951 }, { "epoch": 0.23, "learning_rate": 8.979430572609132e-06, "loss": 0.8759, "step": 9952 }, { "epoch": 0.23, "learning_rate": 8.97920317754236e-06, "loss": 0.9597, "step": 9953 }, { "epoch": 0.23, "learning_rate": 8.978975760025194e-06, "loss": 1.028, "step": 9954 }, { "epoch": 0.23, "learning_rate": 8.978748320058916e-06, "loss": 1.1716, "step": 9955 }, { "epoch": 0.23, "learning_rate": 8.978520857644812e-06, "loss": 1.1849, "step": 9956 }, { "epoch": 0.23, "learning_rate": 8.978293372784165e-06, "loss": 1.1113, "step": 9957 }, { "epoch": 0.23, "learning_rate": 8.978065865478256e-06, "loss": 1.1247, "step": 9958 }, { "epoch": 0.23, "learning_rate": 8.977838335728371e-06, "loss": 0.8714, "step": 9959 }, { "epoch": 0.23, "learning_rate": 8.97761078353579e-06, "loss": 0.9726, "step": 9960 }, { "epoch": 0.23, "learning_rate": 8.977383208901803e-06, "loss": 0.7226, "step": 9961 }, { "epoch": 0.23, "learning_rate": 8.977155611827688e-06, "loss": 0.9556, "step": 9962 }, { "epoch": 0.23, "learning_rate": 8.976927992314733e-06, "loss": 1.0604, "step": 9963 }, { "epoch": 0.23, "learning_rate": 8.97670035036422e-06, "loss": 1.0633, "step": 9964 }, { "epoch": 0.23, "learning_rate": 8.976472685977433e-06, "loss": 0.9851, "step": 9965 }, { "epoch": 0.23, "learning_rate": 8.97624499915566e-06, "loss": 0.9177, "step": 9966 }, { "epoch": 0.23, "learning_rate": 8.976017289900182e-06, "loss": 1.0765, "step": 9967 }, { "epoch": 0.23, "learning_rate": 8.975789558212284e-06, "loss": 0.9578, "step": 9968 }, { "epoch": 0.23, "learning_rate": 8.975561804093253e-06, "loss": 0.9711, "step": 9969 }, { "epoch": 0.23, "learning_rate": 8.975334027544373e-06, "loss": 0.8966, "step": 9970 }, { "epoch": 0.23, "learning_rate": 8.975106228566928e-06, "loss": 1.1116, "step": 9971 }, { "epoch": 0.23, "learning_rate": 8.974878407162205e-06, "loss": 0.8769, "step": 9972 }, { "epoch": 0.23, "learning_rate": 8.974650563331486e-06, "loss": 0.8784, "step": 9973 }, { "epoch": 0.23, "learning_rate": 8.974422697076062e-06, "loss": 0.8356, "step": 9974 }, { "epoch": 0.23, "learning_rate": 8.974194808397215e-06, "loss": 0.6997, "step": 9975 }, { "epoch": 0.23, "learning_rate": 8.973966897296229e-06, "loss": 1.0064, "step": 9976 }, { "epoch": 0.23, "learning_rate": 8.973738963774393e-06, "loss": 1.2357, "step": 9977 }, { "epoch": 0.23, "learning_rate": 8.973511007832993e-06, "loss": 1.0062, "step": 9978 }, { "epoch": 0.23, "learning_rate": 8.973283029473314e-06, "loss": 0.9236, "step": 9979 }, { "epoch": 0.23, "learning_rate": 8.973055028696642e-06, "loss": 0.8727, "step": 9980 }, { "epoch": 0.23, "learning_rate": 8.972827005504263e-06, "loss": 0.8687, "step": 9981 }, { "epoch": 0.23, "learning_rate": 8.972598959897466e-06, "loss": 1.2665, "step": 9982 }, { "epoch": 0.23, "learning_rate": 8.972370891877535e-06, "loss": 0.8864, "step": 9983 }, { "epoch": 0.23, "learning_rate": 8.972142801445758e-06, "loss": 1.1594, "step": 9984 }, { "epoch": 0.23, "learning_rate": 8.97191468860342e-06, "loss": 0.7764, "step": 9985 }, { "epoch": 0.23, "learning_rate": 8.97168655335181e-06, "loss": 0.86, "step": 9986 }, { "epoch": 0.23, "learning_rate": 8.971458395692216e-06, "loss": 1.1051, "step": 9987 }, { "epoch": 0.23, "learning_rate": 8.971230215625923e-06, "loss": 0.8168, "step": 9988 }, { "epoch": 0.23, "learning_rate": 8.97100201315422e-06, "loss": 1.0839, "step": 9989 }, { "epoch": 0.23, "learning_rate": 8.970773788278393e-06, "loss": 0.9374, "step": 9990 }, { "epoch": 0.23, "learning_rate": 8.97054554099973e-06, "loss": 0.8699, "step": 9991 }, { "epoch": 0.23, "learning_rate": 8.97031727131952e-06, "loss": 1.0097, "step": 9992 }, { "epoch": 0.23, "learning_rate": 8.970088979239049e-06, "loss": 1.0783, "step": 9993 }, { "epoch": 0.23, "learning_rate": 8.969860664759606e-06, "loss": 0.9136, "step": 9994 }, { "epoch": 0.23, "learning_rate": 8.96963232788248e-06, "loss": 0.9129, "step": 9995 }, { "epoch": 0.23, "learning_rate": 8.969403968608959e-06, "loss": 0.8005, "step": 9996 }, { "epoch": 0.23, "learning_rate": 8.96917558694033e-06, "loss": 1.0415, "step": 9997 }, { "epoch": 0.23, "learning_rate": 8.968947182877881e-06, "loss": 1.05, "step": 9998 }, { "epoch": 0.23, "learning_rate": 8.968718756422904e-06, "loss": 0.8638, "step": 9999 }, { "epoch": 0.23, "learning_rate": 8.968490307576686e-06, "loss": 1.1782, "step": 10000 }, { "epoch": 0.23, "learning_rate": 8.968261836340513e-06, "loss": 0.9507, "step": 10001 }, { "epoch": 0.23, "learning_rate": 8.968033342715678e-06, "loss": 1.3601, "step": 10002 }, { "epoch": 0.23, "learning_rate": 8.96780482670347e-06, "loss": 1.2048, "step": 10003 }, { "epoch": 0.23, "learning_rate": 8.967576288305175e-06, "loss": 1.1579, "step": 10004 }, { "epoch": 0.23, "learning_rate": 8.967347727522087e-06, "loss": 1.1066, "step": 10005 }, { "epoch": 0.23, "learning_rate": 8.967119144355491e-06, "loss": 1.0593, "step": 10006 }, { "epoch": 0.23, "learning_rate": 8.96689053880668e-06, "loss": 0.967, "step": 10007 }, { "epoch": 0.23, "learning_rate": 8.966661910876941e-06, "loss": 1.0735, "step": 10008 }, { "epoch": 0.23, "learning_rate": 8.966433260567566e-06, "loss": 0.7284, "step": 10009 }, { "epoch": 0.23, "learning_rate": 8.966204587879842e-06, "loss": 0.8363, "step": 10010 }, { "epoch": 0.23, "learning_rate": 8.965975892815066e-06, "loss": 0.9902, "step": 10011 }, { "epoch": 0.23, "learning_rate": 8.965747175374523e-06, "loss": 0.8826, "step": 10012 }, { "epoch": 0.23, "learning_rate": 8.965518435559502e-06, "loss": 1.2007, "step": 10013 }, { "epoch": 0.23, "learning_rate": 8.965289673371297e-06, "loss": 1.168, "step": 10014 }, { "epoch": 0.23, "learning_rate": 8.965060888811196e-06, "loss": 1.0076, "step": 10015 }, { "epoch": 0.23, "learning_rate": 8.964832081880492e-06, "loss": 1.1244, "step": 10016 }, { "epoch": 0.23, "learning_rate": 8.964603252580475e-06, "loss": 0.7443, "step": 10017 }, { "epoch": 0.23, "learning_rate": 8.964374400912436e-06, "loss": 0.7865, "step": 10018 }, { "epoch": 0.23, "learning_rate": 8.964145526877666e-06, "loss": 1.3098, "step": 10019 }, { "epoch": 0.23, "learning_rate": 8.963916630477457e-06, "loss": 0.9248, "step": 10020 }, { "epoch": 0.23, "learning_rate": 8.963687711713101e-06, "loss": 1.0839, "step": 10021 }, { "epoch": 0.23, "learning_rate": 8.963458770585886e-06, "loss": 1.1535, "step": 10022 }, { "epoch": 0.23, "learning_rate": 8.96322980709711e-06, "loss": 1.1111, "step": 10023 }, { "epoch": 0.23, "learning_rate": 8.963000821248059e-06, "loss": 1.0529, "step": 10024 }, { "epoch": 0.23, "learning_rate": 8.962771813040025e-06, "loss": 0.7379, "step": 10025 }, { "epoch": 0.23, "learning_rate": 8.962542782474304e-06, "loss": 1.0553, "step": 10026 }, { "epoch": 0.23, "learning_rate": 8.962313729552186e-06, "loss": 1.1526, "step": 10027 }, { "epoch": 0.23, "learning_rate": 8.962084654274964e-06, "loss": 0.8301, "step": 10028 }, { "epoch": 0.23, "learning_rate": 8.961855556643929e-06, "loss": 1.135, "step": 10029 }, { "epoch": 0.23, "learning_rate": 8.961626436660374e-06, "loss": 1.1783, "step": 10030 }, { "epoch": 0.23, "learning_rate": 8.961397294325593e-06, "loss": 0.6975, "step": 10031 }, { "epoch": 0.23, "learning_rate": 8.961168129640878e-06, "loss": 0.9409, "step": 10032 }, { "epoch": 0.23, "learning_rate": 8.960938942607522e-06, "loss": 1.2849, "step": 10033 }, { "epoch": 0.23, "learning_rate": 8.960709733226817e-06, "loss": 0.768, "step": 10034 }, { "epoch": 0.23, "learning_rate": 8.960480501500058e-06, "loss": 1.0489, "step": 10035 }, { "epoch": 0.23, "learning_rate": 8.960251247428535e-06, "loss": 1.0227, "step": 10036 }, { "epoch": 0.23, "learning_rate": 8.960021971013546e-06, "loss": 0.9727, "step": 10037 }, { "epoch": 0.23, "learning_rate": 8.959792672256382e-06, "loss": 0.9414, "step": 10038 }, { "epoch": 0.23, "learning_rate": 8.959563351158339e-06, "loss": 0.8359, "step": 10039 }, { "epoch": 0.23, "learning_rate": 8.959334007720706e-06, "loss": 0.8417, "step": 10040 }, { "epoch": 0.23, "learning_rate": 8.959104641944781e-06, "loss": 1.0334, "step": 10041 }, { "epoch": 0.23, "learning_rate": 8.958875253831857e-06, "loss": 1.0004, "step": 10042 }, { "epoch": 0.23, "learning_rate": 8.958645843383229e-06, "loss": 0.8696, "step": 10043 }, { "epoch": 0.23, "learning_rate": 8.958416410600188e-06, "loss": 1.228, "step": 10044 }, { "epoch": 0.23, "learning_rate": 8.958186955484034e-06, "loss": 1.0035, "step": 10045 }, { "epoch": 0.23, "learning_rate": 8.957957478036056e-06, "loss": 0.8439, "step": 10046 }, { "epoch": 0.23, "learning_rate": 8.957727978257553e-06, "loss": 1.0523, "step": 10047 }, { "epoch": 0.23, "learning_rate": 8.957498456149815e-06, "loss": 1.0192, "step": 10048 }, { "epoch": 0.23, "learning_rate": 8.957268911714144e-06, "loss": 1.0327, "step": 10049 }, { "epoch": 0.23, "learning_rate": 8.957039344951827e-06, "loss": 0.9437, "step": 10050 }, { "epoch": 0.23, "learning_rate": 8.956809755864164e-06, "loss": 1.0529, "step": 10051 }, { "epoch": 0.23, "learning_rate": 8.956580144452452e-06, "loss": 0.7929, "step": 10052 }, { "epoch": 0.23, "learning_rate": 8.956350510717981e-06, "loss": 1.1331, "step": 10053 }, { "epoch": 0.23, "learning_rate": 8.956120854662051e-06, "loss": 1.0358, "step": 10054 }, { "epoch": 0.23, "learning_rate": 8.955891176285956e-06, "loss": 1.3173, "step": 10055 }, { "epoch": 0.23, "learning_rate": 8.955661475590993e-06, "loss": 1.0959, "step": 10056 }, { "epoch": 0.23, "learning_rate": 8.955431752578456e-06, "loss": 1.1911, "step": 10057 }, { "epoch": 0.23, "learning_rate": 8.955202007249642e-06, "loss": 0.78, "step": 10058 }, { "epoch": 0.23, "learning_rate": 8.954972239605848e-06, "loss": 1.0029, "step": 10059 }, { "epoch": 0.23, "learning_rate": 8.954742449648369e-06, "loss": 0.8874, "step": 10060 }, { "epoch": 0.23, "learning_rate": 8.954512637378503e-06, "loss": 1.231, "step": 10061 }, { "epoch": 0.23, "learning_rate": 8.954282802797545e-06, "loss": 1.1159, "step": 10062 }, { "epoch": 0.23, "learning_rate": 8.954052945906791e-06, "loss": 0.8576, "step": 10063 }, { "epoch": 0.23, "learning_rate": 8.953823066707541e-06, "loss": 0.8133, "step": 10064 }, { "epoch": 0.23, "learning_rate": 8.95359316520109e-06, "loss": 1.034, "step": 10065 }, { "epoch": 0.23, "learning_rate": 8.953363241388735e-06, "loss": 0.8083, "step": 10066 }, { "epoch": 0.23, "learning_rate": 8.953133295271775e-06, "loss": 0.8469, "step": 10067 }, { "epoch": 0.23, "learning_rate": 8.952903326851503e-06, "loss": 1.2549, "step": 10068 }, { "epoch": 0.23, "learning_rate": 8.95267333612922e-06, "loss": 1.0343, "step": 10069 }, { "epoch": 0.23, "learning_rate": 8.952443323106225e-06, "loss": 1.0617, "step": 10070 }, { "epoch": 0.23, "learning_rate": 8.952213287783814e-06, "loss": 0.9529, "step": 10071 }, { "epoch": 0.23, "learning_rate": 8.951983230163282e-06, "loss": 0.805, "step": 10072 }, { "epoch": 0.23, "learning_rate": 8.95175315024593e-06, "loss": 0.9524, "step": 10073 }, { "epoch": 0.23, "learning_rate": 8.951523048033055e-06, "loss": 1.0679, "step": 10074 }, { "epoch": 0.23, "learning_rate": 8.951292923525957e-06, "loss": 1.0482, "step": 10075 }, { "epoch": 0.23, "learning_rate": 8.951062776725932e-06, "loss": 0.929, "step": 10076 }, { "epoch": 0.23, "learning_rate": 8.95083260763428e-06, "loss": 1.1997, "step": 10077 }, { "epoch": 0.23, "learning_rate": 8.9506024162523e-06, "loss": 0.9594, "step": 10078 }, { "epoch": 0.23, "learning_rate": 8.950372202581289e-06, "loss": 1.2714, "step": 10079 }, { "epoch": 0.23, "learning_rate": 8.950141966622547e-06, "loss": 1.1102, "step": 10080 }, { "epoch": 0.23, "learning_rate": 8.949911708377373e-06, "loss": 0.8583, "step": 10081 }, { "epoch": 0.23, "learning_rate": 8.949681427847065e-06, "loss": 0.9996, "step": 10082 }, { "epoch": 0.23, "learning_rate": 8.949451125032923e-06, "loss": 1.1932, "step": 10083 }, { "epoch": 0.23, "learning_rate": 8.949220799936247e-06, "loss": 1.0815, "step": 10084 }, { "epoch": 0.23, "learning_rate": 8.948990452558336e-06, "loss": 0.946, "step": 10085 }, { "epoch": 0.23, "learning_rate": 8.948760082900489e-06, "loss": 1.1877, "step": 10086 }, { "epoch": 0.23, "learning_rate": 8.948529690964008e-06, "loss": 0.8773, "step": 10087 }, { "epoch": 0.23, "learning_rate": 8.948299276750188e-06, "loss": 1.1469, "step": 10088 }, { "epoch": 0.23, "learning_rate": 8.948068840260333e-06, "loss": 0.9037, "step": 10089 }, { "epoch": 0.23, "learning_rate": 8.947838381495743e-06, "loss": 1.4662, "step": 10090 }, { "epoch": 0.23, "learning_rate": 8.947607900457717e-06, "loss": 1.1031, "step": 10091 }, { "epoch": 0.23, "learning_rate": 8.947377397147556e-06, "loss": 1.0016, "step": 10092 }, { "epoch": 0.23, "learning_rate": 8.94714687156656e-06, "loss": 1.0348, "step": 10093 }, { "epoch": 0.23, "learning_rate": 8.94691632371603e-06, "loss": 0.7787, "step": 10094 }, { "epoch": 0.23, "learning_rate": 8.946685753597266e-06, "loss": 1.0973, "step": 10095 }, { "epoch": 0.23, "learning_rate": 8.94645516121157e-06, "loss": 0.6896, "step": 10096 }, { "epoch": 0.23, "learning_rate": 8.946224546560242e-06, "loss": 1.0081, "step": 10097 }, { "epoch": 0.23, "learning_rate": 8.945993909644586e-06, "loss": 1.0457, "step": 10098 }, { "epoch": 0.23, "learning_rate": 8.945763250465898e-06, "loss": 0.7888, "step": 10099 }, { "epoch": 0.23, "learning_rate": 8.94553256902548e-06, "loss": 1.0481, "step": 10100 }, { "epoch": 0.23, "learning_rate": 8.94530186532464e-06, "loss": 1.0738, "step": 10101 }, { "epoch": 0.23, "learning_rate": 8.945071139364675e-06, "loss": 0.8883, "step": 10102 }, { "epoch": 0.23, "learning_rate": 8.944840391146885e-06, "loss": 0.9894, "step": 10103 }, { "epoch": 0.23, "learning_rate": 8.944609620672573e-06, "loss": 0.8175, "step": 10104 }, { "epoch": 0.23, "learning_rate": 8.944378827943044e-06, "loss": 1.0261, "step": 10105 }, { "epoch": 0.23, "learning_rate": 8.944148012959597e-06, "loss": 0.9712, "step": 10106 }, { "epoch": 0.23, "learning_rate": 8.943917175723535e-06, "loss": 1.0412, "step": 10107 }, { "epoch": 0.23, "learning_rate": 8.943686316236162e-06, "loss": 1.2194, "step": 10108 }, { "epoch": 0.23, "learning_rate": 8.943455434498778e-06, "loss": 1.2625, "step": 10109 }, { "epoch": 0.23, "learning_rate": 8.943224530512686e-06, "loss": 1.0843, "step": 10110 }, { "epoch": 0.23, "learning_rate": 8.942993604279191e-06, "loss": 0.8711, "step": 10111 }, { "epoch": 0.23, "learning_rate": 8.942762655799592e-06, "loss": 1.2145, "step": 10112 }, { "epoch": 0.23, "learning_rate": 8.942531685075197e-06, "loss": 0.9823, "step": 10113 }, { "epoch": 0.23, "learning_rate": 8.942300692107303e-06, "loss": 1.0389, "step": 10114 }, { "epoch": 0.23, "learning_rate": 8.94206967689722e-06, "loss": 1.0152, "step": 10115 }, { "epoch": 0.23, "learning_rate": 8.941838639446248e-06, "loss": 1.024, "step": 10116 }, { "epoch": 0.23, "learning_rate": 8.941607579755689e-06, "loss": 1.2438, "step": 10117 }, { "epoch": 0.23, "learning_rate": 8.941376497826848e-06, "loss": 1.0474, "step": 10118 }, { "epoch": 0.23, "learning_rate": 8.94114539366103e-06, "loss": 0.9626, "step": 10119 }, { "epoch": 0.23, "learning_rate": 8.940914267259538e-06, "loss": 0.973, "step": 10120 }, { "epoch": 0.23, "learning_rate": 8.940683118623674e-06, "loss": 0.8874, "step": 10121 }, { "epoch": 0.23, "learning_rate": 8.940451947754744e-06, "loss": 1.1211, "step": 10122 }, { "epoch": 0.23, "learning_rate": 8.940220754654053e-06, "loss": 0.7918, "step": 10123 }, { "epoch": 0.23, "learning_rate": 8.939989539322904e-06, "loss": 0.9225, "step": 10124 }, { "epoch": 0.23, "learning_rate": 8.939758301762603e-06, "loss": 1.2273, "step": 10125 }, { "epoch": 0.23, "learning_rate": 8.939527041974452e-06, "loss": 0.706, "step": 10126 }, { "epoch": 0.23, "learning_rate": 8.939295759959758e-06, "loss": 1.1773, "step": 10127 }, { "epoch": 0.23, "learning_rate": 8.939064455719826e-06, "loss": 1.0896, "step": 10128 }, { "epoch": 0.23, "learning_rate": 8.938833129255962e-06, "loss": 0.9002, "step": 10129 }, { "epoch": 0.23, "learning_rate": 8.938601780569467e-06, "loss": 0.944, "step": 10130 }, { "epoch": 0.23, "learning_rate": 8.938370409661647e-06, "loss": 0.9863, "step": 10131 }, { "epoch": 0.23, "learning_rate": 8.938139016533812e-06, "loss": 0.8219, "step": 10132 }, { "epoch": 0.24, "learning_rate": 8.937907601187264e-06, "loss": 0.9437, "step": 10133 }, { "epoch": 0.24, "learning_rate": 8.93767616362331e-06, "loss": 1.2252, "step": 10134 }, { "epoch": 0.24, "learning_rate": 8.937444703843253e-06, "loss": 0.9259, "step": 10135 }, { "epoch": 0.24, "learning_rate": 8.9372132218484e-06, "loss": 0.7422, "step": 10136 }, { "epoch": 0.24, "learning_rate": 8.936981717640061e-06, "loss": 1.0056, "step": 10137 }, { "epoch": 0.24, "learning_rate": 8.936750191219537e-06, "loss": 1.0065, "step": 10138 }, { "epoch": 0.24, "learning_rate": 8.936518642588136e-06, "loss": 0.8774, "step": 10139 }, { "epoch": 0.24, "learning_rate": 8.936287071747166e-06, "loss": 0.9558, "step": 10140 }, { "epoch": 0.24, "learning_rate": 8.93605547869793e-06, "loss": 0.9122, "step": 10141 }, { "epoch": 0.24, "learning_rate": 8.935823863441739e-06, "loss": 0.9347, "step": 10142 }, { "epoch": 0.24, "learning_rate": 8.935592225979896e-06, "loss": 0.9255, "step": 10143 }, { "epoch": 0.24, "learning_rate": 8.93536056631371e-06, "loss": 0.7554, "step": 10144 }, { "epoch": 0.24, "learning_rate": 8.935128884444487e-06, "loss": 1.0042, "step": 10145 }, { "epoch": 0.24, "learning_rate": 8.934897180373533e-06, "loss": 0.9922, "step": 10146 }, { "epoch": 0.24, "learning_rate": 8.93466545410216e-06, "loss": 1.0946, "step": 10147 }, { "epoch": 0.24, "learning_rate": 8.93443370563167e-06, "loss": 0.8901, "step": 10148 }, { "epoch": 0.24, "learning_rate": 8.934201934963374e-06, "loss": 0.738, "step": 10149 }, { "epoch": 0.24, "learning_rate": 8.933970142098577e-06, "loss": 1.054, "step": 10150 }, { "epoch": 0.24, "learning_rate": 8.933738327038589e-06, "loss": 0.9019, "step": 10151 }, { "epoch": 0.24, "learning_rate": 8.933506489784716e-06, "loss": 0.9908, "step": 10152 }, { "epoch": 0.24, "learning_rate": 8.933274630338267e-06, "loss": 1.1708, "step": 10153 }, { "epoch": 0.24, "learning_rate": 8.93304274870055e-06, "loss": 1.1646, "step": 10154 }, { "epoch": 0.24, "learning_rate": 8.932810844872875e-06, "loss": 1.0924, "step": 10155 }, { "epoch": 0.24, "learning_rate": 8.932578918856547e-06, "loss": 1.0145, "step": 10156 }, { "epoch": 0.24, "learning_rate": 8.932346970652876e-06, "loss": 1.0217, "step": 10157 }, { "epoch": 0.24, "learning_rate": 8.932115000263171e-06, "loss": 1.0272, "step": 10158 }, { "epoch": 0.24, "learning_rate": 8.931883007688742e-06, "loss": 1.0286, "step": 10159 }, { "epoch": 0.24, "learning_rate": 8.931650992930896e-06, "loss": 0.7457, "step": 10160 }, { "epoch": 0.24, "learning_rate": 8.931418955990942e-06, "loss": 0.9958, "step": 10161 }, { "epoch": 0.24, "learning_rate": 8.93118689687019e-06, "loss": 1.1921, "step": 10162 }, { "epoch": 0.24, "learning_rate": 8.93095481556995e-06, "loss": 1.0691, "step": 10163 }, { "epoch": 0.24, "learning_rate": 8.930722712091528e-06, "loss": 0.8793, "step": 10164 }, { "epoch": 0.24, "learning_rate": 8.930490586436239e-06, "loss": 0.9299, "step": 10165 }, { "epoch": 0.24, "learning_rate": 8.930258438605386e-06, "loss": 1.123, "step": 10166 }, { "epoch": 0.24, "learning_rate": 8.930026268600284e-06, "loss": 0.9224, "step": 10167 }, { "epoch": 0.24, "learning_rate": 8.92979407642224e-06, "loss": 1.0319, "step": 10168 }, { "epoch": 0.24, "learning_rate": 8.929561862072566e-06, "loss": 1.0445, "step": 10169 }, { "epoch": 0.24, "learning_rate": 8.929329625552572e-06, "loss": 1.0844, "step": 10170 }, { "epoch": 0.24, "learning_rate": 8.929097366863567e-06, "loss": 0.8787, "step": 10171 }, { "epoch": 0.24, "learning_rate": 8.928865086006861e-06, "loss": 0.858, "step": 10172 }, { "epoch": 0.24, "learning_rate": 8.928632782983765e-06, "loss": 1.1091, "step": 10173 }, { "epoch": 0.24, "learning_rate": 8.928400457795591e-06, "loss": 0.8987, "step": 10174 }, { "epoch": 0.24, "learning_rate": 8.92816811044365e-06, "loss": 0.9602, "step": 10175 }, { "epoch": 0.24, "learning_rate": 8.92793574092925e-06, "loss": 0.9693, "step": 10176 }, { "epoch": 0.24, "learning_rate": 8.927703349253704e-06, "loss": 0.9514, "step": 10177 }, { "epoch": 0.24, "learning_rate": 8.927470935418325e-06, "loss": 0.7904, "step": 10178 }, { "epoch": 0.24, "learning_rate": 8.92723849942442e-06, "loss": 0.9456, "step": 10179 }, { "epoch": 0.24, "learning_rate": 8.927006041273302e-06, "loss": 1.0021, "step": 10180 }, { "epoch": 0.24, "learning_rate": 8.926773560966285e-06, "loss": 1.1719, "step": 10181 }, { "epoch": 0.24, "learning_rate": 8.926541058504678e-06, "loss": 1.4647, "step": 10182 }, { "epoch": 0.24, "learning_rate": 8.926308533889794e-06, "loss": 1.3145, "step": 10183 }, { "epoch": 0.24, "learning_rate": 8.926075987122941e-06, "loss": 0.9053, "step": 10184 }, { "epoch": 0.24, "learning_rate": 8.925843418205438e-06, "loss": 0.9266, "step": 10185 }, { "epoch": 0.24, "learning_rate": 8.925610827138592e-06, "loss": 0.9783, "step": 10186 }, { "epoch": 0.24, "learning_rate": 8.925378213923716e-06, "loss": 1.005, "step": 10187 }, { "epoch": 0.24, "learning_rate": 8.925145578562126e-06, "loss": 1.049, "step": 10188 }, { "epoch": 0.24, "learning_rate": 8.924912921055129e-06, "loss": 1.2259, "step": 10189 }, { "epoch": 0.24, "learning_rate": 8.92468024140404e-06, "loss": 0.7887, "step": 10190 }, { "epoch": 0.24, "learning_rate": 8.924447539610173e-06, "loss": 0.9169, "step": 10191 }, { "epoch": 0.24, "learning_rate": 8.92421481567484e-06, "loss": 1.3744, "step": 10192 }, { "epoch": 0.24, "learning_rate": 8.923982069599354e-06, "loss": 0.9919, "step": 10193 }, { "epoch": 0.24, "learning_rate": 8.923749301385029e-06, "loss": 0.8788, "step": 10194 }, { "epoch": 0.24, "learning_rate": 8.923516511033177e-06, "loss": 1.2593, "step": 10195 }, { "epoch": 0.24, "learning_rate": 8.92328369854511e-06, "loss": 0.8147, "step": 10196 }, { "epoch": 0.24, "learning_rate": 8.923050863922145e-06, "loss": 1.2111, "step": 10197 }, { "epoch": 0.24, "learning_rate": 8.922818007165592e-06, "loss": 1.0212, "step": 10198 }, { "epoch": 0.24, "learning_rate": 8.922585128276769e-06, "loss": 0.781, "step": 10199 }, { "epoch": 0.24, "learning_rate": 8.922352227256985e-06, "loss": 0.8311, "step": 10200 }, { "epoch": 0.24, "learning_rate": 8.922119304107556e-06, "loss": 0.995, "step": 10201 }, { "epoch": 0.24, "learning_rate": 8.9218863588298e-06, "loss": 1.0205, "step": 10202 }, { "epoch": 0.24, "learning_rate": 8.921653391425027e-06, "loss": 0.9499, "step": 10203 }, { "epoch": 0.24, "learning_rate": 8.921420401894552e-06, "loss": 0.7837, "step": 10204 }, { "epoch": 0.24, "learning_rate": 8.92118739023969e-06, "loss": 1.074, "step": 10205 }, { "epoch": 0.24, "learning_rate": 8.920954356461755e-06, "loss": 0.9061, "step": 10206 }, { "epoch": 0.24, "learning_rate": 8.92072130056206e-06, "loss": 0.6057, "step": 10207 }, { "epoch": 0.24, "learning_rate": 8.920488222541926e-06, "loss": 1.0489, "step": 10208 }, { "epoch": 0.24, "learning_rate": 8.920255122402661e-06, "loss": 1.0468, "step": 10209 }, { "epoch": 0.24, "learning_rate": 8.920022000145586e-06, "loss": 0.7586, "step": 10210 }, { "epoch": 0.24, "learning_rate": 8.919788855772011e-06, "loss": 0.924, "step": 10211 }, { "epoch": 0.24, "learning_rate": 8.919555689283256e-06, "loss": 0.8907, "step": 10212 }, { "epoch": 0.24, "learning_rate": 8.919322500680634e-06, "loss": 0.7901, "step": 10213 }, { "epoch": 0.24, "learning_rate": 8.91908928996546e-06, "loss": 1.2254, "step": 10214 }, { "epoch": 0.24, "learning_rate": 8.918856057139052e-06, "loss": 1.1222, "step": 10215 }, { "epoch": 0.24, "learning_rate": 8.918622802202724e-06, "loss": 0.9894, "step": 10216 }, { "epoch": 0.24, "learning_rate": 8.918389525157792e-06, "loss": 1.0152, "step": 10217 }, { "epoch": 0.24, "learning_rate": 8.918156226005575e-06, "loss": 1.1617, "step": 10218 }, { "epoch": 0.24, "learning_rate": 8.917922904747385e-06, "loss": 1.2, "step": 10219 }, { "epoch": 0.24, "learning_rate": 8.917689561384541e-06, "loss": 0.8344, "step": 10220 }, { "epoch": 0.24, "learning_rate": 8.917456195918358e-06, "loss": 0.8431, "step": 10221 }, { "epoch": 0.24, "learning_rate": 8.917222808350155e-06, "loss": 1.275, "step": 10222 }, { "epoch": 0.24, "learning_rate": 8.916989398681248e-06, "loss": 1.008, "step": 10223 }, { "epoch": 0.24, "learning_rate": 8.916755966912952e-06, "loss": 1.0059, "step": 10224 }, { "epoch": 0.24, "learning_rate": 8.916522513046586e-06, "loss": 0.7251, "step": 10225 }, { "epoch": 0.24, "learning_rate": 8.916289037083466e-06, "loss": 0.8956, "step": 10226 }, { "epoch": 0.24, "learning_rate": 8.91605553902491e-06, "loss": 1.0138, "step": 10227 }, { "epoch": 0.24, "learning_rate": 8.915822018872233e-06, "loss": 1.1145, "step": 10228 }, { "epoch": 0.24, "learning_rate": 8.915588476626758e-06, "loss": 0.897, "step": 10229 }, { "epoch": 0.24, "learning_rate": 8.915354912289797e-06, "loss": 0.9362, "step": 10230 }, { "epoch": 0.24, "learning_rate": 8.91512132586267e-06, "loss": 1.1019, "step": 10231 }, { "epoch": 0.24, "learning_rate": 8.914887717346693e-06, "loss": 1.032, "step": 10232 }, { "epoch": 0.24, "learning_rate": 8.91465408674319e-06, "loss": 0.9871, "step": 10233 }, { "epoch": 0.24, "learning_rate": 8.914420434053472e-06, "loss": 1.038, "step": 10234 }, { "epoch": 0.24, "learning_rate": 8.914186759278862e-06, "loss": 0.6546, "step": 10235 }, { "epoch": 0.24, "learning_rate": 8.913953062420675e-06, "loss": 1.0995, "step": 10236 }, { "epoch": 0.24, "learning_rate": 8.913719343480232e-06, "loss": 1.181, "step": 10237 }, { "epoch": 0.24, "learning_rate": 8.913485602458849e-06, "loss": 0.8425, "step": 10238 }, { "epoch": 0.24, "learning_rate": 8.913251839357849e-06, "loss": 1.1813, "step": 10239 }, { "epoch": 0.24, "learning_rate": 8.913018054178547e-06, "loss": 0.9315, "step": 10240 }, { "epoch": 0.24, "learning_rate": 8.91278424692226e-06, "loss": 1.2546, "step": 10241 }, { "epoch": 0.24, "learning_rate": 8.912550417590316e-06, "loss": 0.9802, "step": 10242 }, { "epoch": 0.24, "learning_rate": 8.912316566184027e-06, "loss": 1.0466, "step": 10243 }, { "epoch": 0.24, "learning_rate": 8.912082692704713e-06, "loss": 1.0091, "step": 10244 }, { "epoch": 0.24, "learning_rate": 8.911848797153696e-06, "loss": 0.7869, "step": 10245 }, { "epoch": 0.24, "learning_rate": 8.911614879532291e-06, "loss": 0.9867, "step": 10246 }, { "epoch": 0.24, "learning_rate": 8.911380939841823e-06, "loss": 1.0477, "step": 10247 }, { "epoch": 0.24, "learning_rate": 8.91114697808361e-06, "loss": 1.1367, "step": 10248 }, { "epoch": 0.24, "learning_rate": 8.910912994258972e-06, "loss": 1.0018, "step": 10249 }, { "epoch": 0.24, "learning_rate": 8.910678988369228e-06, "loss": 1.129, "step": 10250 }, { "epoch": 0.24, "learning_rate": 8.9104449604157e-06, "loss": 1.1643, "step": 10251 }, { "epoch": 0.24, "learning_rate": 8.910210910399706e-06, "loss": 0.8879, "step": 10252 }, { "epoch": 0.24, "learning_rate": 8.90997683832257e-06, "loss": 1.0389, "step": 10253 }, { "epoch": 0.24, "learning_rate": 8.909742744185609e-06, "loss": 0.7728, "step": 10254 }, { "epoch": 0.24, "learning_rate": 8.909508627990146e-06, "loss": 0.9962, "step": 10255 }, { "epoch": 0.24, "learning_rate": 8.909274489737503e-06, "loss": 1.1461, "step": 10256 }, { "epoch": 0.24, "learning_rate": 8.909040329428997e-06, "loss": 0.8436, "step": 10257 }, { "epoch": 0.24, "learning_rate": 8.908806147065951e-06, "loss": 0.7906, "step": 10258 }, { "epoch": 0.24, "learning_rate": 8.90857194264969e-06, "loss": 0.9613, "step": 10259 }, { "epoch": 0.24, "learning_rate": 8.908337716181528e-06, "loss": 1.0238, "step": 10260 }, { "epoch": 0.24, "learning_rate": 8.908103467662793e-06, "loss": 1.1514, "step": 10261 }, { "epoch": 0.24, "learning_rate": 8.907869197094802e-06, "loss": 1.0791, "step": 10262 }, { "epoch": 0.24, "learning_rate": 8.907634904478882e-06, "loss": 0.9204, "step": 10263 }, { "epoch": 0.24, "learning_rate": 8.907400589816348e-06, "loss": 1.1568, "step": 10264 }, { "epoch": 0.24, "learning_rate": 8.907166253108527e-06, "loss": 0.8899, "step": 10265 }, { "epoch": 0.24, "learning_rate": 8.90693189435674e-06, "loss": 1.0618, "step": 10266 }, { "epoch": 0.24, "learning_rate": 8.906697513562309e-06, "loss": 0.7879, "step": 10267 }, { "epoch": 0.24, "learning_rate": 8.906463110726556e-06, "loss": 1.1392, "step": 10268 }, { "epoch": 0.24, "learning_rate": 8.906228685850803e-06, "loss": 0.8651, "step": 10269 }, { "epoch": 0.24, "learning_rate": 8.905994238936376e-06, "loss": 1.0575, "step": 10270 }, { "epoch": 0.24, "learning_rate": 8.905759769984594e-06, "loss": 1.0574, "step": 10271 }, { "epoch": 0.24, "learning_rate": 8.905525278996781e-06, "loss": 0.9405, "step": 10272 }, { "epoch": 0.24, "learning_rate": 8.90529076597426e-06, "loss": 1.0561, "step": 10273 }, { "epoch": 0.24, "learning_rate": 8.905056230918354e-06, "loss": 0.9301, "step": 10274 }, { "epoch": 0.24, "learning_rate": 8.904821673830385e-06, "loss": 1.0117, "step": 10275 }, { "epoch": 0.24, "learning_rate": 8.90458709471168e-06, "loss": 0.9276, "step": 10276 }, { "epoch": 0.24, "learning_rate": 8.90435249356356e-06, "loss": 0.9557, "step": 10277 }, { "epoch": 0.24, "learning_rate": 8.904117870387348e-06, "loss": 1.0737, "step": 10278 }, { "epoch": 0.24, "learning_rate": 8.90388322518437e-06, "loss": 1.0191, "step": 10279 }, { "epoch": 0.24, "learning_rate": 8.903648557955946e-06, "loss": 1.1509, "step": 10280 }, { "epoch": 0.24, "learning_rate": 8.903413868703403e-06, "loss": 0.9865, "step": 10281 }, { "epoch": 0.24, "learning_rate": 8.903179157428065e-06, "loss": 0.8788, "step": 10282 }, { "epoch": 0.24, "learning_rate": 8.902944424131256e-06, "loss": 1.0115, "step": 10283 }, { "epoch": 0.24, "learning_rate": 8.9027096688143e-06, "loss": 1.0018, "step": 10284 }, { "epoch": 0.24, "learning_rate": 8.902474891478521e-06, "loss": 1.104, "step": 10285 }, { "epoch": 0.24, "learning_rate": 8.902240092125245e-06, "loss": 0.8672, "step": 10286 }, { "epoch": 0.24, "learning_rate": 8.902005270755793e-06, "loss": 1.0046, "step": 10287 }, { "epoch": 0.24, "learning_rate": 8.901770427371496e-06, "loss": 1.0382, "step": 10288 }, { "epoch": 0.24, "learning_rate": 8.901535561973674e-06, "loss": 0.9911, "step": 10289 }, { "epoch": 0.24, "learning_rate": 8.901300674563655e-06, "loss": 0.8852, "step": 10290 }, { "epoch": 0.24, "learning_rate": 8.901065765142762e-06, "loss": 0.8562, "step": 10291 }, { "epoch": 0.24, "learning_rate": 8.900830833712322e-06, "loss": 0.806, "step": 10292 }, { "epoch": 0.24, "learning_rate": 8.900595880273658e-06, "loss": 1.0709, "step": 10293 }, { "epoch": 0.24, "learning_rate": 8.900360904828098e-06, "loss": 1.1863, "step": 10294 }, { "epoch": 0.24, "learning_rate": 8.900125907376968e-06, "loss": 1.0559, "step": 10295 }, { "epoch": 0.24, "learning_rate": 8.899890887921593e-06, "loss": 0.9346, "step": 10296 }, { "epoch": 0.24, "learning_rate": 8.899655846463298e-06, "loss": 1.3267, "step": 10297 }, { "epoch": 0.24, "learning_rate": 8.89942078300341e-06, "loss": 1.0099, "step": 10298 }, { "epoch": 0.24, "learning_rate": 8.899185697543255e-06, "loss": 0.955, "step": 10299 }, { "epoch": 0.24, "learning_rate": 8.898950590084162e-06, "loss": 0.9544, "step": 10300 }, { "epoch": 0.24, "learning_rate": 8.898715460627453e-06, "loss": 1.1466, "step": 10301 }, { "epoch": 0.24, "learning_rate": 8.898480309174456e-06, "loss": 0.9484, "step": 10302 }, { "epoch": 0.24, "learning_rate": 8.898245135726498e-06, "loss": 0.819, "step": 10303 }, { "epoch": 0.24, "learning_rate": 8.898009940284908e-06, "loss": 0.9258, "step": 10304 }, { "epoch": 0.24, "learning_rate": 8.89777472285101e-06, "loss": 0.9272, "step": 10305 }, { "epoch": 0.24, "learning_rate": 8.897539483426132e-06, "loss": 0.9731, "step": 10306 }, { "epoch": 0.24, "learning_rate": 8.897304222011602e-06, "loss": 0.9741, "step": 10307 }, { "epoch": 0.24, "learning_rate": 8.897068938608746e-06, "loss": 1.122, "step": 10308 }, { "epoch": 0.24, "learning_rate": 8.896833633218893e-06, "loss": 1.0558, "step": 10309 }, { "epoch": 0.24, "learning_rate": 8.896598305843368e-06, "loss": 1.0801, "step": 10310 }, { "epoch": 0.24, "learning_rate": 8.896362956483502e-06, "loss": 0.9762, "step": 10311 }, { "epoch": 0.24, "learning_rate": 8.896127585140621e-06, "loss": 1.058, "step": 10312 }, { "epoch": 0.24, "learning_rate": 8.895892191816053e-06, "loss": 0.8496, "step": 10313 }, { "epoch": 0.24, "learning_rate": 8.895656776511125e-06, "loss": 0.7664, "step": 10314 }, { "epoch": 0.24, "learning_rate": 8.895421339227168e-06, "loss": 1.0392, "step": 10315 }, { "epoch": 0.24, "learning_rate": 8.895185879965508e-06, "loss": 0.9207, "step": 10316 }, { "epoch": 0.24, "learning_rate": 8.894950398727475e-06, "loss": 1.1401, "step": 10317 }, { "epoch": 0.24, "learning_rate": 8.894714895514397e-06, "loss": 1.1839, "step": 10318 }, { "epoch": 0.24, "learning_rate": 8.894479370327602e-06, "loss": 0.8615, "step": 10319 }, { "epoch": 0.24, "learning_rate": 8.894243823168419e-06, "loss": 0.9999, "step": 10320 }, { "epoch": 0.24, "learning_rate": 8.894008254038178e-06, "loss": 0.9654, "step": 10321 }, { "epoch": 0.24, "learning_rate": 8.893772662938206e-06, "loss": 0.9444, "step": 10322 }, { "epoch": 0.24, "learning_rate": 8.893537049869834e-06, "loss": 1.0921, "step": 10323 }, { "epoch": 0.24, "learning_rate": 8.89330141483439e-06, "loss": 0.8636, "step": 10324 }, { "epoch": 0.24, "learning_rate": 8.893065757833206e-06, "loss": 0.7832, "step": 10325 }, { "epoch": 0.24, "learning_rate": 8.89283007886761e-06, "loss": 0.9769, "step": 10326 }, { "epoch": 0.24, "learning_rate": 8.89259437793893e-06, "loss": 0.9984, "step": 10327 }, { "epoch": 0.24, "learning_rate": 8.892358655048498e-06, "loss": 1.1429, "step": 10328 }, { "epoch": 0.24, "learning_rate": 8.892122910197642e-06, "loss": 0.972, "step": 10329 }, { "epoch": 0.24, "learning_rate": 8.891887143387694e-06, "loss": 0.7698, "step": 10330 }, { "epoch": 0.24, "learning_rate": 8.891651354619985e-06, "loss": 0.9522, "step": 10331 }, { "epoch": 0.24, "learning_rate": 8.891415543895843e-06, "loss": 1.021, "step": 10332 }, { "epoch": 0.24, "learning_rate": 8.891179711216598e-06, "loss": 1.1619, "step": 10333 }, { "epoch": 0.24, "learning_rate": 8.890943856583583e-06, "loss": 0.9026, "step": 10334 }, { "epoch": 0.24, "learning_rate": 8.890707979998125e-06, "loss": 0.9178, "step": 10335 }, { "epoch": 0.24, "learning_rate": 8.890472081461561e-06, "loss": 0.8796, "step": 10336 }, { "epoch": 0.24, "learning_rate": 8.890236160975217e-06, "loss": 1.0404, "step": 10337 }, { "epoch": 0.24, "learning_rate": 8.890000218540422e-06, "loss": 0.8488, "step": 10338 }, { "epoch": 0.24, "learning_rate": 8.889764254158515e-06, "loss": 0.8378, "step": 10339 }, { "epoch": 0.24, "learning_rate": 8.88952826783082e-06, "loss": 0.986, "step": 10340 }, { "epoch": 0.24, "learning_rate": 8.88929225955867e-06, "loss": 0.8677, "step": 10341 }, { "epoch": 0.24, "learning_rate": 8.8890562293434e-06, "loss": 1.1715, "step": 10342 }, { "epoch": 0.24, "learning_rate": 8.88882017718634e-06, "loss": 0.8958, "step": 10343 }, { "epoch": 0.24, "learning_rate": 8.888584103088819e-06, "loss": 1.109, "step": 10344 }, { "epoch": 0.24, "learning_rate": 8.888348007052172e-06, "loss": 0.9075, "step": 10345 }, { "epoch": 0.24, "learning_rate": 8.888111889077729e-06, "loss": 1.2974, "step": 10346 }, { "epoch": 0.24, "learning_rate": 8.887875749166823e-06, "loss": 0.9082, "step": 10347 }, { "epoch": 0.24, "learning_rate": 8.887639587320788e-06, "loss": 0.8279, "step": 10348 }, { "epoch": 0.24, "learning_rate": 8.887403403540954e-06, "loss": 0.9882, "step": 10349 }, { "epoch": 0.24, "learning_rate": 8.887167197828655e-06, "loss": 0.9124, "step": 10350 }, { "epoch": 0.24, "learning_rate": 8.88693097018522e-06, "loss": 0.9299, "step": 10351 }, { "epoch": 0.24, "learning_rate": 8.88669472061199e-06, "loss": 0.8288, "step": 10352 }, { "epoch": 0.24, "learning_rate": 8.88645844911029e-06, "loss": 0.7271, "step": 10353 }, { "epoch": 0.24, "learning_rate": 8.886222155681457e-06, "loss": 0.9073, "step": 10354 }, { "epoch": 0.24, "learning_rate": 8.885985840326821e-06, "loss": 0.9667, "step": 10355 }, { "epoch": 0.24, "learning_rate": 8.885749503047718e-06, "loss": 0.8859, "step": 10356 }, { "epoch": 0.24, "learning_rate": 8.885513143845482e-06, "loss": 1.0182, "step": 10357 }, { "epoch": 0.24, "learning_rate": 8.885276762721441e-06, "loss": 0.8883, "step": 10358 }, { "epoch": 0.24, "learning_rate": 8.885040359676937e-06, "loss": 0.6893, "step": 10359 }, { "epoch": 0.24, "learning_rate": 8.8848039347133e-06, "loss": 0.9384, "step": 10360 }, { "epoch": 0.24, "learning_rate": 8.88456748783186e-06, "loss": 1.067, "step": 10361 }, { "epoch": 0.24, "learning_rate": 8.884331019033956e-06, "loss": 0.9565, "step": 10362 }, { "epoch": 0.24, "learning_rate": 8.884094528320921e-06, "loss": 0.7284, "step": 10363 }, { "epoch": 0.24, "learning_rate": 8.883858015694089e-06, "loss": 1.1107, "step": 10364 }, { "epoch": 0.24, "learning_rate": 8.883621481154794e-06, "loss": 0.926, "step": 10365 }, { "epoch": 0.24, "learning_rate": 8.883384924704371e-06, "loss": 0.9996, "step": 10366 }, { "epoch": 0.24, "learning_rate": 8.883148346344153e-06, "loss": 1.0947, "step": 10367 }, { "epoch": 0.24, "learning_rate": 8.882911746075478e-06, "loss": 1.3714, "step": 10368 }, { "epoch": 0.24, "learning_rate": 8.882675123899677e-06, "loss": 1.1461, "step": 10369 }, { "epoch": 0.24, "learning_rate": 8.88243847981809e-06, "loss": 0.924, "step": 10370 }, { "epoch": 0.24, "learning_rate": 8.882201813832048e-06, "loss": 1.2085, "step": 10371 }, { "epoch": 0.24, "learning_rate": 8.881965125942886e-06, "loss": 0.8971, "step": 10372 }, { "epoch": 0.24, "learning_rate": 8.881728416151942e-06, "loss": 1.0535, "step": 10373 }, { "epoch": 0.24, "learning_rate": 8.88149168446055e-06, "loss": 0.7899, "step": 10374 }, { "epoch": 0.24, "learning_rate": 8.881254930870047e-06, "loss": 0.8127, "step": 10375 }, { "epoch": 0.24, "learning_rate": 8.881018155381766e-06, "loss": 0.9082, "step": 10376 }, { "epoch": 0.24, "learning_rate": 8.880781357997046e-06, "loss": 1.2972, "step": 10377 }, { "epoch": 0.24, "learning_rate": 8.88054453871722e-06, "loss": 0.907, "step": 10378 }, { "epoch": 0.24, "learning_rate": 8.880307697543627e-06, "loss": 1.3367, "step": 10379 }, { "epoch": 0.24, "learning_rate": 8.880070834477601e-06, "loss": 0.936, "step": 10380 }, { "epoch": 0.24, "learning_rate": 8.87983394952048e-06, "loss": 1.1003, "step": 10381 }, { "epoch": 0.24, "learning_rate": 8.8795970426736e-06, "loss": 0.9232, "step": 10382 }, { "epoch": 0.24, "learning_rate": 8.879360113938295e-06, "loss": 0.9203, "step": 10383 }, { "epoch": 0.24, "learning_rate": 8.879123163315907e-06, "loss": 0.8328, "step": 10384 }, { "epoch": 0.24, "learning_rate": 8.878886190807769e-06, "loss": 0.6259, "step": 10385 }, { "epoch": 0.24, "learning_rate": 8.878649196415218e-06, "loss": 0.9549, "step": 10386 }, { "epoch": 0.24, "learning_rate": 8.878412180139592e-06, "loss": 0.771, "step": 10387 }, { "epoch": 0.24, "learning_rate": 8.87817514198223e-06, "loss": 1.2955, "step": 10388 }, { "epoch": 0.24, "learning_rate": 8.877938081944467e-06, "loss": 0.838, "step": 10389 }, { "epoch": 0.24, "learning_rate": 8.877701000027641e-06, "loss": 0.952, "step": 10390 }, { "epoch": 0.24, "learning_rate": 8.87746389623309e-06, "loss": 1.2287, "step": 10391 }, { "epoch": 0.24, "learning_rate": 8.87722677056215e-06, "loss": 1.0063, "step": 10392 }, { "epoch": 0.24, "learning_rate": 8.876989623016163e-06, "loss": 1.1545, "step": 10393 }, { "epoch": 0.24, "learning_rate": 8.876752453596462e-06, "loss": 1.1143, "step": 10394 }, { "epoch": 0.24, "learning_rate": 8.876515262304387e-06, "loss": 0.988, "step": 10395 }, { "epoch": 0.24, "learning_rate": 8.876278049141279e-06, "loss": 0.8216, "step": 10396 }, { "epoch": 0.24, "learning_rate": 8.876040814108474e-06, "loss": 1.2646, "step": 10397 }, { "epoch": 0.24, "learning_rate": 8.875803557207308e-06, "loss": 1.0975, "step": 10398 }, { "epoch": 0.24, "learning_rate": 8.875566278439122e-06, "loss": 0.9095, "step": 10399 }, { "epoch": 0.24, "learning_rate": 8.875328977805256e-06, "loss": 0.866, "step": 10400 }, { "epoch": 0.24, "learning_rate": 8.875091655307046e-06, "loss": 0.8873, "step": 10401 }, { "epoch": 0.24, "learning_rate": 8.874854310945833e-06, "loss": 0.7396, "step": 10402 }, { "epoch": 0.24, "learning_rate": 8.874616944722956e-06, "loss": 1.1243, "step": 10403 }, { "epoch": 0.24, "learning_rate": 8.874379556639755e-06, "loss": 0.9817, "step": 10404 }, { "epoch": 0.24, "learning_rate": 8.874142146697567e-06, "loss": 0.87, "step": 10405 }, { "epoch": 0.24, "learning_rate": 8.873904714897733e-06, "loss": 0.8774, "step": 10406 }, { "epoch": 0.24, "learning_rate": 8.87366726124159e-06, "loss": 0.8103, "step": 10407 }, { "epoch": 0.24, "learning_rate": 8.873429785730482e-06, "loss": 0.8858, "step": 10408 }, { "epoch": 0.24, "learning_rate": 8.873192288365746e-06, "loss": 0.9278, "step": 10409 }, { "epoch": 0.24, "learning_rate": 8.872954769148722e-06, "loss": 1.0373, "step": 10410 }, { "epoch": 0.24, "learning_rate": 8.872717228080752e-06, "loss": 0.997, "step": 10411 }, { "epoch": 0.24, "learning_rate": 8.872479665163174e-06, "loss": 0.8335, "step": 10412 }, { "epoch": 0.24, "learning_rate": 8.87224208039733e-06, "loss": 1.0224, "step": 10413 }, { "epoch": 0.24, "learning_rate": 8.872004473784557e-06, "loss": 1.2176, "step": 10414 }, { "epoch": 0.24, "learning_rate": 8.8717668453262e-06, "loss": 0.9208, "step": 10415 }, { "epoch": 0.24, "learning_rate": 8.871529195023599e-06, "loss": 1.0494, "step": 10416 }, { "epoch": 0.24, "learning_rate": 8.87129152287809e-06, "loss": 1.0619, "step": 10417 }, { "epoch": 0.24, "learning_rate": 8.871053828891021e-06, "loss": 1.0338, "step": 10418 }, { "epoch": 0.24, "learning_rate": 8.870816113063728e-06, "loss": 1.2443, "step": 10419 }, { "epoch": 0.24, "learning_rate": 8.870578375397554e-06, "loss": 0.8889, "step": 10420 }, { "epoch": 0.24, "learning_rate": 8.87034061589384e-06, "loss": 1.2836, "step": 10421 }, { "epoch": 0.24, "learning_rate": 8.870102834553928e-06, "loss": 1.018, "step": 10422 }, { "epoch": 0.24, "learning_rate": 8.86986503137916e-06, "loss": 1.0362, "step": 10423 }, { "epoch": 0.24, "learning_rate": 8.869627206370875e-06, "loss": 1.0252, "step": 10424 }, { "epoch": 0.24, "learning_rate": 8.869389359530416e-06, "loss": 1.1752, "step": 10425 }, { "epoch": 0.24, "learning_rate": 8.869151490859127e-06, "loss": 0.9958, "step": 10426 }, { "epoch": 0.24, "learning_rate": 8.868913600358348e-06, "loss": 1.0896, "step": 10427 }, { "epoch": 0.24, "learning_rate": 8.868675688029422e-06, "loss": 1.3593, "step": 10428 }, { "epoch": 0.24, "learning_rate": 8.86843775387369e-06, "loss": 0.8886, "step": 10429 }, { "epoch": 0.24, "learning_rate": 8.868199797892497e-06, "loss": 0.9605, "step": 10430 }, { "epoch": 0.24, "learning_rate": 8.867961820087181e-06, "loss": 0.8996, "step": 10431 }, { "epoch": 0.24, "learning_rate": 8.867723820459089e-06, "loss": 0.824, "step": 10432 }, { "epoch": 0.24, "learning_rate": 8.867485799009564e-06, "loss": 1.0025, "step": 10433 }, { "epoch": 0.24, "learning_rate": 8.867247755739945e-06, "loss": 1.0677, "step": 10434 }, { "epoch": 0.24, "learning_rate": 8.867009690651578e-06, "loss": 1.1008, "step": 10435 }, { "epoch": 0.24, "learning_rate": 8.866771603745805e-06, "loss": 0.8828, "step": 10436 }, { "epoch": 0.24, "learning_rate": 8.86653349502397e-06, "loss": 0.986, "step": 10437 }, { "epoch": 0.24, "learning_rate": 8.866295364487416e-06, "loss": 0.9662, "step": 10438 }, { "epoch": 0.24, "learning_rate": 8.866057212137486e-06, "loss": 0.9115, "step": 10439 }, { "epoch": 0.24, "learning_rate": 8.865819037975526e-06, "loss": 0.9328, "step": 10440 }, { "epoch": 0.24, "learning_rate": 8.865580842002875e-06, "loss": 0.9157, "step": 10441 }, { "epoch": 0.24, "learning_rate": 8.865342624220883e-06, "loss": 0.8177, "step": 10442 }, { "epoch": 0.24, "learning_rate": 8.865104384630887e-06, "loss": 1.2089, "step": 10443 }, { "epoch": 0.24, "learning_rate": 8.864866123234238e-06, "loss": 0.9711, "step": 10444 }, { "epoch": 0.24, "learning_rate": 8.864627840032276e-06, "loss": 1.1327, "step": 10445 }, { "epoch": 0.24, "learning_rate": 8.864389535026348e-06, "loss": 1.0581, "step": 10446 }, { "epoch": 0.24, "learning_rate": 8.864151208217795e-06, "loss": 0.9988, "step": 10447 }, { "epoch": 0.24, "learning_rate": 8.863912859607966e-06, "loss": 1.0339, "step": 10448 }, { "epoch": 0.24, "learning_rate": 8.863674489198202e-06, "loss": 1.4216, "step": 10449 }, { "epoch": 0.24, "learning_rate": 8.863436096989849e-06, "loss": 0.8293, "step": 10450 }, { "epoch": 0.24, "learning_rate": 8.863197682984253e-06, "loss": 0.9409, "step": 10451 }, { "epoch": 0.24, "learning_rate": 8.862959247182758e-06, "loss": 0.8853, "step": 10452 }, { "epoch": 0.24, "learning_rate": 8.86272078958671e-06, "loss": 1.0598, "step": 10453 }, { "epoch": 0.24, "learning_rate": 8.862482310197454e-06, "loss": 1.0543, "step": 10454 }, { "epoch": 0.24, "learning_rate": 8.862243809016337e-06, "loss": 0.9644, "step": 10455 }, { "epoch": 0.24, "learning_rate": 8.862005286044701e-06, "loss": 0.8477, "step": 10456 }, { "epoch": 0.24, "learning_rate": 8.861766741283895e-06, "loss": 0.8864, "step": 10457 }, { "epoch": 0.24, "learning_rate": 8.861528174735263e-06, "loss": 0.9818, "step": 10458 }, { "epoch": 0.24, "learning_rate": 8.861289586400153e-06, "loss": 1.1139, "step": 10459 }, { "epoch": 0.24, "learning_rate": 8.861050976279908e-06, "loss": 1.0096, "step": 10460 }, { "epoch": 0.24, "learning_rate": 8.860812344375877e-06, "loss": 1.1158, "step": 10461 }, { "epoch": 0.24, "learning_rate": 8.860573690689406e-06, "loss": 0.9107, "step": 10462 }, { "epoch": 0.24, "learning_rate": 8.860335015221839e-06, "loss": 1.2973, "step": 10463 }, { "epoch": 0.24, "learning_rate": 8.860096317974526e-06, "loss": 0.8426, "step": 10464 }, { "epoch": 0.24, "learning_rate": 8.859857598948812e-06, "loss": 1.105, "step": 10465 }, { "epoch": 0.24, "learning_rate": 8.859618858146045e-06, "loss": 1.1155, "step": 10466 }, { "epoch": 0.24, "learning_rate": 8.859380095567569e-06, "loss": 0.9539, "step": 10467 }, { "epoch": 0.24, "learning_rate": 8.859141311214733e-06, "loss": 0.9026, "step": 10468 }, { "epoch": 0.24, "learning_rate": 8.858902505088885e-06, "loss": 1.1677, "step": 10469 }, { "epoch": 0.24, "learning_rate": 8.85866367719137e-06, "loss": 0.9526, "step": 10470 }, { "epoch": 0.24, "learning_rate": 8.85842482752354e-06, "loss": 0.8794, "step": 10471 }, { "epoch": 0.24, "learning_rate": 8.858185956086738e-06, "loss": 1.1059, "step": 10472 }, { "epoch": 0.24, "learning_rate": 8.857947062882312e-06, "loss": 1.032, "step": 10473 }, { "epoch": 0.24, "learning_rate": 8.857708147911614e-06, "loss": 0.9421, "step": 10474 }, { "epoch": 0.24, "learning_rate": 8.857469211175986e-06, "loss": 0.8543, "step": 10475 }, { "epoch": 0.24, "learning_rate": 8.85723025267678e-06, "loss": 0.7662, "step": 10476 }, { "epoch": 0.24, "learning_rate": 8.856991272415346e-06, "loss": 1.0747, "step": 10477 }, { "epoch": 0.24, "learning_rate": 8.856752270393025e-06, "loss": 1.0365, "step": 10478 }, { "epoch": 0.24, "learning_rate": 8.856513246611174e-06, "loss": 0.619, "step": 10479 }, { "epoch": 0.24, "learning_rate": 8.856274201071135e-06, "loss": 0.8218, "step": 10480 }, { "epoch": 0.24, "learning_rate": 8.85603513377426e-06, "loss": 0.7681, "step": 10481 }, { "epoch": 0.24, "learning_rate": 8.855796044721898e-06, "loss": 1.011, "step": 10482 }, { "epoch": 0.24, "learning_rate": 8.855556933915395e-06, "loss": 0.7966, "step": 10483 }, { "epoch": 0.24, "learning_rate": 8.855317801356104e-06, "loss": 1.1936, "step": 10484 }, { "epoch": 0.24, "learning_rate": 8.855078647045372e-06, "loss": 0.9687, "step": 10485 }, { "epoch": 0.24, "learning_rate": 8.854839470984548e-06, "loss": 0.852, "step": 10486 }, { "epoch": 0.24, "learning_rate": 8.854600273174981e-06, "loss": 0.8411, "step": 10487 }, { "epoch": 0.24, "learning_rate": 8.854361053618024e-06, "loss": 0.9853, "step": 10488 }, { "epoch": 0.24, "learning_rate": 8.854121812315021e-06, "loss": 0.9932, "step": 10489 }, { "epoch": 0.24, "learning_rate": 8.853882549267328e-06, "loss": 0.9853, "step": 10490 }, { "epoch": 0.24, "learning_rate": 8.853643264476289e-06, "loss": 1.1003, "step": 10491 }, { "epoch": 0.24, "learning_rate": 8.853403957943259e-06, "loss": 1.0381, "step": 10492 }, { "epoch": 0.24, "learning_rate": 8.853164629669583e-06, "loss": 0.9017, "step": 10493 }, { "epoch": 0.24, "learning_rate": 8.852925279656616e-06, "loss": 1.0265, "step": 10494 }, { "epoch": 0.24, "learning_rate": 8.852685907905708e-06, "loss": 0.9608, "step": 10495 }, { "epoch": 0.24, "learning_rate": 8.852446514418207e-06, "loss": 1.1681, "step": 10496 }, { "epoch": 0.24, "learning_rate": 8.852207099195465e-06, "loss": 0.9525, "step": 10497 }, { "epoch": 0.24, "learning_rate": 8.851967662238831e-06, "loss": 1.0696, "step": 10498 }, { "epoch": 0.24, "learning_rate": 8.85172820354966e-06, "loss": 0.9924, "step": 10499 }, { "epoch": 0.24, "learning_rate": 8.8514887231293e-06, "loss": 1.2065, "step": 10500 }, { "epoch": 0.24, "learning_rate": 8.851249220979102e-06, "loss": 0.9336, "step": 10501 }, { "epoch": 0.24, "learning_rate": 8.851009697100416e-06, "loss": 0.8696, "step": 10502 }, { "epoch": 0.24, "learning_rate": 8.850770151494598e-06, "loss": 0.8773, "step": 10503 }, { "epoch": 0.24, "learning_rate": 8.850530584162996e-06, "loss": 0.9119, "step": 10504 }, { "epoch": 0.24, "learning_rate": 8.850290995106963e-06, "loss": 0.9421, "step": 10505 }, { "epoch": 0.24, "learning_rate": 8.850051384327848e-06, "loss": 0.8741, "step": 10506 }, { "epoch": 0.24, "learning_rate": 8.849811751827006e-06, "loss": 0.8036, "step": 10507 }, { "epoch": 0.24, "learning_rate": 8.84957209760579e-06, "loss": 0.9194, "step": 10508 }, { "epoch": 0.24, "learning_rate": 8.849332421665547e-06, "loss": 1.2319, "step": 10509 }, { "epoch": 0.24, "learning_rate": 8.849092724007633e-06, "loss": 1.3378, "step": 10510 }, { "epoch": 0.24, "learning_rate": 8.848853004633401e-06, "loss": 0.9353, "step": 10511 }, { "epoch": 0.24, "learning_rate": 8.8486132635442e-06, "loss": 1.2029, "step": 10512 }, { "epoch": 0.24, "learning_rate": 8.848373500741387e-06, "loss": 1.0889, "step": 10513 }, { "epoch": 0.24, "learning_rate": 8.848133716226313e-06, "loss": 0.9759, "step": 10514 }, { "epoch": 0.24, "learning_rate": 8.847893910000328e-06, "loss": 1.0066, "step": 10515 }, { "epoch": 0.24, "learning_rate": 8.847654082064788e-06, "loss": 0.8184, "step": 10516 }, { "epoch": 0.24, "learning_rate": 8.847414232421046e-06, "loss": 0.6695, "step": 10517 }, { "epoch": 0.24, "learning_rate": 8.847174361070455e-06, "loss": 0.9191, "step": 10518 }, { "epoch": 0.24, "learning_rate": 8.846934468014365e-06, "loss": 0.8911, "step": 10519 }, { "epoch": 0.24, "learning_rate": 8.846694553254137e-06, "loss": 1.0228, "step": 10520 }, { "epoch": 0.24, "learning_rate": 8.846454616791117e-06, "loss": 1.0114, "step": 10521 }, { "epoch": 0.24, "learning_rate": 8.846214658626662e-06, "loss": 0.9473, "step": 10522 }, { "epoch": 0.24, "learning_rate": 8.845974678762124e-06, "loss": 1.0422, "step": 10523 }, { "epoch": 0.24, "learning_rate": 8.84573467719886e-06, "loss": 0.9692, "step": 10524 }, { "epoch": 0.24, "learning_rate": 8.845494653938223e-06, "loss": 0.926, "step": 10525 }, { "epoch": 0.24, "learning_rate": 8.845254608981567e-06, "loss": 0.8163, "step": 10526 }, { "epoch": 0.24, "learning_rate": 8.845014542330245e-06, "loss": 1.005, "step": 10527 }, { "epoch": 0.24, "learning_rate": 8.844774453985613e-06, "loss": 0.9834, "step": 10528 }, { "epoch": 0.24, "learning_rate": 8.844534343949025e-06, "loss": 1.304, "step": 10529 }, { "epoch": 0.24, "learning_rate": 8.844294212221836e-06, "loss": 0.9505, "step": 10530 }, { "epoch": 0.24, "learning_rate": 8.844054058805401e-06, "loss": 1.0083, "step": 10531 }, { "epoch": 0.24, "learning_rate": 8.843813883701073e-06, "loss": 0.9541, "step": 10532 }, { "epoch": 0.24, "learning_rate": 8.843573686910209e-06, "loss": 0.9637, "step": 10533 }, { "epoch": 0.24, "learning_rate": 8.843333468434166e-06, "loss": 1.0489, "step": 10534 }, { "epoch": 0.24, "learning_rate": 8.843093228274294e-06, "loss": 0.9452, "step": 10535 }, { "epoch": 0.24, "learning_rate": 8.842852966431953e-06, "loss": 0.9936, "step": 10536 }, { "epoch": 0.24, "learning_rate": 8.842612682908496e-06, "loss": 1.0075, "step": 10537 }, { "epoch": 0.24, "learning_rate": 8.84237237770528e-06, "loss": 0.6835, "step": 10538 }, { "epoch": 0.24, "learning_rate": 8.842132050823661e-06, "loss": 0.9419, "step": 10539 }, { "epoch": 0.24, "learning_rate": 8.841891702264992e-06, "loss": 0.873, "step": 10540 }, { "epoch": 0.24, "learning_rate": 8.841651332030633e-06, "loss": 1.2301, "step": 10541 }, { "epoch": 0.24, "learning_rate": 8.84141094012194e-06, "loss": 0.9393, "step": 10542 }, { "epoch": 0.24, "learning_rate": 8.841170526540267e-06, "loss": 0.8892, "step": 10543 }, { "epoch": 0.24, "learning_rate": 8.84093009128697e-06, "loss": 0.7821, "step": 10544 }, { "epoch": 0.24, "learning_rate": 8.840689634363406e-06, "loss": 0.8208, "step": 10545 }, { "epoch": 0.24, "learning_rate": 8.840449155770934e-06, "loss": 1.4141, "step": 10546 }, { "epoch": 0.24, "learning_rate": 8.84020865551091e-06, "loss": 1.1359, "step": 10547 }, { "epoch": 0.24, "learning_rate": 8.83996813358469e-06, "loss": 1.0077, "step": 10548 }, { "epoch": 0.24, "learning_rate": 8.839727589993627e-06, "loss": 0.9481, "step": 10549 }, { "epoch": 0.24, "learning_rate": 8.839487024739085e-06, "loss": 1.0029, "step": 10550 }, { "epoch": 0.24, "learning_rate": 8.839246437822417e-06, "loss": 0.9871, "step": 10551 }, { "epoch": 0.24, "learning_rate": 8.839005829244984e-06, "loss": 0.9509, "step": 10552 }, { "epoch": 0.24, "learning_rate": 8.83876519900814e-06, "loss": 1.0269, "step": 10553 }, { "epoch": 0.24, "learning_rate": 8.838524547113244e-06, "loss": 0.7598, "step": 10554 }, { "epoch": 0.24, "learning_rate": 8.838283873561653e-06, "loss": 1.1297, "step": 10555 }, { "epoch": 0.24, "learning_rate": 8.838043178354727e-06, "loss": 1.0406, "step": 10556 }, { "epoch": 0.24, "learning_rate": 8.83780246149382e-06, "loss": 0.648, "step": 10557 }, { "epoch": 0.24, "learning_rate": 8.837561722980295e-06, "loss": 1.0311, "step": 10558 }, { "epoch": 0.24, "learning_rate": 8.837320962815506e-06, "loss": 1.0267, "step": 10559 }, { "epoch": 0.24, "learning_rate": 8.837080181000814e-06, "loss": 0.5736, "step": 10560 }, { "epoch": 0.24, "learning_rate": 8.836839377537577e-06, "loss": 0.7707, "step": 10561 }, { "epoch": 0.24, "learning_rate": 8.836598552427152e-06, "loss": 1.0223, "step": 10562 }, { "epoch": 0.24, "learning_rate": 8.8363577056709e-06, "loss": 0.8936, "step": 10563 }, { "epoch": 0.24, "learning_rate": 8.836116837270178e-06, "loss": 1.0502, "step": 10564 }, { "epoch": 0.25, "learning_rate": 8.835875947226346e-06, "loss": 0.9332, "step": 10565 }, { "epoch": 0.25, "learning_rate": 8.835635035540763e-06, "loss": 1.0904, "step": 10566 }, { "epoch": 0.25, "learning_rate": 8.83539410221479e-06, "loss": 0.9301, "step": 10567 }, { "epoch": 0.25, "learning_rate": 8.835153147249782e-06, "loss": 1.0632, "step": 10568 }, { "epoch": 0.25, "learning_rate": 8.834912170647102e-06, "loss": 0.7661, "step": 10569 }, { "epoch": 0.25, "learning_rate": 8.834671172408108e-06, "loss": 1.023, "step": 10570 }, { "epoch": 0.25, "learning_rate": 8.834430152534157e-06, "loss": 1.221, "step": 10571 }, { "epoch": 0.25, "learning_rate": 8.834189111026616e-06, "loss": 1.0425, "step": 10572 }, { "epoch": 0.25, "learning_rate": 8.83394804788684e-06, "loss": 0.8719, "step": 10573 }, { "epoch": 0.25, "learning_rate": 8.833706963116188e-06, "loss": 0.6457, "step": 10574 }, { "epoch": 0.25, "learning_rate": 8.833465856716023e-06, "loss": 0.9838, "step": 10575 }, { "epoch": 0.25, "learning_rate": 8.833224728687706e-06, "loss": 1.0327, "step": 10576 }, { "epoch": 0.25, "learning_rate": 8.832983579032595e-06, "loss": 1.0375, "step": 10577 }, { "epoch": 0.25, "learning_rate": 8.832742407752051e-06, "loss": 1.041, "step": 10578 }, { "epoch": 0.25, "learning_rate": 8.832501214847435e-06, "loss": 0.5923, "step": 10579 }, { "epoch": 0.25, "learning_rate": 8.832260000320108e-06, "loss": 0.9461, "step": 10580 }, { "epoch": 0.25, "learning_rate": 8.832018764171431e-06, "loss": 0.9303, "step": 10581 }, { "epoch": 0.25, "learning_rate": 8.831777506402764e-06, "loss": 1.0188, "step": 10582 }, { "epoch": 0.25, "learning_rate": 8.831536227015469e-06, "loss": 0.7086, "step": 10583 }, { "epoch": 0.25, "learning_rate": 8.831294926010907e-06, "loss": 1.2398, "step": 10584 }, { "epoch": 0.25, "learning_rate": 8.831053603390441e-06, "loss": 0.9287, "step": 10585 }, { "epoch": 0.25, "learning_rate": 8.83081225915543e-06, "loss": 0.9586, "step": 10586 }, { "epoch": 0.25, "learning_rate": 8.830570893307237e-06, "loss": 1.066, "step": 10587 }, { "epoch": 0.25, "learning_rate": 8.830329505847224e-06, "loss": 0.9548, "step": 10588 }, { "epoch": 0.25, "learning_rate": 8.830088096776752e-06, "loss": 0.7733, "step": 10589 }, { "epoch": 0.25, "learning_rate": 8.829846666097185e-06, "loss": 0.9611, "step": 10590 }, { "epoch": 0.25, "learning_rate": 8.82960521380988e-06, "loss": 0.9857, "step": 10591 }, { "epoch": 0.25, "learning_rate": 8.829363739916206e-06, "loss": 0.9348, "step": 10592 }, { "epoch": 0.25, "learning_rate": 8.82912224441752e-06, "loss": 0.876, "step": 10593 }, { "epoch": 0.25, "learning_rate": 8.82888072731519e-06, "loss": 1.2182, "step": 10594 }, { "epoch": 0.25, "learning_rate": 8.828639188610573e-06, "loss": 0.813, "step": 10595 }, { "epoch": 0.25, "learning_rate": 8.828397628305034e-06, "loss": 0.9834, "step": 10596 }, { "epoch": 0.25, "learning_rate": 8.828156046399939e-06, "loss": 1.2616, "step": 10597 }, { "epoch": 0.25, "learning_rate": 8.827914442896644e-06, "loss": 1.0702, "step": 10598 }, { "epoch": 0.25, "learning_rate": 8.827672817796518e-06, "loss": 0.9185, "step": 10599 }, { "epoch": 0.25, "learning_rate": 8.827431171100922e-06, "loss": 0.9684, "step": 10600 }, { "epoch": 0.25, "learning_rate": 8.82718950281122e-06, "loss": 0.941, "step": 10601 }, { "epoch": 0.25, "learning_rate": 8.826947812928774e-06, "loss": 1.0076, "step": 10602 }, { "epoch": 0.25, "learning_rate": 8.826706101454951e-06, "loss": 1.0278, "step": 10603 }, { "epoch": 0.25, "learning_rate": 8.82646436839111e-06, "loss": 1.0217, "step": 10604 }, { "epoch": 0.25, "learning_rate": 8.82622261373862e-06, "loss": 0.819, "step": 10605 }, { "epoch": 0.25, "learning_rate": 8.82598083749884e-06, "loss": 0.9721, "step": 10606 }, { "epoch": 0.25, "learning_rate": 8.825739039673137e-06, "loss": 0.9205, "step": 10607 }, { "epoch": 0.25, "learning_rate": 8.825497220262875e-06, "loss": 1.1496, "step": 10608 }, { "epoch": 0.25, "learning_rate": 8.825255379269418e-06, "loss": 0.9539, "step": 10609 }, { "epoch": 0.25, "learning_rate": 8.825013516694128e-06, "loss": 0.949, "step": 10610 }, { "epoch": 0.25, "learning_rate": 8.824771632538375e-06, "loss": 1.1115, "step": 10611 }, { "epoch": 0.25, "learning_rate": 8.82452972680352e-06, "loss": 0.9202, "step": 10612 }, { "epoch": 0.25, "learning_rate": 8.824287799490927e-06, "loss": 1.0738, "step": 10613 }, { "epoch": 0.25, "learning_rate": 8.824045850601963e-06, "loss": 1.1186, "step": 10614 }, { "epoch": 0.25, "learning_rate": 8.823803880137993e-06, "loss": 0.769, "step": 10615 }, { "epoch": 0.25, "learning_rate": 8.82356188810038e-06, "loss": 1.0371, "step": 10616 }, { "epoch": 0.25, "learning_rate": 8.823319874490492e-06, "loss": 0.8419, "step": 10617 }, { "epoch": 0.25, "learning_rate": 8.823077839309695e-06, "loss": 1.0922, "step": 10618 }, { "epoch": 0.25, "learning_rate": 8.822835782559351e-06, "loss": 1.2215, "step": 10619 }, { "epoch": 0.25, "learning_rate": 8.822593704240828e-06, "loss": 0.9878, "step": 10620 }, { "epoch": 0.25, "learning_rate": 8.82235160435549e-06, "loss": 1.1011, "step": 10621 }, { "epoch": 0.25, "learning_rate": 8.822109482904706e-06, "loss": 1.0538, "step": 10622 }, { "epoch": 0.25, "learning_rate": 8.82186733988984e-06, "loss": 0.7444, "step": 10623 }, { "epoch": 0.25, "learning_rate": 8.821625175312258e-06, "loss": 1.0769, "step": 10624 }, { "epoch": 0.25, "learning_rate": 8.821382989173327e-06, "loss": 0.8878, "step": 10625 }, { "epoch": 0.25, "learning_rate": 8.821140781474414e-06, "loss": 1.0711, "step": 10626 }, { "epoch": 0.25, "learning_rate": 8.820898552216884e-06, "loss": 0.9734, "step": 10627 }, { "epoch": 0.25, "learning_rate": 8.820656301402102e-06, "loss": 0.8607, "step": 10628 }, { "epoch": 0.25, "learning_rate": 8.820414029031439e-06, "loss": 0.9415, "step": 10629 }, { "epoch": 0.25, "learning_rate": 8.82017173510626e-06, "loss": 1.081, "step": 10630 }, { "epoch": 0.25, "learning_rate": 8.819929419627931e-06, "loss": 1.1891, "step": 10631 }, { "epoch": 0.25, "learning_rate": 8.81968708259782e-06, "loss": 1.2182, "step": 10632 }, { "epoch": 0.25, "learning_rate": 8.819444724017296e-06, "loss": 0.9344, "step": 10633 }, { "epoch": 0.25, "learning_rate": 8.819202343887725e-06, "loss": 0.9724, "step": 10634 }, { "epoch": 0.25, "learning_rate": 8.818959942210473e-06, "loss": 1.1207, "step": 10635 }, { "epoch": 0.25, "learning_rate": 8.818717518986908e-06, "loss": 1.1808, "step": 10636 }, { "epoch": 0.25, "learning_rate": 8.8184750742184e-06, "loss": 1.2416, "step": 10637 }, { "epoch": 0.25, "learning_rate": 8.818232607906314e-06, "loss": 0.8208, "step": 10638 }, { "epoch": 0.25, "learning_rate": 8.81799012005202e-06, "loss": 0.9018, "step": 10639 }, { "epoch": 0.25, "learning_rate": 8.817747610656886e-06, "loss": 1.0725, "step": 10640 }, { "epoch": 0.25, "learning_rate": 8.817505079722277e-06, "loss": 0.978, "step": 10641 }, { "epoch": 0.25, "learning_rate": 8.817262527249567e-06, "loss": 1.3338, "step": 10642 }, { "epoch": 0.25, "learning_rate": 8.81701995324012e-06, "loss": 0.9738, "step": 10643 }, { "epoch": 0.25, "learning_rate": 8.816777357695307e-06, "loss": 1.3799, "step": 10644 }, { "epoch": 0.25, "learning_rate": 8.816534740616496e-06, "loss": 1.0577, "step": 10645 }, { "epoch": 0.25, "learning_rate": 8.816292102005054e-06, "loss": 0.9179, "step": 10646 }, { "epoch": 0.25, "learning_rate": 8.816049441862352e-06, "loss": 1.0676, "step": 10647 }, { "epoch": 0.25, "learning_rate": 8.81580676018976e-06, "loss": 1.1782, "step": 10648 }, { "epoch": 0.25, "learning_rate": 8.815564056988645e-06, "loss": 1.0451, "step": 10649 }, { "epoch": 0.25, "learning_rate": 8.815321332260375e-06, "loss": 1.0517, "step": 10650 }, { "epoch": 0.25, "learning_rate": 8.815078586006325e-06, "loss": 1.0352, "step": 10651 }, { "epoch": 0.25, "learning_rate": 8.81483581822786e-06, "loss": 0.9202, "step": 10652 }, { "epoch": 0.25, "learning_rate": 8.81459302892635e-06, "loss": 1.1841, "step": 10653 }, { "epoch": 0.25, "learning_rate": 8.814350218103167e-06, "loss": 0.9083, "step": 10654 }, { "epoch": 0.25, "learning_rate": 8.814107385759678e-06, "loss": 1.1894, "step": 10655 }, { "epoch": 0.25, "learning_rate": 8.813864531897255e-06, "loss": 0.8523, "step": 10656 }, { "epoch": 0.25, "learning_rate": 8.813621656517269e-06, "loss": 0.9231, "step": 10657 }, { "epoch": 0.25, "learning_rate": 8.813378759621088e-06, "loss": 0.8, "step": 10658 }, { "epoch": 0.25, "learning_rate": 8.813135841210081e-06, "loss": 0.9582, "step": 10659 }, { "epoch": 0.25, "learning_rate": 8.812892901285624e-06, "loss": 0.8916, "step": 10660 }, { "epoch": 0.25, "learning_rate": 8.812649939849085e-06, "loss": 0.9497, "step": 10661 }, { "epoch": 0.25, "learning_rate": 8.812406956901833e-06, "loss": 1.0439, "step": 10662 }, { "epoch": 0.25, "learning_rate": 8.812163952445241e-06, "loss": 0.8198, "step": 10663 }, { "epoch": 0.25, "learning_rate": 8.811920926480678e-06, "loss": 1.0179, "step": 10664 }, { "epoch": 0.25, "learning_rate": 8.811677879009516e-06, "loss": 1.1322, "step": 10665 }, { "epoch": 0.25, "learning_rate": 8.81143481003313e-06, "loss": 1.2443, "step": 10666 }, { "epoch": 0.25, "learning_rate": 8.811191719552884e-06, "loss": 0.9112, "step": 10667 }, { "epoch": 0.25, "learning_rate": 8.810948607570157e-06, "loss": 0.9333, "step": 10668 }, { "epoch": 0.25, "learning_rate": 8.810705474086316e-06, "loss": 0.9647, "step": 10669 }, { "epoch": 0.25, "learning_rate": 8.810462319102733e-06, "loss": 0.8503, "step": 10670 }, { "epoch": 0.25, "learning_rate": 8.810219142620781e-06, "loss": 0.8996, "step": 10671 }, { "epoch": 0.25, "learning_rate": 8.809975944641833e-06, "loss": 0.9363, "step": 10672 }, { "epoch": 0.25, "learning_rate": 8.80973272516726e-06, "loss": 0.9212, "step": 10673 }, { "epoch": 0.25, "learning_rate": 8.809489484198433e-06, "loss": 1.1396, "step": 10674 }, { "epoch": 0.25, "learning_rate": 8.809246221736725e-06, "loss": 1.0334, "step": 10675 }, { "epoch": 0.25, "learning_rate": 8.809002937783509e-06, "loss": 1.0573, "step": 10676 }, { "epoch": 0.25, "learning_rate": 8.808759632340159e-06, "loss": 0.9097, "step": 10677 }, { "epoch": 0.25, "learning_rate": 8.808516305408045e-06, "loss": 0.9514, "step": 10678 }, { "epoch": 0.25, "learning_rate": 8.80827295698854e-06, "loss": 0.993, "step": 10679 }, { "epoch": 0.25, "learning_rate": 8.80802958708302e-06, "loss": 0.9398, "step": 10680 }, { "epoch": 0.25, "learning_rate": 8.807786195692855e-06, "loss": 0.8822, "step": 10681 }, { "epoch": 0.25, "learning_rate": 8.80754278281942e-06, "loss": 1.2182, "step": 10682 }, { "epoch": 0.25, "learning_rate": 8.807299348464088e-06, "loss": 1.0023, "step": 10683 }, { "epoch": 0.25, "learning_rate": 8.807055892628232e-06, "loss": 1.2031, "step": 10684 }, { "epoch": 0.25, "learning_rate": 8.806812415313223e-06, "loss": 1.1551, "step": 10685 }, { "epoch": 0.25, "learning_rate": 8.80656891652044e-06, "loss": 1.0449, "step": 10686 }, { "epoch": 0.25, "learning_rate": 8.806325396251255e-06, "loss": 1.0009, "step": 10687 }, { "epoch": 0.25, "learning_rate": 8.806081854507039e-06, "loss": 1.2534, "step": 10688 }, { "epoch": 0.25, "learning_rate": 8.805838291289167e-06, "loss": 0.9385, "step": 10689 }, { "epoch": 0.25, "learning_rate": 8.805594706599016e-06, "loss": 0.808, "step": 10690 }, { "epoch": 0.25, "learning_rate": 8.805351100437958e-06, "loss": 0.841, "step": 10691 }, { "epoch": 0.25, "learning_rate": 8.805107472807368e-06, "loss": 0.8877, "step": 10692 }, { "epoch": 0.25, "learning_rate": 8.804863823708621e-06, "loss": 1.1374, "step": 10693 }, { "epoch": 0.25, "learning_rate": 8.804620153143091e-06, "loss": 1.062, "step": 10694 }, { "epoch": 0.25, "learning_rate": 8.804376461112152e-06, "loss": 0.9819, "step": 10695 }, { "epoch": 0.25, "learning_rate": 8.804132747617182e-06, "loss": 0.9193, "step": 10696 }, { "epoch": 0.25, "learning_rate": 8.803889012659552e-06, "loss": 0.8595, "step": 10697 }, { "epoch": 0.25, "learning_rate": 8.803645256240638e-06, "loss": 0.9462, "step": 10698 }, { "epoch": 0.25, "learning_rate": 8.803401478361817e-06, "loss": 1.2443, "step": 10699 }, { "epoch": 0.25, "learning_rate": 8.803157679024465e-06, "loss": 1.2166, "step": 10700 }, { "epoch": 0.25, "learning_rate": 8.802913858229956e-06, "loss": 1.115, "step": 10701 }, { "epoch": 0.25, "learning_rate": 8.802670015979664e-06, "loss": 0.913, "step": 10702 }, { "epoch": 0.25, "learning_rate": 8.802426152274967e-06, "loss": 1.0482, "step": 10703 }, { "epoch": 0.25, "learning_rate": 8.802182267117242e-06, "loss": 0.9976, "step": 10704 }, { "epoch": 0.25, "learning_rate": 8.80193836050786e-06, "loss": 1.0063, "step": 10705 }, { "epoch": 0.25, "learning_rate": 8.801694432448202e-06, "loss": 1.0074, "step": 10706 }, { "epoch": 0.25, "learning_rate": 8.801450482939642e-06, "loss": 0.8766, "step": 10707 }, { "epoch": 0.25, "learning_rate": 8.801206511983557e-06, "loss": 1.1267, "step": 10708 }, { "epoch": 0.25, "learning_rate": 8.800962519581325e-06, "loss": 0.9511, "step": 10709 }, { "epoch": 0.25, "learning_rate": 8.80071850573432e-06, "loss": 1.0284, "step": 10710 }, { "epoch": 0.25, "learning_rate": 8.800474470443919e-06, "loss": 1.2087, "step": 10711 }, { "epoch": 0.25, "learning_rate": 8.800230413711501e-06, "loss": 1.0363, "step": 10712 }, { "epoch": 0.25, "learning_rate": 8.79998633553844e-06, "loss": 0.882, "step": 10713 }, { "epoch": 0.25, "learning_rate": 8.799742235926116e-06, "loss": 1.0797, "step": 10714 }, { "epoch": 0.25, "learning_rate": 8.799498114875905e-06, "loss": 0.9145, "step": 10715 }, { "epoch": 0.25, "learning_rate": 8.79925397238918e-06, "loss": 0.9722, "step": 10716 }, { "epoch": 0.25, "learning_rate": 8.799009808467327e-06, "loss": 0.9697, "step": 10717 }, { "epoch": 0.25, "learning_rate": 8.798765623111718e-06, "loss": 0.9948, "step": 10718 }, { "epoch": 0.25, "learning_rate": 8.798521416323732e-06, "loss": 0.999, "step": 10719 }, { "epoch": 0.25, "learning_rate": 8.798277188104747e-06, "loss": 1.1062, "step": 10720 }, { "epoch": 0.25, "learning_rate": 8.798032938456138e-06, "loss": 0.7805, "step": 10721 }, { "epoch": 0.25, "learning_rate": 8.797788667379288e-06, "loss": 1.1126, "step": 10722 }, { "epoch": 0.25, "learning_rate": 8.797544374875571e-06, "loss": 1.2759, "step": 10723 }, { "epoch": 0.25, "learning_rate": 8.797300060946368e-06, "loss": 1.0332, "step": 10724 }, { "epoch": 0.25, "learning_rate": 8.797055725593055e-06, "loss": 0.949, "step": 10725 }, { "epoch": 0.25, "learning_rate": 8.796811368817014e-06, "loss": 0.7656, "step": 10726 }, { "epoch": 0.25, "learning_rate": 8.79656699061962e-06, "loss": 1.007, "step": 10727 }, { "epoch": 0.25, "learning_rate": 8.796322591002253e-06, "loss": 0.9448, "step": 10728 }, { "epoch": 0.25, "learning_rate": 8.796078169966294e-06, "loss": 1.1448, "step": 10729 }, { "epoch": 0.25, "learning_rate": 8.795833727513119e-06, "loss": 0.8748, "step": 10730 }, { "epoch": 0.25, "learning_rate": 8.795589263644108e-06, "loss": 0.8387, "step": 10731 }, { "epoch": 0.25, "learning_rate": 8.795344778360641e-06, "loss": 0.9752, "step": 10732 }, { "epoch": 0.25, "learning_rate": 8.795100271664096e-06, "loss": 1.172, "step": 10733 }, { "epoch": 0.25, "learning_rate": 8.794855743555855e-06, "loss": 0.9345, "step": 10734 }, { "epoch": 0.25, "learning_rate": 8.794611194037295e-06, "loss": 0.9838, "step": 10735 }, { "epoch": 0.25, "learning_rate": 8.794366623109798e-06, "loss": 0.9683, "step": 10736 }, { "epoch": 0.25, "learning_rate": 8.794122030774741e-06, "loss": 1.044, "step": 10737 }, { "epoch": 0.25, "learning_rate": 8.793877417033505e-06, "loss": 1.0127, "step": 10738 }, { "epoch": 0.25, "learning_rate": 8.793632781887473e-06, "loss": 0.8121, "step": 10739 }, { "epoch": 0.25, "learning_rate": 8.793388125338022e-06, "loss": 1.2768, "step": 10740 }, { "epoch": 0.25, "learning_rate": 8.793143447386531e-06, "loss": 1.1337, "step": 10741 }, { "epoch": 0.25, "learning_rate": 8.792898748034386e-06, "loss": 0.9905, "step": 10742 }, { "epoch": 0.25, "learning_rate": 8.792654027282962e-06, "loss": 0.9763, "step": 10743 }, { "epoch": 0.25, "learning_rate": 8.792409285133644e-06, "loss": 0.9323, "step": 10744 }, { "epoch": 0.25, "learning_rate": 8.792164521587808e-06, "loss": 1.2975, "step": 10745 }, { "epoch": 0.25, "learning_rate": 8.791919736646841e-06, "loss": 0.9667, "step": 10746 }, { "epoch": 0.25, "learning_rate": 8.791674930312118e-06, "loss": 0.7392, "step": 10747 }, { "epoch": 0.25, "learning_rate": 8.791430102585025e-06, "loss": 0.9347, "step": 10748 }, { "epoch": 0.25, "learning_rate": 8.791185253466941e-06, "loss": 1.0429, "step": 10749 }, { "epoch": 0.25, "learning_rate": 8.790940382959245e-06, "loss": 1.0663, "step": 10750 }, { "epoch": 0.25, "learning_rate": 8.790695491063323e-06, "loss": 1.2616, "step": 10751 }, { "epoch": 0.25, "learning_rate": 8.790450577780557e-06, "loss": 1.0123, "step": 10752 }, { "epoch": 0.25, "learning_rate": 8.790205643112325e-06, "loss": 0.9401, "step": 10753 }, { "epoch": 0.25, "learning_rate": 8.789960687060009e-06, "loss": 1.0375, "step": 10754 }, { "epoch": 0.25, "learning_rate": 8.789715709624993e-06, "loss": 1.0192, "step": 10755 }, { "epoch": 0.25, "learning_rate": 8.78947071080866e-06, "loss": 0.9686, "step": 10756 }, { "epoch": 0.25, "learning_rate": 8.789225690612392e-06, "loss": 0.8491, "step": 10757 }, { "epoch": 0.25, "learning_rate": 8.788980649037568e-06, "loss": 0.8748, "step": 10758 }, { "epoch": 0.25, "learning_rate": 8.788735586085574e-06, "loss": 0.8066, "step": 10759 }, { "epoch": 0.25, "learning_rate": 8.788490501757791e-06, "loss": 0.9332, "step": 10760 }, { "epoch": 0.25, "learning_rate": 8.788245396055604e-06, "loss": 1.0465, "step": 10761 }, { "epoch": 0.25, "learning_rate": 8.788000268980392e-06, "loss": 0.8648, "step": 10762 }, { "epoch": 0.25, "learning_rate": 8.787755120533542e-06, "loss": 1.0044, "step": 10763 }, { "epoch": 0.25, "learning_rate": 8.787509950716434e-06, "loss": 0.843, "step": 10764 }, { "epoch": 0.25, "learning_rate": 8.787264759530452e-06, "loss": 0.9773, "step": 10765 }, { "epoch": 0.25, "learning_rate": 8.787019546976983e-06, "loss": 0.8766, "step": 10766 }, { "epoch": 0.25, "learning_rate": 8.786774313057405e-06, "loss": 1.0395, "step": 10767 }, { "epoch": 0.25, "learning_rate": 8.786529057773103e-06, "loss": 0.9435, "step": 10768 }, { "epoch": 0.25, "learning_rate": 8.786283781125462e-06, "loss": 1.0641, "step": 10769 }, { "epoch": 0.25, "learning_rate": 8.786038483115866e-06, "loss": 1.1015, "step": 10770 }, { "epoch": 0.25, "learning_rate": 8.785793163745698e-06, "loss": 1.17, "step": 10771 }, { "epoch": 0.25, "learning_rate": 8.785547823016342e-06, "loss": 0.9005, "step": 10772 }, { "epoch": 0.25, "learning_rate": 8.785302460929185e-06, "loss": 1.2483, "step": 10773 }, { "epoch": 0.25, "learning_rate": 8.785057077485607e-06, "loss": 0.8974, "step": 10774 }, { "epoch": 0.25, "learning_rate": 8.784811672686995e-06, "loss": 0.9619, "step": 10775 }, { "epoch": 0.25, "learning_rate": 8.784566246534732e-06, "loss": 0.81, "step": 10776 }, { "epoch": 0.25, "learning_rate": 8.784320799030206e-06, "loss": 1.2254, "step": 10777 }, { "epoch": 0.25, "learning_rate": 8.784075330174798e-06, "loss": 1.0698, "step": 10778 }, { "epoch": 0.25, "learning_rate": 8.783829839969893e-06, "loss": 0.949, "step": 10779 }, { "epoch": 0.25, "learning_rate": 8.783584328416879e-06, "loss": 1.0158, "step": 10780 }, { "epoch": 0.25, "learning_rate": 8.78333879551714e-06, "loss": 1.0905, "step": 10781 }, { "epoch": 0.25, "learning_rate": 8.783093241272061e-06, "loss": 1.1662, "step": 10782 }, { "epoch": 0.25, "learning_rate": 8.782847665683026e-06, "loss": 1.0118, "step": 10783 }, { "epoch": 0.25, "learning_rate": 8.782602068751423e-06, "loss": 0.9904, "step": 10784 }, { "epoch": 0.25, "learning_rate": 8.782356450478636e-06, "loss": 1.1582, "step": 10785 }, { "epoch": 0.25, "learning_rate": 8.782110810866049e-06, "loss": 1.1488, "step": 10786 }, { "epoch": 0.25, "learning_rate": 8.781865149915052e-06, "loss": 0.9027, "step": 10787 }, { "epoch": 0.25, "learning_rate": 8.78161946762703e-06, "loss": 0.8192, "step": 10788 }, { "epoch": 0.25, "learning_rate": 8.781373764003367e-06, "loss": 0.8324, "step": 10789 }, { "epoch": 0.25, "learning_rate": 8.78112803904545e-06, "loss": 0.9102, "step": 10790 }, { "epoch": 0.25, "learning_rate": 8.780882292754666e-06, "loss": 0.9916, "step": 10791 }, { "epoch": 0.25, "learning_rate": 8.780636525132403e-06, "loss": 0.9066, "step": 10792 }, { "epoch": 0.25, "learning_rate": 8.780390736180044e-06, "loss": 1.0305, "step": 10793 }, { "epoch": 0.25, "learning_rate": 8.780144925898978e-06, "loss": 0.9095, "step": 10794 }, { "epoch": 0.25, "learning_rate": 8.779899094290592e-06, "loss": 1.1103, "step": 10795 }, { "epoch": 0.25, "learning_rate": 8.779653241356273e-06, "loss": 0.98, "step": 10796 }, { "epoch": 0.25, "learning_rate": 8.779407367097405e-06, "loss": 0.8907, "step": 10797 }, { "epoch": 0.25, "learning_rate": 8.77916147151538e-06, "loss": 0.9843, "step": 10798 }, { "epoch": 0.25, "learning_rate": 8.778915554611583e-06, "loss": 0.893, "step": 10799 }, { "epoch": 0.25, "learning_rate": 8.7786696163874e-06, "loss": 0.8504, "step": 10800 }, { "epoch": 0.25, "learning_rate": 8.778423656844222e-06, "loss": 1.0453, "step": 10801 }, { "epoch": 0.25, "learning_rate": 8.778177675983433e-06, "loss": 1.0845, "step": 10802 }, { "epoch": 0.25, "learning_rate": 8.777931673806423e-06, "loss": 0.7979, "step": 10803 }, { "epoch": 0.25, "learning_rate": 8.77768565031458e-06, "loss": 1.1403, "step": 10804 }, { "epoch": 0.25, "learning_rate": 8.777439605509292e-06, "loss": 1.0874, "step": 10805 }, { "epoch": 0.25, "learning_rate": 8.777193539391947e-06, "loss": 1.156, "step": 10806 }, { "epoch": 0.25, "learning_rate": 8.77694745196393e-06, "loss": 0.9484, "step": 10807 }, { "epoch": 0.25, "learning_rate": 8.776701343226635e-06, "loss": 1.1117, "step": 10808 }, { "epoch": 0.25, "learning_rate": 8.776455213181447e-06, "loss": 0.9646, "step": 10809 }, { "epoch": 0.25, "learning_rate": 8.776209061829755e-06, "loss": 0.9631, "step": 10810 }, { "epoch": 0.25, "learning_rate": 8.775962889172948e-06, "loss": 1.1414, "step": 10811 }, { "epoch": 0.25, "learning_rate": 8.775716695212417e-06, "loss": 1.3573, "step": 10812 }, { "epoch": 0.25, "learning_rate": 8.775470479949548e-06, "loss": 0.7894, "step": 10813 }, { "epoch": 0.25, "learning_rate": 8.775224243385733e-06, "loss": 0.841, "step": 10814 }, { "epoch": 0.25, "learning_rate": 8.774977985522358e-06, "loss": 0.8313, "step": 10815 }, { "epoch": 0.25, "learning_rate": 8.774731706360814e-06, "loss": 1.089, "step": 10816 }, { "epoch": 0.25, "learning_rate": 8.774485405902492e-06, "loss": 1.1097, "step": 10817 }, { "epoch": 0.25, "learning_rate": 8.77423908414878e-06, "loss": 0.8968, "step": 10818 }, { "epoch": 0.25, "learning_rate": 8.773992741101065e-06, "loss": 1.1426, "step": 10819 }, { "epoch": 0.25, "learning_rate": 8.77374637676074e-06, "loss": 0.9655, "step": 10820 }, { "epoch": 0.25, "learning_rate": 8.773499991129197e-06, "loss": 1.1402, "step": 10821 }, { "epoch": 0.25, "learning_rate": 8.773253584207823e-06, "loss": 1.1829, "step": 10822 }, { "epoch": 0.25, "learning_rate": 8.77300715599801e-06, "loss": 0.9016, "step": 10823 }, { "epoch": 0.25, "learning_rate": 8.772760706501146e-06, "loss": 0.8942, "step": 10824 }, { "epoch": 0.25, "learning_rate": 8.772514235718621e-06, "loss": 0.9636, "step": 10825 }, { "epoch": 0.25, "learning_rate": 8.77226774365183e-06, "loss": 1.0292, "step": 10826 }, { "epoch": 0.25, "learning_rate": 8.77202123030216e-06, "loss": 0.9894, "step": 10827 }, { "epoch": 0.25, "learning_rate": 8.771774695671002e-06, "loss": 1.0955, "step": 10828 }, { "epoch": 0.25, "learning_rate": 8.771528139759749e-06, "loss": 1.1528, "step": 10829 }, { "epoch": 0.25, "learning_rate": 8.771281562569791e-06, "loss": 0.9881, "step": 10830 }, { "epoch": 0.25, "learning_rate": 8.771034964102519e-06, "loss": 1.1339, "step": 10831 }, { "epoch": 0.25, "learning_rate": 8.770788344359322e-06, "loss": 0.8021, "step": 10832 }, { "epoch": 0.25, "learning_rate": 8.770541703341596e-06, "loss": 1.1282, "step": 10833 }, { "epoch": 0.25, "learning_rate": 8.77029504105073e-06, "loss": 1.1501, "step": 10834 }, { "epoch": 0.25, "learning_rate": 8.770048357488114e-06, "loss": 0.9285, "step": 10835 }, { "epoch": 0.25, "learning_rate": 8.769801652655143e-06, "loss": 0.8079, "step": 10836 }, { "epoch": 0.25, "learning_rate": 8.769554926553207e-06, "loss": 1.1051, "step": 10837 }, { "epoch": 0.25, "learning_rate": 8.7693081791837e-06, "loss": 0.9397, "step": 10838 }, { "epoch": 0.25, "learning_rate": 8.769061410548012e-06, "loss": 0.9352, "step": 10839 }, { "epoch": 0.25, "learning_rate": 8.768814620647534e-06, "loss": 0.9944, "step": 10840 }, { "epoch": 0.25, "learning_rate": 8.76856780948366e-06, "loss": 0.9854, "step": 10841 }, { "epoch": 0.25, "learning_rate": 8.768320977057785e-06, "loss": 0.999, "step": 10842 }, { "epoch": 0.25, "learning_rate": 8.7680741233713e-06, "loss": 1.0081, "step": 10843 }, { "epoch": 0.25, "learning_rate": 8.767827248425595e-06, "loss": 1.0276, "step": 10844 }, { "epoch": 0.25, "learning_rate": 8.767580352222065e-06, "loss": 1.121, "step": 10845 }, { "epoch": 0.25, "learning_rate": 8.767333434762105e-06, "loss": 0.8313, "step": 10846 }, { "epoch": 0.25, "learning_rate": 8.767086496047103e-06, "loss": 1.2028, "step": 10847 }, { "epoch": 0.25, "learning_rate": 8.766839536078457e-06, "loss": 1.0133, "step": 10848 }, { "epoch": 0.25, "learning_rate": 8.76659255485756e-06, "loss": 0.9692, "step": 10849 }, { "epoch": 0.25, "learning_rate": 8.766345552385802e-06, "loss": 0.8751, "step": 10850 }, { "epoch": 0.25, "learning_rate": 8.766098528664579e-06, "loss": 0.9026, "step": 10851 }, { "epoch": 0.25, "learning_rate": 8.765851483695284e-06, "loss": 0.9738, "step": 10852 }, { "epoch": 0.25, "learning_rate": 8.765604417479311e-06, "loss": 1.3377, "step": 10853 }, { "epoch": 0.25, "learning_rate": 8.765357330018056e-06, "loss": 0.8715, "step": 10854 }, { "epoch": 0.25, "learning_rate": 8.76511022131291e-06, "loss": 0.8808, "step": 10855 }, { "epoch": 0.25, "learning_rate": 8.764863091365267e-06, "loss": 1.2579, "step": 10856 }, { "epoch": 0.25, "learning_rate": 8.764615940176522e-06, "loss": 1.0502, "step": 10857 }, { "epoch": 0.25, "learning_rate": 8.764368767748073e-06, "loss": 0.7919, "step": 10858 }, { "epoch": 0.25, "learning_rate": 8.764121574081309e-06, "loss": 0.9809, "step": 10859 }, { "epoch": 0.25, "learning_rate": 8.763874359177628e-06, "loss": 1.0672, "step": 10860 }, { "epoch": 0.25, "learning_rate": 8.763627123038423e-06, "loss": 0.9981, "step": 10861 }, { "epoch": 0.25, "learning_rate": 8.763379865665091e-06, "loss": 0.8755, "step": 10862 }, { "epoch": 0.25, "learning_rate": 8.763132587059025e-06, "loss": 0.9002, "step": 10863 }, { "epoch": 0.25, "learning_rate": 8.762885287221621e-06, "loss": 0.6775, "step": 10864 }, { "epoch": 0.25, "learning_rate": 8.762637966154275e-06, "loss": 0.64, "step": 10865 }, { "epoch": 0.25, "learning_rate": 8.76239062385838e-06, "loss": 0.9706, "step": 10866 }, { "epoch": 0.25, "learning_rate": 8.762143260335334e-06, "loss": 0.9183, "step": 10867 }, { "epoch": 0.25, "learning_rate": 8.76189587558653e-06, "loss": 1.0422, "step": 10868 }, { "epoch": 0.25, "learning_rate": 8.76164846961337e-06, "loss": 1.2696, "step": 10869 }, { "epoch": 0.25, "learning_rate": 8.761401042417241e-06, "loss": 1.2086, "step": 10870 }, { "epoch": 0.25, "learning_rate": 8.761153593999544e-06, "loss": 0.7668, "step": 10871 }, { "epoch": 0.25, "learning_rate": 8.760906124361675e-06, "loss": 0.9247, "step": 10872 }, { "epoch": 0.25, "learning_rate": 8.760658633505027e-06, "loss": 0.7877, "step": 10873 }, { "epoch": 0.25, "learning_rate": 8.760411121431001e-06, "loss": 0.9311, "step": 10874 }, { "epoch": 0.25, "learning_rate": 8.760163588140991e-06, "loss": 1.1317, "step": 10875 }, { "epoch": 0.25, "learning_rate": 8.759916033636396e-06, "loss": 0.6144, "step": 10876 }, { "epoch": 0.25, "learning_rate": 8.759668457918606e-06, "loss": 1.0917, "step": 10877 }, { "epoch": 0.25, "learning_rate": 8.759420860989026e-06, "loss": 1.0484, "step": 10878 }, { "epoch": 0.25, "learning_rate": 8.759173242849046e-06, "loss": 0.936, "step": 10879 }, { "epoch": 0.25, "learning_rate": 8.758925603500069e-06, "loss": 0.9773, "step": 10880 }, { "epoch": 0.25, "learning_rate": 8.758677942943487e-06, "loss": 1.056, "step": 10881 }, { "epoch": 0.25, "learning_rate": 8.758430261180703e-06, "loss": 0.9436, "step": 10882 }, { "epoch": 0.25, "learning_rate": 8.758182558213109e-06, "loss": 0.8944, "step": 10883 }, { "epoch": 0.25, "learning_rate": 8.757934834042104e-06, "loss": 0.8288, "step": 10884 }, { "epoch": 0.25, "learning_rate": 8.757687088669088e-06, "loss": 0.7239, "step": 10885 }, { "epoch": 0.25, "learning_rate": 8.757439322095456e-06, "loss": 1.279, "step": 10886 }, { "epoch": 0.25, "learning_rate": 8.757191534322607e-06, "loss": 0.8532, "step": 10887 }, { "epoch": 0.25, "learning_rate": 8.756943725351938e-06, "loss": 0.8765, "step": 10888 }, { "epoch": 0.25, "learning_rate": 8.756695895184851e-06, "loss": 0.8178, "step": 10889 }, { "epoch": 0.25, "learning_rate": 8.756448043822738e-06, "loss": 0.771, "step": 10890 }, { "epoch": 0.25, "learning_rate": 8.756200171267003e-06, "loss": 1.3112, "step": 10891 }, { "epoch": 0.25, "learning_rate": 8.755952277519042e-06, "loss": 0.9963, "step": 10892 }, { "epoch": 0.25, "learning_rate": 8.755704362580253e-06, "loss": 0.9169, "step": 10893 }, { "epoch": 0.25, "learning_rate": 8.755456426452035e-06, "loss": 0.8623, "step": 10894 }, { "epoch": 0.25, "learning_rate": 8.755208469135787e-06, "loss": 1.0615, "step": 10895 }, { "epoch": 0.25, "learning_rate": 8.754960490632909e-06, "loss": 0.9672, "step": 10896 }, { "epoch": 0.25, "learning_rate": 8.7547124909448e-06, "loss": 1.0059, "step": 10897 }, { "epoch": 0.25, "learning_rate": 8.754464470072857e-06, "loss": 1.2139, "step": 10898 }, { "epoch": 0.25, "learning_rate": 8.754216428018481e-06, "loss": 1.1789, "step": 10899 }, { "epoch": 0.25, "learning_rate": 8.753968364783072e-06, "loss": 1.1896, "step": 10900 }, { "epoch": 0.25, "learning_rate": 8.75372028036803e-06, "loss": 0.9788, "step": 10901 }, { "epoch": 0.25, "learning_rate": 8.753472174774752e-06, "loss": 0.9297, "step": 10902 }, { "epoch": 0.25, "learning_rate": 8.753224048004639e-06, "loss": 1.1682, "step": 10903 }, { "epoch": 0.25, "learning_rate": 8.752975900059093e-06, "loss": 1.0935, "step": 10904 }, { "epoch": 0.25, "learning_rate": 8.75272773093951e-06, "loss": 1.0889, "step": 10905 }, { "epoch": 0.25, "learning_rate": 8.752479540647294e-06, "loss": 1.0413, "step": 10906 }, { "epoch": 0.25, "learning_rate": 8.752231329183843e-06, "loss": 1.0437, "step": 10907 }, { "epoch": 0.25, "learning_rate": 8.751983096550559e-06, "loss": 1.1485, "step": 10908 }, { "epoch": 0.25, "learning_rate": 8.751734842748839e-06, "loss": 1.2132, "step": 10909 }, { "epoch": 0.25, "learning_rate": 8.751486567780087e-06, "loss": 0.7885, "step": 10910 }, { "epoch": 0.25, "learning_rate": 8.751238271645705e-06, "loss": 1.2226, "step": 10911 }, { "epoch": 0.25, "learning_rate": 8.750989954347092e-06, "loss": 1.0019, "step": 10912 }, { "epoch": 0.25, "learning_rate": 8.750741615885646e-06, "loss": 0.8919, "step": 10913 }, { "epoch": 0.25, "learning_rate": 8.750493256262774e-06, "loss": 0.9171, "step": 10914 }, { "epoch": 0.25, "learning_rate": 8.750244875479871e-06, "loss": 1.0832, "step": 10915 }, { "epoch": 0.25, "learning_rate": 8.749996473538343e-06, "loss": 0.8314, "step": 10916 }, { "epoch": 0.25, "learning_rate": 8.74974805043959e-06, "loss": 1.1915, "step": 10917 }, { "epoch": 0.25, "learning_rate": 8.749499606185014e-06, "loss": 0.8312, "step": 10918 }, { "epoch": 0.25, "learning_rate": 8.749251140776016e-06, "loss": 1.0534, "step": 10919 }, { "epoch": 0.25, "learning_rate": 8.749002654213999e-06, "loss": 0.8242, "step": 10920 }, { "epoch": 0.25, "learning_rate": 8.748754146500363e-06, "loss": 0.9243, "step": 10921 }, { "epoch": 0.25, "learning_rate": 8.74850561763651e-06, "loss": 1.0604, "step": 10922 }, { "epoch": 0.25, "learning_rate": 8.748257067623844e-06, "loss": 1.174, "step": 10923 }, { "epoch": 0.25, "learning_rate": 8.748008496463768e-06, "loss": 0.7132, "step": 10924 }, { "epoch": 0.25, "learning_rate": 8.747759904157682e-06, "loss": 0.9508, "step": 10925 }, { "epoch": 0.25, "learning_rate": 8.747511290706989e-06, "loss": 1.0945, "step": 10926 }, { "epoch": 0.25, "learning_rate": 8.747262656113094e-06, "loss": 1.091, "step": 10927 }, { "epoch": 0.25, "learning_rate": 8.747014000377397e-06, "loss": 0.9541, "step": 10928 }, { "epoch": 0.25, "learning_rate": 8.7467653235013e-06, "loss": 1.0976, "step": 10929 }, { "epoch": 0.25, "learning_rate": 8.74651662548621e-06, "loss": 0.7736, "step": 10930 }, { "epoch": 0.25, "learning_rate": 8.746267906333528e-06, "loss": 1.084, "step": 10931 }, { "epoch": 0.25, "learning_rate": 8.746019166044657e-06, "loss": 1.0694, "step": 10932 }, { "epoch": 0.25, "learning_rate": 8.745770404621e-06, "loss": 1.2219, "step": 10933 }, { "epoch": 0.25, "learning_rate": 8.745521622063961e-06, "loss": 0.9564, "step": 10934 }, { "epoch": 0.25, "learning_rate": 8.745272818374945e-06, "loss": 0.8903, "step": 10935 }, { "epoch": 0.25, "learning_rate": 8.745023993555356e-06, "loss": 0.8333, "step": 10936 }, { "epoch": 0.25, "learning_rate": 8.744775147606592e-06, "loss": 0.941, "step": 10937 }, { "epoch": 0.25, "learning_rate": 8.744526280530065e-06, "loss": 0.9465, "step": 10938 }, { "epoch": 0.25, "learning_rate": 8.744277392327175e-06, "loss": 1.1022, "step": 10939 }, { "epoch": 0.25, "learning_rate": 8.744028482999325e-06, "loss": 1.1236, "step": 10940 }, { "epoch": 0.25, "learning_rate": 8.743779552547921e-06, "loss": 1.0612, "step": 10941 }, { "epoch": 0.25, "learning_rate": 8.743530600974368e-06, "loss": 1.0558, "step": 10942 }, { "epoch": 0.25, "learning_rate": 8.743281628280071e-06, "loss": 0.8432, "step": 10943 }, { "epoch": 0.25, "learning_rate": 8.743032634466431e-06, "loss": 1.074, "step": 10944 }, { "epoch": 0.25, "learning_rate": 8.742783619534858e-06, "loss": 0.7684, "step": 10945 }, { "epoch": 0.25, "learning_rate": 8.742534583486755e-06, "loss": 0.7753, "step": 10946 }, { "epoch": 0.25, "learning_rate": 8.742285526323524e-06, "loss": 1.0869, "step": 10947 }, { "epoch": 0.25, "learning_rate": 8.742036448046574e-06, "loss": 0.5187, "step": 10948 }, { "epoch": 0.25, "learning_rate": 8.741787348657309e-06, "loss": 1.0126, "step": 10949 }, { "epoch": 0.25, "learning_rate": 8.741538228157133e-06, "loss": 1.177, "step": 10950 }, { "epoch": 0.25, "learning_rate": 8.741289086547454e-06, "loss": 0.9271, "step": 10951 }, { "epoch": 0.25, "learning_rate": 8.741039923829675e-06, "loss": 1.0081, "step": 10952 }, { "epoch": 0.25, "learning_rate": 8.740790740005205e-06, "loss": 0.8226, "step": 10953 }, { "epoch": 0.25, "learning_rate": 8.740541535075449e-06, "loss": 0.7918, "step": 10954 }, { "epoch": 0.25, "learning_rate": 8.74029230904181e-06, "loss": 0.9644, "step": 10955 }, { "epoch": 0.25, "learning_rate": 8.740043061905696e-06, "loss": 1.2279, "step": 10956 }, { "epoch": 0.25, "learning_rate": 8.739793793668514e-06, "loss": 0.8234, "step": 10957 }, { "epoch": 0.25, "learning_rate": 8.739544504331672e-06, "loss": 0.8358, "step": 10958 }, { "epoch": 0.25, "learning_rate": 8.739295193896571e-06, "loss": 0.8934, "step": 10959 }, { "epoch": 0.25, "learning_rate": 8.739045862364623e-06, "loss": 0.9757, "step": 10960 }, { "epoch": 0.25, "learning_rate": 8.73879650973723e-06, "loss": 0.9698, "step": 10961 }, { "epoch": 0.25, "learning_rate": 8.738547136015805e-06, "loss": 1.1575, "step": 10962 }, { "epoch": 0.25, "learning_rate": 8.73829774120175e-06, "loss": 0.7956, "step": 10963 }, { "epoch": 0.25, "learning_rate": 8.738048325296472e-06, "loss": 1.2272, "step": 10964 }, { "epoch": 0.25, "learning_rate": 8.737798888301381e-06, "loss": 1.002, "step": 10965 }, { "epoch": 0.25, "learning_rate": 8.737549430217883e-06, "loss": 1.1768, "step": 10966 }, { "epoch": 0.25, "learning_rate": 8.737299951047384e-06, "loss": 0.9372, "step": 10967 }, { "epoch": 0.25, "learning_rate": 8.737050450791293e-06, "loss": 0.9199, "step": 10968 }, { "epoch": 0.25, "learning_rate": 8.736800929451019e-06, "loss": 0.831, "step": 10969 }, { "epoch": 0.25, "learning_rate": 8.736551387027968e-06, "loss": 0.9778, "step": 10970 }, { "epoch": 0.25, "learning_rate": 8.736301823523547e-06, "loss": 0.8461, "step": 10971 }, { "epoch": 0.25, "learning_rate": 8.736052238939166e-06, "loss": 0.923, "step": 10972 }, { "epoch": 0.25, "learning_rate": 8.735802633276234e-06, "loss": 0.912, "step": 10973 }, { "epoch": 0.25, "learning_rate": 8.735553006536155e-06, "loss": 0.9995, "step": 10974 }, { "epoch": 0.25, "learning_rate": 8.735303358720341e-06, "loss": 0.8134, "step": 10975 }, { "epoch": 0.25, "learning_rate": 8.7350536898302e-06, "loss": 1.0122, "step": 10976 }, { "epoch": 0.25, "learning_rate": 8.73480399986714e-06, "loss": 1.094, "step": 10977 }, { "epoch": 0.25, "learning_rate": 8.73455428883257e-06, "loss": 0.9366, "step": 10978 }, { "epoch": 0.25, "learning_rate": 8.734304556727896e-06, "loss": 0.9448, "step": 10979 }, { "epoch": 0.25, "learning_rate": 8.734054803554535e-06, "loss": 0.8885, "step": 10980 }, { "epoch": 0.25, "learning_rate": 8.733805029313887e-06, "loss": 0.9431, "step": 10981 }, { "epoch": 0.25, "learning_rate": 8.733555234007366e-06, "loss": 0.81, "step": 10982 }, { "epoch": 0.25, "learning_rate": 8.73330541763638e-06, "loss": 0.9446, "step": 10983 }, { "epoch": 0.25, "learning_rate": 8.733055580202339e-06, "loss": 0.9102, "step": 10984 }, { "epoch": 0.25, "learning_rate": 8.732805721706651e-06, "loss": 0.8454, "step": 10985 }, { "epoch": 0.25, "learning_rate": 8.73255584215073e-06, "loss": 0.7343, "step": 10986 }, { "epoch": 0.25, "learning_rate": 8.732305941535981e-06, "loss": 1.0721, "step": 10987 }, { "epoch": 0.25, "learning_rate": 8.732056019863816e-06, "loss": 0.9416, "step": 10988 }, { "epoch": 0.25, "learning_rate": 8.731806077135645e-06, "loss": 0.6713, "step": 10989 }, { "epoch": 0.25, "learning_rate": 8.731556113352877e-06, "loss": 0.9067, "step": 10990 }, { "epoch": 0.25, "learning_rate": 8.731306128516925e-06, "loss": 0.8336, "step": 10991 }, { "epoch": 0.25, "learning_rate": 8.731056122629196e-06, "loss": 0.9041, "step": 10992 }, { "epoch": 0.25, "learning_rate": 8.730806095691102e-06, "loss": 0.9036, "step": 10993 }, { "epoch": 0.25, "learning_rate": 8.730556047704056e-06, "loss": 1.0642, "step": 10994 }, { "epoch": 0.25, "learning_rate": 8.730305978669464e-06, "loss": 1.1359, "step": 10995 }, { "epoch": 0.26, "learning_rate": 8.730055888588741e-06, "loss": 1.1269, "step": 10996 }, { "epoch": 0.26, "learning_rate": 8.729805777463296e-06, "loss": 1.1359, "step": 10997 }, { "epoch": 0.26, "learning_rate": 8.729555645294541e-06, "loss": 1.1562, "step": 10998 }, { "epoch": 0.26, "learning_rate": 8.729305492083886e-06, "loss": 1.1779, "step": 10999 }, { "epoch": 0.26, "learning_rate": 8.729055317832741e-06, "loss": 0.9444, "step": 11000 }, { "epoch": 0.26, "learning_rate": 8.728805122542524e-06, "loss": 1.1263, "step": 11001 }, { "epoch": 0.26, "learning_rate": 8.728554906214638e-06, "loss": 0.9701, "step": 11002 }, { "epoch": 0.26, "learning_rate": 8.728304668850502e-06, "loss": 1.0653, "step": 11003 }, { "epoch": 0.26, "learning_rate": 8.728054410451524e-06, "loss": 1.1, "step": 11004 }, { "epoch": 0.26, "learning_rate": 8.727804131019115e-06, "loss": 1.1454, "step": 11005 }, { "epoch": 0.26, "learning_rate": 8.72755383055469e-06, "loss": 1.2151, "step": 11006 }, { "epoch": 0.26, "learning_rate": 8.72730350905966e-06, "loss": 0.9399, "step": 11007 }, { "epoch": 0.26, "learning_rate": 8.727053166535435e-06, "loss": 1.1318, "step": 11008 }, { "epoch": 0.26, "learning_rate": 8.726802802983432e-06, "loss": 0.8008, "step": 11009 }, { "epoch": 0.26, "learning_rate": 8.72655241840506e-06, "loss": 0.9208, "step": 11010 }, { "epoch": 0.26, "learning_rate": 8.726302012801731e-06, "loss": 1.1339, "step": 11011 }, { "epoch": 0.26, "learning_rate": 8.726051586174862e-06, "loss": 0.9016, "step": 11012 }, { "epoch": 0.26, "learning_rate": 8.725801138525864e-06, "loss": 1.1248, "step": 11013 }, { "epoch": 0.26, "learning_rate": 8.725550669856148e-06, "loss": 0.8817, "step": 11014 }, { "epoch": 0.26, "learning_rate": 8.72530018016713e-06, "loss": 1.0227, "step": 11015 }, { "epoch": 0.26, "learning_rate": 8.72504966946022e-06, "loss": 1.2111, "step": 11016 }, { "epoch": 0.26, "learning_rate": 8.724799137736833e-06, "loss": 1.0525, "step": 11017 }, { "epoch": 0.26, "learning_rate": 8.724548584998383e-06, "loss": 0.8234, "step": 11018 }, { "epoch": 0.26, "learning_rate": 8.724298011246283e-06, "loss": 0.8565, "step": 11019 }, { "epoch": 0.26, "learning_rate": 8.724047416481948e-06, "loss": 1.1892, "step": 11020 }, { "epoch": 0.26, "learning_rate": 8.72379680070679e-06, "loss": 1.2631, "step": 11021 }, { "epoch": 0.26, "learning_rate": 8.723546163922223e-06, "loss": 1.1456, "step": 11022 }, { "epoch": 0.26, "learning_rate": 8.723295506129663e-06, "loss": 0.8112, "step": 11023 }, { "epoch": 0.26, "learning_rate": 8.723044827330524e-06, "loss": 1.1633, "step": 11024 }, { "epoch": 0.26, "learning_rate": 8.722794127526217e-06, "loss": 0.9835, "step": 11025 }, { "epoch": 0.26, "learning_rate": 8.72254340671816e-06, "loss": 0.8575, "step": 11026 }, { "epoch": 0.26, "learning_rate": 8.722292664907768e-06, "loss": 1.3215, "step": 11027 }, { "epoch": 0.26, "learning_rate": 8.722041902096453e-06, "loss": 0.7179, "step": 11028 }, { "epoch": 0.26, "learning_rate": 8.721791118285629e-06, "loss": 0.8335, "step": 11029 }, { "epoch": 0.26, "learning_rate": 8.721540313476713e-06, "loss": 1.0191, "step": 11030 }, { "epoch": 0.26, "learning_rate": 8.72128948767112e-06, "loss": 1.02, "step": 11031 }, { "epoch": 0.26, "learning_rate": 8.721038640870265e-06, "loss": 1.0784, "step": 11032 }, { "epoch": 0.26, "learning_rate": 8.720787773075564e-06, "loss": 1.2327, "step": 11033 }, { "epoch": 0.26, "learning_rate": 8.72053688428843e-06, "loss": 1.1025, "step": 11034 }, { "epoch": 0.26, "learning_rate": 8.72028597451028e-06, "loss": 1.1656, "step": 11035 }, { "epoch": 0.26, "learning_rate": 8.720035043742532e-06, "loss": 1.0342, "step": 11036 }, { "epoch": 0.26, "learning_rate": 8.719784091986598e-06, "loss": 0.9987, "step": 11037 }, { "epoch": 0.26, "learning_rate": 8.719533119243894e-06, "loss": 1.1833, "step": 11038 }, { "epoch": 0.26, "learning_rate": 8.719282125515838e-06, "loss": 1.0931, "step": 11039 }, { "epoch": 0.26, "learning_rate": 8.719031110803845e-06, "loss": 0.8247, "step": 11040 }, { "epoch": 0.26, "learning_rate": 8.718780075109333e-06, "loss": 1.0464, "step": 11041 }, { "epoch": 0.26, "learning_rate": 8.718529018433714e-06, "loss": 1.143, "step": 11042 }, { "epoch": 0.26, "learning_rate": 8.71827794077841e-06, "loss": 0.8569, "step": 11043 }, { "epoch": 0.26, "learning_rate": 8.718026842144832e-06, "loss": 1.0069, "step": 11044 }, { "epoch": 0.26, "learning_rate": 8.717775722534401e-06, "loss": 1.0109, "step": 11045 }, { "epoch": 0.26, "learning_rate": 8.717524581948531e-06, "loss": 0.9674, "step": 11046 }, { "epoch": 0.26, "learning_rate": 8.717273420388642e-06, "loss": 0.9855, "step": 11047 }, { "epoch": 0.26, "learning_rate": 8.717022237856149e-06, "loss": 1.0221, "step": 11048 }, { "epoch": 0.26, "learning_rate": 8.716771034352468e-06, "loss": 1.0277, "step": 11049 }, { "epoch": 0.26, "learning_rate": 8.716519809879018e-06, "loss": 0.8218, "step": 11050 }, { "epoch": 0.26, "learning_rate": 8.716268564437219e-06, "loss": 1.2107, "step": 11051 }, { "epoch": 0.26, "learning_rate": 8.71601729802848e-06, "loss": 0.7934, "step": 11052 }, { "epoch": 0.26, "learning_rate": 8.715766010654229e-06, "loss": 1.081, "step": 11053 }, { "epoch": 0.26, "learning_rate": 8.715514702315877e-06, "loss": 0.9513, "step": 11054 }, { "epoch": 0.26, "learning_rate": 8.715263373014844e-06, "loss": 0.881, "step": 11055 }, { "epoch": 0.26, "learning_rate": 8.715012022752547e-06, "loss": 0.7791, "step": 11056 }, { "epoch": 0.26, "learning_rate": 8.714760651530405e-06, "loss": 0.9282, "step": 11057 }, { "epoch": 0.26, "learning_rate": 8.714509259349837e-06, "loss": 1.096, "step": 11058 }, { "epoch": 0.26, "learning_rate": 8.71425784621226e-06, "loss": 1.1454, "step": 11059 }, { "epoch": 0.26, "learning_rate": 8.714006412119094e-06, "loss": 0.9895, "step": 11060 }, { "epoch": 0.26, "learning_rate": 8.713754957071755e-06, "loss": 1.2629, "step": 11061 }, { "epoch": 0.26, "learning_rate": 8.713503481071663e-06, "loss": 0.9547, "step": 11062 }, { "epoch": 0.26, "learning_rate": 8.713251984120238e-06, "loss": 0.9472, "step": 11063 }, { "epoch": 0.26, "learning_rate": 8.713000466218897e-06, "loss": 0.946, "step": 11064 }, { "epoch": 0.26, "learning_rate": 8.71274892736906e-06, "loss": 1.0084, "step": 11065 }, { "epoch": 0.26, "learning_rate": 8.712497367572147e-06, "loss": 0.8339, "step": 11066 }, { "epoch": 0.26, "learning_rate": 8.712245786829577e-06, "loss": 0.8369, "step": 11067 }, { "epoch": 0.26, "learning_rate": 8.711994185142767e-06, "loss": 0.9355, "step": 11068 }, { "epoch": 0.26, "learning_rate": 8.711742562513138e-06, "loss": 1.0167, "step": 11069 }, { "epoch": 0.26, "learning_rate": 8.71149091894211e-06, "loss": 1.078, "step": 11070 }, { "epoch": 0.26, "learning_rate": 8.711239254431103e-06, "loss": 1.0211, "step": 11071 }, { "epoch": 0.26, "learning_rate": 8.710987568981537e-06, "loss": 0.9931, "step": 11072 }, { "epoch": 0.26, "learning_rate": 8.710735862594832e-06, "loss": 1.2973, "step": 11073 }, { "epoch": 0.26, "learning_rate": 8.710484135272407e-06, "loss": 1.2382, "step": 11074 }, { "epoch": 0.26, "learning_rate": 8.710232387015685e-06, "loss": 1.1045, "step": 11075 }, { "epoch": 0.26, "learning_rate": 8.70998061782608e-06, "loss": 1.136, "step": 11076 }, { "epoch": 0.26, "learning_rate": 8.70972882770502e-06, "loss": 1.1958, "step": 11077 }, { "epoch": 0.26, "learning_rate": 8.709477016653922e-06, "loss": 1.2491, "step": 11078 }, { "epoch": 0.26, "learning_rate": 8.709225184674205e-06, "loss": 0.8848, "step": 11079 }, { "epoch": 0.26, "learning_rate": 8.708973331767295e-06, "loss": 0.8028, "step": 11080 }, { "epoch": 0.26, "learning_rate": 8.708721457934606e-06, "loss": 0.8019, "step": 11081 }, { "epoch": 0.26, "learning_rate": 8.708469563177566e-06, "loss": 1.2566, "step": 11082 }, { "epoch": 0.26, "learning_rate": 8.708217647497593e-06, "loss": 1.2784, "step": 11083 }, { "epoch": 0.26, "learning_rate": 8.707965710896106e-06, "loss": 0.9107, "step": 11084 }, { "epoch": 0.26, "learning_rate": 8.707713753374529e-06, "loss": 0.9956, "step": 11085 }, { "epoch": 0.26, "learning_rate": 8.707461774934285e-06, "loss": 0.8587, "step": 11086 }, { "epoch": 0.26, "learning_rate": 8.707209775576792e-06, "loss": 1.1581, "step": 11087 }, { "epoch": 0.26, "learning_rate": 8.706957755303474e-06, "loss": 0.8434, "step": 11088 }, { "epoch": 0.26, "learning_rate": 8.706705714115752e-06, "loss": 1.0433, "step": 11089 }, { "epoch": 0.26, "learning_rate": 8.70645365201505e-06, "loss": 1.1646, "step": 11090 }, { "epoch": 0.26, "learning_rate": 8.706201569002787e-06, "loss": 1.0984, "step": 11091 }, { "epoch": 0.26, "learning_rate": 8.705949465080389e-06, "loss": 0.7649, "step": 11092 }, { "epoch": 0.26, "learning_rate": 8.705697340249275e-06, "loss": 1.0114, "step": 11093 }, { "epoch": 0.26, "learning_rate": 8.705445194510868e-06, "loss": 1.0779, "step": 11094 }, { "epoch": 0.26, "learning_rate": 8.705193027866591e-06, "loss": 0.9039, "step": 11095 }, { "epoch": 0.26, "learning_rate": 8.70494084031787e-06, "loss": 0.8184, "step": 11096 }, { "epoch": 0.26, "learning_rate": 8.704688631866121e-06, "loss": 0.8993, "step": 11097 }, { "epoch": 0.26, "learning_rate": 8.704436402512773e-06, "loss": 1.0008, "step": 11098 }, { "epoch": 0.26, "learning_rate": 8.704184152259246e-06, "loss": 0.8739, "step": 11099 }, { "epoch": 0.26, "learning_rate": 8.703931881106965e-06, "loss": 1.1354, "step": 11100 }, { "epoch": 0.26, "learning_rate": 8.70367958905735e-06, "loss": 1.222, "step": 11101 }, { "epoch": 0.26, "learning_rate": 8.703427276111828e-06, "loss": 0.98, "step": 11102 }, { "epoch": 0.26, "learning_rate": 8.703174942271821e-06, "loss": 1.0874, "step": 11103 }, { "epoch": 0.26, "learning_rate": 8.702922587538754e-06, "loss": 0.9224, "step": 11104 }, { "epoch": 0.26, "learning_rate": 8.702670211914049e-06, "loss": 1.0224, "step": 11105 }, { "epoch": 0.26, "learning_rate": 8.702417815399131e-06, "loss": 1.049, "step": 11106 }, { "epoch": 0.26, "learning_rate": 8.702165397995422e-06, "loss": 0.9267, "step": 11107 }, { "epoch": 0.26, "learning_rate": 8.701912959704348e-06, "loss": 0.9474, "step": 11108 }, { "epoch": 0.26, "learning_rate": 8.701660500527334e-06, "loss": 0.938, "step": 11109 }, { "epoch": 0.26, "learning_rate": 8.701408020465803e-06, "loss": 0.9286, "step": 11110 }, { "epoch": 0.26, "learning_rate": 8.701155519521178e-06, "loss": 0.9224, "step": 11111 }, { "epoch": 0.26, "learning_rate": 8.700902997694888e-06, "loss": 1.0384, "step": 11112 }, { "epoch": 0.26, "learning_rate": 8.700650454988353e-06, "loss": 1.2316, "step": 11113 }, { "epoch": 0.26, "learning_rate": 8.700397891403e-06, "loss": 1.0221, "step": 11114 }, { "epoch": 0.26, "learning_rate": 8.700145306940255e-06, "loss": 1.0373, "step": 11115 }, { "epoch": 0.26, "learning_rate": 8.699892701601542e-06, "loss": 0.962, "step": 11116 }, { "epoch": 0.26, "learning_rate": 8.699640075388285e-06, "loss": 1.1562, "step": 11117 }, { "epoch": 0.26, "learning_rate": 8.699387428301911e-06, "loss": 1.0021, "step": 11118 }, { "epoch": 0.26, "learning_rate": 8.699134760343844e-06, "loss": 0.7966, "step": 11119 }, { "epoch": 0.26, "learning_rate": 8.69888207151551e-06, "loss": 0.8536, "step": 11120 }, { "epoch": 0.26, "learning_rate": 8.698629361818336e-06, "loss": 1.0953, "step": 11121 }, { "epoch": 0.26, "learning_rate": 8.698376631253746e-06, "loss": 0.6255, "step": 11122 }, { "epoch": 0.26, "learning_rate": 8.698123879823167e-06, "loss": 1.2221, "step": 11123 }, { "epoch": 0.26, "learning_rate": 8.697871107528025e-06, "loss": 0.9043, "step": 11124 }, { "epoch": 0.26, "learning_rate": 8.697618314369745e-06, "loss": 1.197, "step": 11125 }, { "epoch": 0.26, "learning_rate": 8.697365500349755e-06, "loss": 0.9301, "step": 11126 }, { "epoch": 0.26, "learning_rate": 8.697112665469478e-06, "loss": 0.9449, "step": 11127 }, { "epoch": 0.26, "learning_rate": 8.696859809730344e-06, "loss": 0.8741, "step": 11128 }, { "epoch": 0.26, "learning_rate": 8.69660693313378e-06, "loss": 1.0272, "step": 11129 }, { "epoch": 0.26, "learning_rate": 8.69635403568121e-06, "loss": 1.0932, "step": 11130 }, { "epoch": 0.26, "learning_rate": 8.696101117374061e-06, "loss": 1.0214, "step": 11131 }, { "epoch": 0.26, "learning_rate": 8.695848178213762e-06, "loss": 0.8699, "step": 11132 }, { "epoch": 0.26, "learning_rate": 8.69559521820174e-06, "loss": 0.7962, "step": 11133 }, { "epoch": 0.26, "learning_rate": 8.695342237339419e-06, "loss": 1.0015, "step": 11134 }, { "epoch": 0.26, "learning_rate": 8.695089235628229e-06, "loss": 1.1186, "step": 11135 }, { "epoch": 0.26, "learning_rate": 8.694836213069597e-06, "loss": 0.9257, "step": 11136 }, { "epoch": 0.26, "learning_rate": 8.694583169664951e-06, "loss": 0.8445, "step": 11137 }, { "epoch": 0.26, "learning_rate": 8.694330105415718e-06, "loss": 1.1635, "step": 11138 }, { "epoch": 0.26, "learning_rate": 8.694077020323326e-06, "loss": 1.0036, "step": 11139 }, { "epoch": 0.26, "learning_rate": 8.693823914389201e-06, "loss": 0.6902, "step": 11140 }, { "epoch": 0.26, "learning_rate": 8.693570787614776e-06, "loss": 1.0253, "step": 11141 }, { "epoch": 0.26, "learning_rate": 8.693317640001473e-06, "loss": 1.2627, "step": 11142 }, { "epoch": 0.26, "learning_rate": 8.693064471550724e-06, "loss": 0.8937, "step": 11143 }, { "epoch": 0.26, "learning_rate": 8.692811282263956e-06, "loss": 0.8883, "step": 11144 }, { "epoch": 0.26, "learning_rate": 8.692558072142598e-06, "loss": 1.0407, "step": 11145 }, { "epoch": 0.26, "learning_rate": 8.69230484118808e-06, "loss": 1.1231, "step": 11146 }, { "epoch": 0.26, "learning_rate": 8.692051589401827e-06, "loss": 0.8774, "step": 11147 }, { "epoch": 0.26, "learning_rate": 8.691798316785272e-06, "loss": 0.9252, "step": 11148 }, { "epoch": 0.26, "learning_rate": 8.691545023339842e-06, "loss": 1.2841, "step": 11149 }, { "epoch": 0.26, "learning_rate": 8.691291709066965e-06, "loss": 1.1545, "step": 11150 }, { "epoch": 0.26, "learning_rate": 8.691038373968071e-06, "loss": 1.1871, "step": 11151 }, { "epoch": 0.26, "learning_rate": 8.690785018044589e-06, "loss": 1.0417, "step": 11152 }, { "epoch": 0.26, "learning_rate": 8.69053164129795e-06, "loss": 0.9074, "step": 11153 }, { "epoch": 0.26, "learning_rate": 8.690278243729584e-06, "loss": 1.1434, "step": 11154 }, { "epoch": 0.26, "learning_rate": 8.690024825340917e-06, "loss": 1.0625, "step": 11155 }, { "epoch": 0.26, "learning_rate": 8.689771386133383e-06, "loss": 0.7575, "step": 11156 }, { "epoch": 0.26, "learning_rate": 8.689517926108408e-06, "loss": 1.0972, "step": 11157 }, { "epoch": 0.26, "learning_rate": 8.689264445267424e-06, "loss": 1.0066, "step": 11158 }, { "epoch": 0.26, "learning_rate": 8.689010943611862e-06, "loss": 0.7141, "step": 11159 }, { "epoch": 0.26, "learning_rate": 8.68875742114315e-06, "loss": 1.0891, "step": 11160 }, { "epoch": 0.26, "learning_rate": 8.68850387786272e-06, "loss": 0.7166, "step": 11161 }, { "epoch": 0.26, "learning_rate": 8.688250313772003e-06, "loss": 0.7589, "step": 11162 }, { "epoch": 0.26, "learning_rate": 8.687996728872427e-06, "loss": 1.0063, "step": 11163 }, { "epoch": 0.26, "learning_rate": 8.687743123165424e-06, "loss": 1.3476, "step": 11164 }, { "epoch": 0.26, "learning_rate": 8.687489496652427e-06, "loss": 1.1944, "step": 11165 }, { "epoch": 0.26, "learning_rate": 8.687235849334864e-06, "loss": 1.0595, "step": 11166 }, { "epoch": 0.26, "learning_rate": 8.686982181214167e-06, "loss": 1.2753, "step": 11167 }, { "epoch": 0.26, "learning_rate": 8.686728492291767e-06, "loss": 0.9812, "step": 11168 }, { "epoch": 0.26, "learning_rate": 8.686474782569096e-06, "loss": 0.9753, "step": 11169 }, { "epoch": 0.26, "learning_rate": 8.686221052047585e-06, "loss": 1.2398, "step": 11170 }, { "epoch": 0.26, "learning_rate": 8.685967300728668e-06, "loss": 1.2343, "step": 11171 }, { "epoch": 0.26, "learning_rate": 8.68571352861377e-06, "loss": 1.4104, "step": 11172 }, { "epoch": 0.26, "learning_rate": 8.685459735704328e-06, "loss": 1.0798, "step": 11173 }, { "epoch": 0.26, "learning_rate": 8.685205922001777e-06, "loss": 1.0977, "step": 11174 }, { "epoch": 0.26, "learning_rate": 8.68495208750754e-06, "loss": 0.7083, "step": 11175 }, { "epoch": 0.26, "learning_rate": 8.684698232223057e-06, "loss": 1.1986, "step": 11176 }, { "epoch": 0.26, "learning_rate": 8.684444356149754e-06, "loss": 0.6998, "step": 11177 }, { "epoch": 0.26, "learning_rate": 8.68419045928907e-06, "loss": 1.1723, "step": 11178 }, { "epoch": 0.26, "learning_rate": 8.683936541642433e-06, "loss": 1.0641, "step": 11179 }, { "epoch": 0.26, "learning_rate": 8.683682603211275e-06, "loss": 1.0935, "step": 11180 }, { "epoch": 0.26, "learning_rate": 8.683428643997031e-06, "loss": 0.878, "step": 11181 }, { "epoch": 0.26, "learning_rate": 8.683174664001136e-06, "loss": 0.97, "step": 11182 }, { "epoch": 0.26, "learning_rate": 8.682920663225016e-06, "loss": 0.9862, "step": 11183 }, { "epoch": 0.26, "learning_rate": 8.68266664167011e-06, "loss": 0.8956, "step": 11184 }, { "epoch": 0.26, "learning_rate": 8.682412599337848e-06, "loss": 0.9934, "step": 11185 }, { "epoch": 0.26, "learning_rate": 8.682158536229665e-06, "loss": 0.7987, "step": 11186 }, { "epoch": 0.26, "learning_rate": 8.681904452346997e-06, "loss": 1.2199, "step": 11187 }, { "epoch": 0.26, "learning_rate": 8.68165034769127e-06, "loss": 0.7707, "step": 11188 }, { "epoch": 0.26, "learning_rate": 8.681396222263926e-06, "loss": 0.855, "step": 11189 }, { "epoch": 0.26, "learning_rate": 8.681142076066393e-06, "loss": 0.8828, "step": 11190 }, { "epoch": 0.26, "learning_rate": 8.680887909100106e-06, "loss": 0.9914, "step": 11191 }, { "epoch": 0.26, "learning_rate": 8.680633721366502e-06, "loss": 0.927, "step": 11192 }, { "epoch": 0.26, "learning_rate": 8.680379512867013e-06, "loss": 0.907, "step": 11193 }, { "epoch": 0.26, "learning_rate": 8.68012528360307e-06, "loss": 0.7326, "step": 11194 }, { "epoch": 0.26, "learning_rate": 8.679871033576112e-06, "loss": 1.1079, "step": 11195 }, { "epoch": 0.26, "learning_rate": 8.679616762787573e-06, "loss": 1.0411, "step": 11196 }, { "epoch": 0.26, "learning_rate": 8.679362471238886e-06, "loss": 0.984, "step": 11197 }, { "epoch": 0.26, "learning_rate": 8.679108158931487e-06, "loss": 1.1049, "step": 11198 }, { "epoch": 0.26, "learning_rate": 8.67885382586681e-06, "loss": 1.006, "step": 11199 }, { "epoch": 0.26, "learning_rate": 8.678599472046287e-06, "loss": 1.1098, "step": 11200 }, { "epoch": 0.26, "learning_rate": 8.678345097471359e-06, "loss": 0.696, "step": 11201 }, { "epoch": 0.26, "learning_rate": 8.678090702143456e-06, "loss": 0.9799, "step": 11202 }, { "epoch": 0.26, "learning_rate": 8.677836286064016e-06, "loss": 1.1574, "step": 11203 }, { "epoch": 0.26, "learning_rate": 8.677581849234475e-06, "loss": 1.1187, "step": 11204 }, { "epoch": 0.26, "learning_rate": 8.677327391656267e-06, "loss": 1.0113, "step": 11205 }, { "epoch": 0.26, "learning_rate": 8.677072913330828e-06, "loss": 1.0295, "step": 11206 }, { "epoch": 0.26, "learning_rate": 8.676818414259593e-06, "loss": 1.0672, "step": 11207 }, { "epoch": 0.26, "learning_rate": 8.676563894443998e-06, "loss": 1.1026, "step": 11208 }, { "epoch": 0.26, "learning_rate": 8.676309353885483e-06, "loss": 1.0964, "step": 11209 }, { "epoch": 0.26, "learning_rate": 8.676054792585477e-06, "loss": 0.9392, "step": 11210 }, { "epoch": 0.26, "learning_rate": 8.675800210545422e-06, "loss": 0.9669, "step": 11211 }, { "epoch": 0.26, "learning_rate": 8.675545607766751e-06, "loss": 0.9808, "step": 11212 }, { "epoch": 0.26, "learning_rate": 8.675290984250903e-06, "loss": 0.7053, "step": 11213 }, { "epoch": 0.26, "learning_rate": 8.675036339999312e-06, "loss": 0.7073, "step": 11214 }, { "epoch": 0.26, "learning_rate": 8.674781675013417e-06, "loss": 1.0609, "step": 11215 }, { "epoch": 0.26, "learning_rate": 8.674526989294652e-06, "loss": 0.9403, "step": 11216 }, { "epoch": 0.26, "learning_rate": 8.674272282844458e-06, "loss": 1.0956, "step": 11217 }, { "epoch": 0.26, "learning_rate": 8.674017555664268e-06, "loss": 0.7909, "step": 11218 }, { "epoch": 0.26, "learning_rate": 8.673762807755522e-06, "loss": 1.2771, "step": 11219 }, { "epoch": 0.26, "learning_rate": 8.673508039119655e-06, "loss": 0.9003, "step": 11220 }, { "epoch": 0.26, "learning_rate": 8.673253249758107e-06, "loss": 1.0185, "step": 11221 }, { "epoch": 0.26, "learning_rate": 8.672998439672314e-06, "loss": 0.8864, "step": 11222 }, { "epoch": 0.26, "learning_rate": 8.672743608863712e-06, "loss": 1.0627, "step": 11223 }, { "epoch": 0.26, "learning_rate": 8.672488757333741e-06, "loss": 0.8911, "step": 11224 }, { "epoch": 0.26, "learning_rate": 8.672233885083839e-06, "loss": 1.0307, "step": 11225 }, { "epoch": 0.26, "learning_rate": 8.671978992115441e-06, "loss": 0.6602, "step": 11226 }, { "epoch": 0.26, "learning_rate": 8.67172407842999e-06, "loss": 0.6569, "step": 11227 }, { "epoch": 0.26, "learning_rate": 8.671469144028918e-06, "loss": 0.6853, "step": 11228 }, { "epoch": 0.26, "learning_rate": 8.671214188913671e-06, "loss": 1.0858, "step": 11229 }, { "epoch": 0.26, "learning_rate": 8.670959213085681e-06, "loss": 1.0257, "step": 11230 }, { "epoch": 0.26, "learning_rate": 8.67070421654639e-06, "loss": 0.8445, "step": 11231 }, { "epoch": 0.26, "learning_rate": 8.670449199297233e-06, "loss": 1.0804, "step": 11232 }, { "epoch": 0.26, "learning_rate": 8.670194161339655e-06, "loss": 1.1013, "step": 11233 }, { "epoch": 0.26, "learning_rate": 8.669939102675089e-06, "loss": 1.0645, "step": 11234 }, { "epoch": 0.26, "learning_rate": 8.669684023304975e-06, "loss": 0.9601, "step": 11235 }, { "epoch": 0.26, "learning_rate": 8.669428923230756e-06, "loss": 1.0395, "step": 11236 }, { "epoch": 0.26, "learning_rate": 8.669173802453867e-06, "loss": 0.9171, "step": 11237 }, { "epoch": 0.26, "learning_rate": 8.668918660975749e-06, "loss": 0.7679, "step": 11238 }, { "epoch": 0.26, "learning_rate": 8.668663498797842e-06, "loss": 1.1113, "step": 11239 }, { "epoch": 0.26, "learning_rate": 8.668408315921587e-06, "loss": 0.9772, "step": 11240 }, { "epoch": 0.26, "learning_rate": 8.668153112348418e-06, "loss": 1.1751, "step": 11241 }, { "epoch": 0.26, "learning_rate": 8.66789788807978e-06, "loss": 1.1063, "step": 11242 }, { "epoch": 0.26, "learning_rate": 8.667642643117112e-06, "loss": 1.0868, "step": 11243 }, { "epoch": 0.26, "learning_rate": 8.667387377461853e-06, "loss": 1.2584, "step": 11244 }, { "epoch": 0.26, "learning_rate": 8.667132091115446e-06, "loss": 1.0155, "step": 11245 }, { "epoch": 0.26, "learning_rate": 8.666876784079328e-06, "loss": 0.8792, "step": 11246 }, { "epoch": 0.26, "learning_rate": 8.66662145635494e-06, "loss": 0.8945, "step": 11247 }, { "epoch": 0.26, "learning_rate": 8.666366107943723e-06, "loss": 1.1591, "step": 11248 }, { "epoch": 0.26, "learning_rate": 8.666110738847118e-06, "loss": 0.7482, "step": 11249 }, { "epoch": 0.26, "learning_rate": 8.665855349066567e-06, "loss": 1.071, "step": 11250 }, { "epoch": 0.26, "learning_rate": 8.665599938603509e-06, "loss": 0.9471, "step": 11251 }, { "epoch": 0.26, "learning_rate": 8.665344507459384e-06, "loss": 1.0057, "step": 11252 }, { "epoch": 0.26, "learning_rate": 8.665089055635636e-06, "loss": 0.9547, "step": 11253 }, { "epoch": 0.26, "learning_rate": 8.664833583133704e-06, "loss": 0.9606, "step": 11254 }, { "epoch": 0.26, "learning_rate": 8.664578089955031e-06, "loss": 1.1355, "step": 11255 }, { "epoch": 0.26, "learning_rate": 8.664322576101056e-06, "loss": 0.9608, "step": 11256 }, { "epoch": 0.26, "learning_rate": 8.664067041573223e-06, "loss": 0.7765, "step": 11257 }, { "epoch": 0.26, "learning_rate": 8.663811486372974e-06, "loss": 1.0565, "step": 11258 }, { "epoch": 0.26, "learning_rate": 8.66355591050175e-06, "loss": 1.14, "step": 11259 }, { "epoch": 0.26, "learning_rate": 8.663300313960992e-06, "loss": 0.7889, "step": 11260 }, { "epoch": 0.26, "learning_rate": 8.663044696752142e-06, "loss": 0.9713, "step": 11261 }, { "epoch": 0.26, "learning_rate": 8.662789058876645e-06, "loss": 1.057, "step": 11262 }, { "epoch": 0.26, "learning_rate": 8.662533400335939e-06, "loss": 1.2618, "step": 11263 }, { "epoch": 0.26, "learning_rate": 8.66227772113147e-06, "loss": 0.7924, "step": 11264 }, { "epoch": 0.26, "learning_rate": 8.662022021264679e-06, "loss": 0.8273, "step": 11265 }, { "epoch": 0.26, "learning_rate": 8.66176630073701e-06, "loss": 0.9346, "step": 11266 }, { "epoch": 0.26, "learning_rate": 8.661510559549901e-06, "loss": 1.0884, "step": 11267 }, { "epoch": 0.26, "learning_rate": 8.661254797704802e-06, "loss": 1.0588, "step": 11268 }, { "epoch": 0.26, "learning_rate": 8.660999015203152e-06, "loss": 0.9072, "step": 11269 }, { "epoch": 0.26, "learning_rate": 8.660743212046393e-06, "loss": 0.7227, "step": 11270 }, { "epoch": 0.26, "learning_rate": 8.660487388235971e-06, "loss": 0.9328, "step": 11271 }, { "epoch": 0.26, "learning_rate": 8.660231543773328e-06, "loss": 1.2293, "step": 11272 }, { "epoch": 0.26, "learning_rate": 8.659975678659906e-06, "loss": 0.9474, "step": 11273 }, { "epoch": 0.26, "learning_rate": 8.659719792897152e-06, "loss": 1.3253, "step": 11274 }, { "epoch": 0.26, "learning_rate": 8.659463886486508e-06, "loss": 0.9062, "step": 11275 }, { "epoch": 0.26, "learning_rate": 8.659207959429416e-06, "loss": 1.0316, "step": 11276 }, { "epoch": 0.26, "learning_rate": 8.658952011727324e-06, "loss": 1.0454, "step": 11277 }, { "epoch": 0.26, "learning_rate": 8.658696043381673e-06, "loss": 1.1262, "step": 11278 }, { "epoch": 0.26, "learning_rate": 8.658440054393906e-06, "loss": 1.047, "step": 11279 }, { "epoch": 0.26, "learning_rate": 8.65818404476547e-06, "loss": 1.036, "step": 11280 }, { "epoch": 0.26, "learning_rate": 8.65792801449781e-06, "loss": 0.9967, "step": 11281 }, { "epoch": 0.26, "learning_rate": 8.657671963592366e-06, "loss": 0.9736, "step": 11282 }, { "epoch": 0.26, "learning_rate": 8.657415892050589e-06, "loss": 1.0753, "step": 11283 }, { "epoch": 0.26, "learning_rate": 8.657159799873917e-06, "loss": 0.8804, "step": 11284 }, { "epoch": 0.26, "learning_rate": 8.6569036870638e-06, "loss": 0.9509, "step": 11285 }, { "epoch": 0.26, "learning_rate": 8.656647553621683e-06, "loss": 0.9099, "step": 11286 }, { "epoch": 0.26, "learning_rate": 8.656391399549005e-06, "loss": 0.9364, "step": 11287 }, { "epoch": 0.26, "learning_rate": 8.65613522484722e-06, "loss": 0.9426, "step": 11288 }, { "epoch": 0.26, "learning_rate": 8.655879029517764e-06, "loss": 0.8899, "step": 11289 }, { "epoch": 0.26, "learning_rate": 8.65562281356209e-06, "loss": 0.962, "step": 11290 }, { "epoch": 0.26, "learning_rate": 8.655366576981641e-06, "loss": 1.0862, "step": 11291 }, { "epoch": 0.26, "learning_rate": 8.65511031977786e-06, "loss": 1.0371, "step": 11292 }, { "epoch": 0.26, "learning_rate": 8.654854041952198e-06, "loss": 0.8329, "step": 11293 }, { "epoch": 0.26, "learning_rate": 8.654597743506097e-06, "loss": 1.259, "step": 11294 }, { "epoch": 0.26, "learning_rate": 8.654341424441003e-06, "loss": 0.9841, "step": 11295 }, { "epoch": 0.26, "learning_rate": 8.654085084758365e-06, "loss": 0.9459, "step": 11296 }, { "epoch": 0.26, "learning_rate": 8.653828724459626e-06, "loss": 1.0244, "step": 11297 }, { "epoch": 0.26, "learning_rate": 8.653572343546234e-06, "loss": 1.1317, "step": 11298 }, { "epoch": 0.26, "learning_rate": 8.653315942019637e-06, "loss": 0.9118, "step": 11299 }, { "epoch": 0.26, "learning_rate": 8.653059519881279e-06, "loss": 1.0431, "step": 11300 }, { "epoch": 0.26, "learning_rate": 8.652803077132609e-06, "loss": 0.9522, "step": 11301 }, { "epoch": 0.26, "learning_rate": 8.652546613775071e-06, "loss": 1.0254, "step": 11302 }, { "epoch": 0.26, "learning_rate": 8.652290129810113e-06, "loss": 0.8216, "step": 11303 }, { "epoch": 0.26, "learning_rate": 8.652033625239182e-06, "loss": 0.7368, "step": 11304 }, { "epoch": 0.26, "learning_rate": 8.651777100063727e-06, "loss": 0.798, "step": 11305 }, { "epoch": 0.26, "learning_rate": 8.651520554285194e-06, "loss": 0.9865, "step": 11306 }, { "epoch": 0.26, "learning_rate": 8.65126398790503e-06, "loss": 0.7534, "step": 11307 }, { "epoch": 0.26, "learning_rate": 8.651007400924683e-06, "loss": 1.1139, "step": 11308 }, { "epoch": 0.26, "learning_rate": 8.650750793345602e-06, "loss": 0.9411, "step": 11309 }, { "epoch": 0.26, "learning_rate": 8.650494165169232e-06, "loss": 1.1394, "step": 11310 }, { "epoch": 0.26, "learning_rate": 8.650237516397021e-06, "loss": 0.9861, "step": 11311 }, { "epoch": 0.26, "learning_rate": 8.64998084703042e-06, "loss": 1.1016, "step": 11312 }, { "epoch": 0.26, "learning_rate": 8.649724157070876e-06, "loss": 0.9336, "step": 11313 }, { "epoch": 0.26, "learning_rate": 8.649467446519834e-06, "loss": 0.6052, "step": 11314 }, { "epoch": 0.26, "learning_rate": 8.649210715378746e-06, "loss": 1.0387, "step": 11315 }, { "epoch": 0.26, "learning_rate": 8.64895396364906e-06, "loss": 1.0984, "step": 11316 }, { "epoch": 0.26, "learning_rate": 8.648697191332224e-06, "loss": 1.0083, "step": 11317 }, { "epoch": 0.26, "learning_rate": 8.648440398429687e-06, "loss": 1.1455, "step": 11318 }, { "epoch": 0.26, "learning_rate": 8.648183584942896e-06, "loss": 1.124, "step": 11319 }, { "epoch": 0.26, "learning_rate": 8.647926750873302e-06, "loss": 0.9542, "step": 11320 }, { "epoch": 0.26, "learning_rate": 8.647669896222353e-06, "loss": 1.0905, "step": 11321 }, { "epoch": 0.26, "learning_rate": 8.6474130209915e-06, "loss": 1.0155, "step": 11322 }, { "epoch": 0.26, "learning_rate": 8.64715612518219e-06, "loss": 1.1974, "step": 11323 }, { "epoch": 0.26, "learning_rate": 8.646899208795874e-06, "loss": 1.0336, "step": 11324 }, { "epoch": 0.26, "learning_rate": 8.646642271833999e-06, "loss": 0.876, "step": 11325 }, { "epoch": 0.26, "learning_rate": 8.646385314298017e-06, "loss": 0.9502, "step": 11326 }, { "epoch": 0.26, "learning_rate": 8.646128336189376e-06, "loss": 0.8218, "step": 11327 }, { "epoch": 0.26, "learning_rate": 8.64587133750953e-06, "loss": 1.1538, "step": 11328 }, { "epoch": 0.26, "learning_rate": 8.645614318259923e-06, "loss": 0.8676, "step": 11329 }, { "epoch": 0.26, "learning_rate": 8.64535727844201e-06, "loss": 0.914, "step": 11330 }, { "epoch": 0.26, "learning_rate": 8.64510021805724e-06, "loss": 1.2246, "step": 11331 }, { "epoch": 0.26, "learning_rate": 8.644843137107058e-06, "loss": 1.0253, "step": 11332 }, { "epoch": 0.26, "learning_rate": 8.644586035592921e-06, "loss": 0.8296, "step": 11333 }, { "epoch": 0.26, "learning_rate": 8.64432891351628e-06, "loss": 0.6798, "step": 11334 }, { "epoch": 0.26, "learning_rate": 8.644071770878581e-06, "loss": 1.1339, "step": 11335 }, { "epoch": 0.26, "learning_rate": 8.643814607681277e-06, "loss": 1.0593, "step": 11336 }, { "epoch": 0.26, "learning_rate": 8.64355742392582e-06, "loss": 0.8863, "step": 11337 }, { "epoch": 0.26, "learning_rate": 8.643300219613658e-06, "loss": 1.1017, "step": 11338 }, { "epoch": 0.26, "learning_rate": 8.643042994746245e-06, "loss": 1.0112, "step": 11339 }, { "epoch": 0.26, "learning_rate": 8.64278574932503e-06, "loss": 0.9607, "step": 11340 }, { "epoch": 0.26, "learning_rate": 8.64252848335147e-06, "loss": 0.9168, "step": 11341 }, { "epoch": 0.26, "learning_rate": 8.642271196827009e-06, "loss": 0.8833, "step": 11342 }, { "epoch": 0.26, "learning_rate": 8.6420138897531e-06, "loss": 0.9068, "step": 11343 }, { "epoch": 0.26, "learning_rate": 8.641756562131197e-06, "loss": 1.002, "step": 11344 }, { "epoch": 0.26, "learning_rate": 8.641499213962753e-06, "loss": 1.1768, "step": 11345 }, { "epoch": 0.26, "learning_rate": 8.641241845249216e-06, "loss": 1.4188, "step": 11346 }, { "epoch": 0.26, "learning_rate": 8.640984455992042e-06, "loss": 1.0874, "step": 11347 }, { "epoch": 0.26, "learning_rate": 8.64072704619268e-06, "loss": 0.9641, "step": 11348 }, { "epoch": 0.26, "learning_rate": 8.640469615852585e-06, "loss": 0.7655, "step": 11349 }, { "epoch": 0.26, "learning_rate": 8.640212164973207e-06, "loss": 1.0487, "step": 11350 }, { "epoch": 0.26, "learning_rate": 8.639954693556001e-06, "loss": 0.956, "step": 11351 }, { "epoch": 0.26, "learning_rate": 8.639697201602417e-06, "loss": 1.1528, "step": 11352 }, { "epoch": 0.26, "learning_rate": 8.639439689113909e-06, "loss": 0.9781, "step": 11353 }, { "epoch": 0.26, "learning_rate": 8.63918215609193e-06, "loss": 0.7749, "step": 11354 }, { "epoch": 0.26, "learning_rate": 8.638924602537932e-06, "loss": 1.0351, "step": 11355 }, { "epoch": 0.26, "learning_rate": 8.638667028453372e-06, "loss": 1.0614, "step": 11356 }, { "epoch": 0.26, "learning_rate": 8.638409433839696e-06, "loss": 1.2899, "step": 11357 }, { "epoch": 0.26, "learning_rate": 8.638151818698364e-06, "loss": 0.89, "step": 11358 }, { "epoch": 0.26, "learning_rate": 8.637894183030826e-06, "loss": 1.1826, "step": 11359 }, { "epoch": 0.26, "learning_rate": 8.637636526838537e-06, "loss": 0.9641, "step": 11360 }, { "epoch": 0.26, "learning_rate": 8.63737885012295e-06, "loss": 0.8887, "step": 11361 }, { "epoch": 0.26, "learning_rate": 8.63712115288552e-06, "loss": 0.9896, "step": 11362 }, { "epoch": 0.26, "learning_rate": 8.636863435127699e-06, "loss": 1.2742, "step": 11363 }, { "epoch": 0.26, "learning_rate": 8.63660569685094e-06, "loss": 0.9844, "step": 11364 }, { "epoch": 0.26, "learning_rate": 8.636347938056701e-06, "loss": 0.7965, "step": 11365 }, { "epoch": 0.26, "learning_rate": 8.636090158746434e-06, "loss": 0.8292, "step": 11366 }, { "epoch": 0.26, "learning_rate": 8.635832358921592e-06, "loss": 0.8193, "step": 11367 }, { "epoch": 0.26, "learning_rate": 8.635574538583633e-06, "loss": 1.1261, "step": 11368 }, { "epoch": 0.26, "learning_rate": 8.635316697734009e-06, "loss": 1.0261, "step": 11369 }, { "epoch": 0.26, "learning_rate": 8.635058836374178e-06, "loss": 0.9434, "step": 11370 }, { "epoch": 0.26, "learning_rate": 8.63480095450559e-06, "loss": 1.1652, "step": 11371 }, { "epoch": 0.26, "learning_rate": 8.6345430521297e-06, "loss": 1.2165, "step": 11372 }, { "epoch": 0.26, "learning_rate": 8.634285129247968e-06, "loss": 0.9108, "step": 11373 }, { "epoch": 0.26, "learning_rate": 8.634027185861846e-06, "loss": 0.9678, "step": 11374 }, { "epoch": 0.26, "learning_rate": 8.63376922197279e-06, "loss": 1.2144, "step": 11375 }, { "epoch": 0.26, "learning_rate": 8.633511237582257e-06, "loss": 0.934, "step": 11376 }, { "epoch": 0.26, "learning_rate": 8.633253232691698e-06, "loss": 1.1063, "step": 11377 }, { "epoch": 0.26, "learning_rate": 8.632995207302572e-06, "loss": 1.052, "step": 11378 }, { "epoch": 0.26, "learning_rate": 8.632737161416335e-06, "loss": 1.0974, "step": 11379 }, { "epoch": 0.26, "learning_rate": 8.632479095034442e-06, "loss": 1.0858, "step": 11380 }, { "epoch": 0.26, "learning_rate": 8.632221008158348e-06, "loss": 1.0665, "step": 11381 }, { "epoch": 0.26, "learning_rate": 8.631962900789511e-06, "loss": 1.096, "step": 11382 }, { "epoch": 0.26, "learning_rate": 8.631704772929386e-06, "loss": 1.0053, "step": 11383 }, { "epoch": 0.26, "learning_rate": 8.63144662457943e-06, "loss": 1.2243, "step": 11384 }, { "epoch": 0.26, "learning_rate": 8.6311884557411e-06, "loss": 0.794, "step": 11385 }, { "epoch": 0.26, "learning_rate": 8.63093026641585e-06, "loss": 1.0797, "step": 11386 }, { "epoch": 0.26, "learning_rate": 8.630672056605139e-06, "loss": 1.1247, "step": 11387 }, { "epoch": 0.26, "learning_rate": 8.630413826310424e-06, "loss": 0.7214, "step": 11388 }, { "epoch": 0.26, "learning_rate": 8.63015557553316e-06, "loss": 1.0309, "step": 11389 }, { "epoch": 0.26, "learning_rate": 8.629897304274806e-06, "loss": 1.228, "step": 11390 }, { "epoch": 0.26, "learning_rate": 8.629639012536817e-06, "loss": 1.0949, "step": 11391 }, { "epoch": 0.26, "learning_rate": 8.629380700320653e-06, "loss": 1.0769, "step": 11392 }, { "epoch": 0.26, "learning_rate": 8.62912236762777e-06, "loss": 1.3344, "step": 11393 }, { "epoch": 0.26, "learning_rate": 8.628864014459624e-06, "loss": 0.9916, "step": 11394 }, { "epoch": 0.26, "learning_rate": 8.628605640817675e-06, "loss": 1.0791, "step": 11395 }, { "epoch": 0.26, "learning_rate": 8.628347246703381e-06, "loss": 1.0336, "step": 11396 }, { "epoch": 0.26, "learning_rate": 8.628088832118196e-06, "loss": 1.1725, "step": 11397 }, { "epoch": 0.26, "learning_rate": 8.627830397063583e-06, "loss": 0.9322, "step": 11398 }, { "epoch": 0.26, "learning_rate": 8.627571941540995e-06, "loss": 0.9986, "step": 11399 }, { "epoch": 0.26, "learning_rate": 8.627313465551895e-06, "loss": 1.143, "step": 11400 }, { "epoch": 0.26, "learning_rate": 8.627054969097739e-06, "loss": 1.2831, "step": 11401 }, { "epoch": 0.26, "learning_rate": 8.626796452179986e-06, "loss": 0.9862, "step": 11402 }, { "epoch": 0.26, "learning_rate": 8.626537914800093e-06, "loss": 1.0008, "step": 11403 }, { "epoch": 0.26, "learning_rate": 8.62627935695952e-06, "loss": 0.7909, "step": 11404 }, { "epoch": 0.26, "learning_rate": 8.626020778659724e-06, "loss": 0.8923, "step": 11405 }, { "epoch": 0.26, "learning_rate": 8.625762179902169e-06, "loss": 1.0391, "step": 11406 }, { "epoch": 0.26, "learning_rate": 8.625503560688308e-06, "loss": 0.9678, "step": 11407 }, { "epoch": 0.26, "learning_rate": 8.625244921019604e-06, "loss": 0.8693, "step": 11408 }, { "epoch": 0.26, "learning_rate": 8.624986260897513e-06, "loss": 0.9954, "step": 11409 }, { "epoch": 0.26, "learning_rate": 8.624727580323497e-06, "loss": 1.2959, "step": 11410 }, { "epoch": 0.26, "learning_rate": 8.624468879299013e-06, "loss": 0.8659, "step": 11411 }, { "epoch": 0.26, "learning_rate": 8.624210157825525e-06, "loss": 1.1028, "step": 11412 }, { "epoch": 0.26, "learning_rate": 8.623951415904488e-06, "loss": 0.8683, "step": 11413 }, { "epoch": 0.26, "learning_rate": 8.623692653537364e-06, "loss": 0.872, "step": 11414 }, { "epoch": 0.26, "learning_rate": 8.623433870725612e-06, "loss": 0.9214, "step": 11415 }, { "epoch": 0.26, "learning_rate": 8.623175067470693e-06, "loss": 0.849, "step": 11416 }, { "epoch": 0.26, "learning_rate": 8.622916243774067e-06, "loss": 1.2403, "step": 11417 }, { "epoch": 0.26, "learning_rate": 8.622657399637194e-06, "loss": 1.1366, "step": 11418 }, { "epoch": 0.26, "learning_rate": 8.622398535061533e-06, "loss": 0.8737, "step": 11419 }, { "epoch": 0.26, "learning_rate": 8.622139650048549e-06, "loss": 0.9615, "step": 11420 }, { "epoch": 0.26, "learning_rate": 8.621880744599696e-06, "loss": 0.8075, "step": 11421 }, { "epoch": 0.26, "learning_rate": 8.62162181871644e-06, "loss": 0.9746, "step": 11422 }, { "epoch": 0.26, "learning_rate": 8.62136287240024e-06, "loss": 1.0668, "step": 11423 }, { "epoch": 0.26, "learning_rate": 8.621103905652556e-06, "loss": 1.1297, "step": 11424 }, { "epoch": 0.26, "learning_rate": 8.620844918474851e-06, "loss": 1.0716, "step": 11425 }, { "epoch": 0.26, "learning_rate": 8.620585910868585e-06, "loss": 1.1064, "step": 11426 }, { "epoch": 0.27, "learning_rate": 8.62032688283522e-06, "loss": 1.2358, "step": 11427 }, { "epoch": 0.27, "learning_rate": 8.620067834376215e-06, "loss": 1.2232, "step": 11428 }, { "epoch": 0.27, "learning_rate": 8.619808765493036e-06, "loss": 1.1551, "step": 11429 }, { "epoch": 0.27, "learning_rate": 8.619549676187142e-06, "loss": 0.9182, "step": 11430 }, { "epoch": 0.27, "learning_rate": 8.619290566459994e-06, "loss": 0.8861, "step": 11431 }, { "epoch": 0.27, "learning_rate": 8.619031436313054e-06, "loss": 1.2386, "step": 11432 }, { "epoch": 0.27, "learning_rate": 8.618772285747787e-06, "loss": 1.4985, "step": 11433 }, { "epoch": 0.27, "learning_rate": 8.618513114765652e-06, "loss": 1.082, "step": 11434 }, { "epoch": 0.27, "learning_rate": 8.61825392336811e-06, "loss": 1.1933, "step": 11435 }, { "epoch": 0.27, "learning_rate": 8.617994711556627e-06, "loss": 1.016, "step": 11436 }, { "epoch": 0.27, "learning_rate": 8.617735479332665e-06, "loss": 1.1505, "step": 11437 }, { "epoch": 0.27, "learning_rate": 8.617476226697685e-06, "loss": 0.9911, "step": 11438 }, { "epoch": 0.27, "learning_rate": 8.61721695365315e-06, "loss": 0.9969, "step": 11439 }, { "epoch": 0.27, "learning_rate": 8.616957660200523e-06, "loss": 0.883, "step": 11440 }, { "epoch": 0.27, "learning_rate": 8.616698346341267e-06, "loss": 0.8538, "step": 11441 }, { "epoch": 0.27, "learning_rate": 8.616439012076844e-06, "loss": 1.2893, "step": 11442 }, { "epoch": 0.27, "learning_rate": 8.61617965740872e-06, "loss": 0.9708, "step": 11443 }, { "epoch": 0.27, "learning_rate": 8.615920282338355e-06, "loss": 0.9519, "step": 11444 }, { "epoch": 0.27, "learning_rate": 8.615660886867215e-06, "loss": 0.7344, "step": 11445 }, { "epoch": 0.27, "learning_rate": 8.61540147099676e-06, "loss": 1.1473, "step": 11446 }, { "epoch": 0.27, "learning_rate": 8.615142034728456e-06, "loss": 0.876, "step": 11447 }, { "epoch": 0.27, "learning_rate": 8.614882578063768e-06, "loss": 0.9045, "step": 11448 }, { "epoch": 0.27, "learning_rate": 8.614623101004158e-06, "loss": 0.935, "step": 11449 }, { "epoch": 0.27, "learning_rate": 8.614363603551091e-06, "loss": 0.988, "step": 11450 }, { "epoch": 0.27, "learning_rate": 8.61410408570603e-06, "loss": 0.778, "step": 11451 }, { "epoch": 0.27, "learning_rate": 8.613844547470437e-06, "loss": 0.9119, "step": 11452 }, { "epoch": 0.27, "learning_rate": 8.613584988845783e-06, "loss": 1.0555, "step": 11453 }, { "epoch": 0.27, "learning_rate": 8.613325409833527e-06, "loss": 1.0586, "step": 11454 }, { "epoch": 0.27, "learning_rate": 8.613065810435134e-06, "loss": 1.0425, "step": 11455 }, { "epoch": 0.27, "learning_rate": 8.61280619065207e-06, "loss": 0.984, "step": 11456 }, { "epoch": 0.27, "learning_rate": 8.612546550485798e-06, "loss": 0.9697, "step": 11457 }, { "epoch": 0.27, "learning_rate": 8.612286889937784e-06, "loss": 0.8134, "step": 11458 }, { "epoch": 0.27, "learning_rate": 8.612027209009495e-06, "loss": 1.3606, "step": 11459 }, { "epoch": 0.27, "learning_rate": 8.611767507702393e-06, "loss": 0.9538, "step": 11460 }, { "epoch": 0.27, "learning_rate": 8.611507786017945e-06, "loss": 1.1926, "step": 11461 }, { "epoch": 0.27, "learning_rate": 8.611248043957615e-06, "loss": 0.8881, "step": 11462 }, { "epoch": 0.27, "learning_rate": 8.610988281522869e-06, "loss": 1.0178, "step": 11463 }, { "epoch": 0.27, "learning_rate": 8.610728498715173e-06, "loss": 1.0346, "step": 11464 }, { "epoch": 0.27, "learning_rate": 8.610468695535993e-06, "loss": 1.1755, "step": 11465 }, { "epoch": 0.27, "learning_rate": 8.610208871986793e-06, "loss": 1.0566, "step": 11466 }, { "epoch": 0.27, "learning_rate": 8.609949028069042e-06, "loss": 0.9001, "step": 11467 }, { "epoch": 0.27, "learning_rate": 8.609689163784203e-06, "loss": 0.9721, "step": 11468 }, { "epoch": 0.27, "learning_rate": 8.609429279133743e-06, "loss": 1.1843, "step": 11469 }, { "epoch": 0.27, "learning_rate": 8.609169374119129e-06, "loss": 0.7927, "step": 11470 }, { "epoch": 0.27, "learning_rate": 8.608909448741827e-06, "loss": 0.9708, "step": 11471 }, { "epoch": 0.27, "learning_rate": 8.608649503003304e-06, "loss": 0.8417, "step": 11472 }, { "epoch": 0.27, "learning_rate": 8.608389536905024e-06, "loss": 1.0053, "step": 11473 }, { "epoch": 0.27, "learning_rate": 8.608129550448456e-06, "loss": 1.4506, "step": 11474 }, { "epoch": 0.27, "learning_rate": 8.607869543635068e-06, "loss": 1.2453, "step": 11475 }, { "epoch": 0.27, "learning_rate": 8.607609516466324e-06, "loss": 0.9092, "step": 11476 }, { "epoch": 0.27, "learning_rate": 8.607349468943695e-06, "loss": 0.7729, "step": 11477 }, { "epoch": 0.27, "learning_rate": 8.607089401068643e-06, "loss": 0.8209, "step": 11478 }, { "epoch": 0.27, "learning_rate": 8.606829312842638e-06, "loss": 0.8485, "step": 11479 }, { "epoch": 0.27, "learning_rate": 8.606569204267149e-06, "loss": 1.0423, "step": 11480 }, { "epoch": 0.27, "learning_rate": 8.60630907534364e-06, "loss": 0.8333, "step": 11481 }, { "epoch": 0.27, "learning_rate": 8.606048926073583e-06, "loss": 0.9311, "step": 11482 }, { "epoch": 0.27, "learning_rate": 8.605788756458442e-06, "loss": 1.1167, "step": 11483 }, { "epoch": 0.27, "learning_rate": 8.605528566499686e-06, "loss": 0.9638, "step": 11484 }, { "epoch": 0.27, "learning_rate": 8.605268356198782e-06, "loss": 0.9786, "step": 11485 }, { "epoch": 0.27, "learning_rate": 8.6050081255572e-06, "loss": 1.1247, "step": 11486 }, { "epoch": 0.27, "learning_rate": 8.604747874576408e-06, "loss": 1.0503, "step": 11487 }, { "epoch": 0.27, "learning_rate": 8.604487603257874e-06, "loss": 0.75, "step": 11488 }, { "epoch": 0.27, "learning_rate": 8.604227311603064e-06, "loss": 0.9574, "step": 11489 }, { "epoch": 0.27, "learning_rate": 8.60396699961345e-06, "loss": 1.324, "step": 11490 }, { "epoch": 0.27, "learning_rate": 8.6037066672905e-06, "loss": 0.969, "step": 11491 }, { "epoch": 0.27, "learning_rate": 8.603446314635681e-06, "loss": 1.2138, "step": 11492 }, { "epoch": 0.27, "learning_rate": 8.603185941650464e-06, "loss": 1.1362, "step": 11493 }, { "epoch": 0.27, "learning_rate": 8.602925548336316e-06, "loss": 1.183, "step": 11494 }, { "epoch": 0.27, "learning_rate": 8.602665134694707e-06, "loss": 1.0354, "step": 11495 }, { "epoch": 0.27, "learning_rate": 8.602404700727108e-06, "loss": 1.241, "step": 11496 }, { "epoch": 0.27, "learning_rate": 8.602144246434985e-06, "loss": 0.9347, "step": 11497 }, { "epoch": 0.27, "learning_rate": 8.60188377181981e-06, "loss": 1.0383, "step": 11498 }, { "epoch": 0.27, "learning_rate": 8.601623276883051e-06, "loss": 1.2054, "step": 11499 }, { "epoch": 0.27, "learning_rate": 8.60136276162618e-06, "loss": 1.1558, "step": 11500 }, { "epoch": 0.27, "learning_rate": 8.601102226050664e-06, "loss": 0.951, "step": 11501 }, { "epoch": 0.27, "learning_rate": 8.600841670157975e-06, "loss": 1.1358, "step": 11502 }, { "epoch": 0.27, "learning_rate": 8.600581093949581e-06, "loss": 0.8224, "step": 11503 }, { "epoch": 0.27, "learning_rate": 8.600320497426955e-06, "loss": 0.8942, "step": 11504 }, { "epoch": 0.27, "learning_rate": 8.600059880591565e-06, "loss": 1.2271, "step": 11505 }, { "epoch": 0.27, "learning_rate": 8.599799243444881e-06, "loss": 0.9502, "step": 11506 }, { "epoch": 0.27, "learning_rate": 8.599538585988376e-06, "loss": 1.1087, "step": 11507 }, { "epoch": 0.27, "learning_rate": 8.599277908223518e-06, "loss": 0.8691, "step": 11508 }, { "epoch": 0.27, "learning_rate": 8.59901721015178e-06, "loss": 1.001, "step": 11509 }, { "epoch": 0.27, "learning_rate": 8.59875649177463e-06, "loss": 1.0034, "step": 11510 }, { "epoch": 0.27, "learning_rate": 8.598495753093541e-06, "loss": 0.9909, "step": 11511 }, { "epoch": 0.27, "learning_rate": 8.598234994109984e-06, "loss": 0.9068, "step": 11512 }, { "epoch": 0.27, "learning_rate": 8.597974214825431e-06, "loss": 0.9522, "step": 11513 }, { "epoch": 0.27, "learning_rate": 8.597713415241353e-06, "loss": 1.1151, "step": 11514 }, { "epoch": 0.27, "learning_rate": 8.597452595359219e-06, "loss": 0.9528, "step": 11515 }, { "epoch": 0.27, "learning_rate": 8.597191755180501e-06, "loss": 1.0933, "step": 11516 }, { "epoch": 0.27, "learning_rate": 8.596930894706675e-06, "loss": 0.8112, "step": 11517 }, { "epoch": 0.27, "learning_rate": 8.596670013939206e-06, "loss": 0.6751, "step": 11518 }, { "epoch": 0.27, "learning_rate": 8.59640911287957e-06, "loss": 0.7681, "step": 11519 }, { "epoch": 0.27, "learning_rate": 8.59614819152924e-06, "loss": 1.0173, "step": 11520 }, { "epoch": 0.27, "learning_rate": 8.595887249889688e-06, "loss": 0.9964, "step": 11521 }, { "epoch": 0.27, "learning_rate": 8.595626287962382e-06, "loss": 1.2695, "step": 11522 }, { "epoch": 0.27, "learning_rate": 8.595365305748797e-06, "loss": 0.6766, "step": 11523 }, { "epoch": 0.27, "learning_rate": 8.595104303250408e-06, "loss": 1.043, "step": 11524 }, { "epoch": 0.27, "learning_rate": 8.594843280468683e-06, "loss": 0.9246, "step": 11525 }, { "epoch": 0.27, "learning_rate": 8.594582237405097e-06, "loss": 0.7058, "step": 11526 }, { "epoch": 0.27, "learning_rate": 8.594321174061123e-06, "loss": 1.072, "step": 11527 }, { "epoch": 0.27, "learning_rate": 8.594060090438231e-06, "loss": 0.9026, "step": 11528 }, { "epoch": 0.27, "learning_rate": 8.5937989865379e-06, "loss": 0.8359, "step": 11529 }, { "epoch": 0.27, "learning_rate": 8.593537862361599e-06, "loss": 0.9204, "step": 11530 }, { "epoch": 0.27, "learning_rate": 8.5932767179108e-06, "loss": 1.2036, "step": 11531 }, { "epoch": 0.27, "learning_rate": 8.593015553186979e-06, "loss": 0.8619, "step": 11532 }, { "epoch": 0.27, "learning_rate": 8.592754368191608e-06, "loss": 1.1998, "step": 11533 }, { "epoch": 0.27, "learning_rate": 8.592493162926163e-06, "loss": 0.8836, "step": 11534 }, { "epoch": 0.27, "learning_rate": 8.592231937392115e-06, "loss": 0.9697, "step": 11535 }, { "epoch": 0.27, "learning_rate": 8.591970691590939e-06, "loss": 0.9188, "step": 11536 }, { "epoch": 0.27, "learning_rate": 8.591709425524107e-06, "loss": 1.0397, "step": 11537 }, { "epoch": 0.27, "learning_rate": 8.591448139193095e-06, "loss": 0.9919, "step": 11538 }, { "epoch": 0.27, "learning_rate": 8.591186832599379e-06, "loss": 0.8355, "step": 11539 }, { "epoch": 0.27, "learning_rate": 8.59092550574443e-06, "loss": 1.0092, "step": 11540 }, { "epoch": 0.27, "learning_rate": 8.590664158629725e-06, "loss": 0.8065, "step": 11541 }, { "epoch": 0.27, "learning_rate": 8.590402791256734e-06, "loss": 0.9919, "step": 11542 }, { "epoch": 0.27, "learning_rate": 8.590141403626937e-06, "loss": 0.8763, "step": 11543 }, { "epoch": 0.27, "learning_rate": 8.589879995741805e-06, "loss": 1.0187, "step": 11544 }, { "epoch": 0.27, "learning_rate": 8.589618567602815e-06, "loss": 0.9968, "step": 11545 }, { "epoch": 0.27, "learning_rate": 8.589357119211443e-06, "loss": 1.0682, "step": 11546 }, { "epoch": 0.27, "learning_rate": 8.58909565056916e-06, "loss": 1.0688, "step": 11547 }, { "epoch": 0.27, "learning_rate": 8.588834161677444e-06, "loss": 1.0924, "step": 11548 }, { "epoch": 0.27, "learning_rate": 8.58857265253777e-06, "loss": 0.9446, "step": 11549 }, { "epoch": 0.27, "learning_rate": 8.588311123151613e-06, "loss": 0.9241, "step": 11550 }, { "epoch": 0.27, "learning_rate": 8.588049573520449e-06, "loss": 0.97, "step": 11551 }, { "epoch": 0.27, "learning_rate": 8.587788003645752e-06, "loss": 0.9067, "step": 11552 }, { "epoch": 0.27, "learning_rate": 8.587526413529001e-06, "loss": 0.8008, "step": 11553 }, { "epoch": 0.27, "learning_rate": 8.587264803171668e-06, "loss": 0.9707, "step": 11554 }, { "epoch": 0.27, "learning_rate": 8.587003172575232e-06, "loss": 0.9551, "step": 11555 }, { "epoch": 0.27, "learning_rate": 8.58674152174117e-06, "loss": 1.1431, "step": 11556 }, { "epoch": 0.27, "learning_rate": 8.586479850670953e-06, "loss": 1.0441, "step": 11557 }, { "epoch": 0.27, "learning_rate": 8.586218159366063e-06, "loss": 1.0299, "step": 11558 }, { "epoch": 0.27, "learning_rate": 8.585956447827973e-06, "loss": 1.0782, "step": 11559 }, { "epoch": 0.27, "learning_rate": 8.58569471605816e-06, "loss": 0.997, "step": 11560 }, { "epoch": 0.27, "learning_rate": 8.585432964058103e-06, "loss": 1.0391, "step": 11561 }, { "epoch": 0.27, "learning_rate": 8.585171191829276e-06, "loss": 1.0248, "step": 11562 }, { "epoch": 0.27, "learning_rate": 8.584909399373157e-06, "loss": 1.0367, "step": 11563 }, { "epoch": 0.27, "learning_rate": 8.584647586691224e-06, "loss": 1.0135, "step": 11564 }, { "epoch": 0.27, "learning_rate": 8.584385753784951e-06, "loss": 0.9537, "step": 11565 }, { "epoch": 0.27, "learning_rate": 8.58412390065582e-06, "loss": 1.0866, "step": 11566 }, { "epoch": 0.27, "learning_rate": 8.583862027305305e-06, "loss": 0.74, "step": 11567 }, { "epoch": 0.27, "learning_rate": 8.583600133734885e-06, "loss": 0.7768, "step": 11568 }, { "epoch": 0.27, "learning_rate": 8.583338219946034e-06, "loss": 0.8498, "step": 11569 }, { "epoch": 0.27, "learning_rate": 8.583076285940234e-06, "loss": 0.9379, "step": 11570 }, { "epoch": 0.27, "learning_rate": 8.582814331718961e-06, "loss": 0.5536, "step": 11571 }, { "epoch": 0.27, "learning_rate": 8.582552357283695e-06, "loss": 0.873, "step": 11572 }, { "epoch": 0.27, "learning_rate": 8.58229036263591e-06, "loss": 0.9942, "step": 11573 }, { "epoch": 0.27, "learning_rate": 8.582028347777086e-06, "loss": 1.2312, "step": 11574 }, { "epoch": 0.27, "learning_rate": 8.581766312708704e-06, "loss": 1.1087, "step": 11575 }, { "epoch": 0.27, "learning_rate": 8.58150425743224e-06, "loss": 0.8622, "step": 11576 }, { "epoch": 0.27, "learning_rate": 8.581242181949172e-06, "loss": 0.8006, "step": 11577 }, { "epoch": 0.27, "learning_rate": 8.58098008626098e-06, "loss": 0.7788, "step": 11578 }, { "epoch": 0.27, "learning_rate": 8.58071797036914e-06, "loss": 0.8205, "step": 11579 }, { "epoch": 0.27, "learning_rate": 8.580455834275134e-06, "loss": 0.9851, "step": 11580 }, { "epoch": 0.27, "learning_rate": 8.58019367798044e-06, "loss": 0.9842, "step": 11581 }, { "epoch": 0.27, "learning_rate": 8.579931501486536e-06, "loss": 0.83, "step": 11582 }, { "epoch": 0.27, "learning_rate": 8.579669304794901e-06, "loss": 0.8765, "step": 11583 }, { "epoch": 0.27, "learning_rate": 8.579407087907018e-06, "loss": 0.9055, "step": 11584 }, { "epoch": 0.27, "learning_rate": 8.579144850824361e-06, "loss": 0.8791, "step": 11585 }, { "epoch": 0.27, "learning_rate": 8.578882593548415e-06, "loss": 0.7396, "step": 11586 }, { "epoch": 0.27, "learning_rate": 8.578620316080655e-06, "loss": 1.0916, "step": 11587 }, { "epoch": 0.27, "learning_rate": 8.578358018422561e-06, "loss": 0.8484, "step": 11588 }, { "epoch": 0.27, "learning_rate": 8.578095700575617e-06, "loss": 0.9186, "step": 11589 }, { "epoch": 0.27, "learning_rate": 8.5778333625413e-06, "loss": 0.8003, "step": 11590 }, { "epoch": 0.27, "learning_rate": 8.57757100432109e-06, "loss": 0.9285, "step": 11591 }, { "epoch": 0.27, "learning_rate": 8.577308625916467e-06, "loss": 1.025, "step": 11592 }, { "epoch": 0.27, "learning_rate": 8.577046227328913e-06, "loss": 1.2512, "step": 11593 }, { "epoch": 0.27, "learning_rate": 8.576783808559909e-06, "loss": 1.0948, "step": 11594 }, { "epoch": 0.27, "learning_rate": 8.576521369610933e-06, "loss": 1.0861, "step": 11595 }, { "epoch": 0.27, "learning_rate": 8.576258910483467e-06, "loss": 0.8203, "step": 11596 }, { "epoch": 0.27, "learning_rate": 8.575996431178989e-06, "loss": 0.9515, "step": 11597 }, { "epoch": 0.27, "learning_rate": 8.575733931698985e-06, "loss": 1.4244, "step": 11598 }, { "epoch": 0.27, "learning_rate": 8.575471412044932e-06, "loss": 0.7307, "step": 11599 }, { "epoch": 0.27, "learning_rate": 8.575208872218312e-06, "loss": 0.9964, "step": 11600 }, { "epoch": 0.27, "learning_rate": 8.574946312220609e-06, "loss": 1.0445, "step": 11601 }, { "epoch": 0.27, "learning_rate": 8.574683732053301e-06, "loss": 0.7952, "step": 11602 }, { "epoch": 0.27, "learning_rate": 8.57442113171787e-06, "loss": 1.1141, "step": 11603 }, { "epoch": 0.27, "learning_rate": 8.574158511215799e-06, "loss": 0.7779, "step": 11604 }, { "epoch": 0.27, "learning_rate": 8.573895870548568e-06, "loss": 1.0299, "step": 11605 }, { "epoch": 0.27, "learning_rate": 8.57363320971766e-06, "loss": 1.1654, "step": 11606 }, { "epoch": 0.27, "learning_rate": 8.573370528724557e-06, "loss": 0.79, "step": 11607 }, { "epoch": 0.27, "learning_rate": 8.573107827570739e-06, "loss": 1.141, "step": 11608 }, { "epoch": 0.27, "learning_rate": 8.57284510625769e-06, "loss": 0.9787, "step": 11609 }, { "epoch": 0.27, "learning_rate": 8.572582364786893e-06, "loss": 1.1121, "step": 11610 }, { "epoch": 0.27, "learning_rate": 8.572319603159828e-06, "loss": 0.7755, "step": 11611 }, { "epoch": 0.27, "learning_rate": 8.572056821377981e-06, "loss": 1.03, "step": 11612 }, { "epoch": 0.27, "learning_rate": 8.57179401944283e-06, "loss": 0.9733, "step": 11613 }, { "epoch": 0.27, "learning_rate": 8.571531197355862e-06, "loss": 0.9915, "step": 11614 }, { "epoch": 0.27, "learning_rate": 8.571268355118558e-06, "loss": 1.0273, "step": 11615 }, { "epoch": 0.27, "learning_rate": 8.5710054927324e-06, "loss": 1.2422, "step": 11616 }, { "epoch": 0.27, "learning_rate": 8.570742610198872e-06, "loss": 1.1342, "step": 11617 }, { "epoch": 0.27, "learning_rate": 8.570479707519456e-06, "loss": 0.9411, "step": 11618 }, { "epoch": 0.27, "learning_rate": 8.570216784695637e-06, "loss": 0.8774, "step": 11619 }, { "epoch": 0.27, "learning_rate": 8.569953841728897e-06, "loss": 0.9468, "step": 11620 }, { "epoch": 0.27, "learning_rate": 8.569690878620721e-06, "loss": 1.1143, "step": 11621 }, { "epoch": 0.27, "learning_rate": 8.569427895372593e-06, "loss": 1.0404, "step": 11622 }, { "epoch": 0.27, "learning_rate": 8.569164891985994e-06, "loss": 0.8014, "step": 11623 }, { "epoch": 0.27, "learning_rate": 8.568901868462411e-06, "loss": 0.9048, "step": 11624 }, { "epoch": 0.27, "learning_rate": 8.568638824803327e-06, "loss": 1.2012, "step": 11625 }, { "epoch": 0.27, "learning_rate": 8.568375761010223e-06, "loss": 1.1555, "step": 11626 }, { "epoch": 0.27, "learning_rate": 8.568112677084587e-06, "loss": 0.8145, "step": 11627 }, { "epoch": 0.27, "learning_rate": 8.567849573027903e-06, "loss": 1.1562, "step": 11628 }, { "epoch": 0.27, "learning_rate": 8.567586448841652e-06, "loss": 0.9312, "step": 11629 }, { "epoch": 0.27, "learning_rate": 8.567323304527321e-06, "loss": 0.7813, "step": 11630 }, { "epoch": 0.27, "learning_rate": 8.567060140086397e-06, "loss": 1.0016, "step": 11631 }, { "epoch": 0.27, "learning_rate": 8.56679695552036e-06, "loss": 0.7938, "step": 11632 }, { "epoch": 0.27, "learning_rate": 8.5665337508307e-06, "loss": 0.966, "step": 11633 }, { "epoch": 0.27, "learning_rate": 8.566270526018896e-06, "loss": 1.0365, "step": 11634 }, { "epoch": 0.27, "learning_rate": 8.566007281086437e-06, "loss": 0.8021, "step": 11635 }, { "epoch": 0.27, "learning_rate": 8.565744016034808e-06, "loss": 1.1521, "step": 11636 }, { "epoch": 0.27, "learning_rate": 8.565480730865494e-06, "loss": 1.0309, "step": 11637 }, { "epoch": 0.27, "learning_rate": 8.56521742557998e-06, "loss": 1.0409, "step": 11638 }, { "epoch": 0.27, "learning_rate": 8.564954100179752e-06, "loss": 1.098, "step": 11639 }, { "epoch": 0.27, "learning_rate": 8.564690754666295e-06, "loss": 0.8702, "step": 11640 }, { "epoch": 0.27, "learning_rate": 8.564427389041095e-06, "loss": 0.897, "step": 11641 }, { "epoch": 0.27, "learning_rate": 8.56416400330564e-06, "loss": 0.9441, "step": 11642 }, { "epoch": 0.27, "learning_rate": 8.563900597461413e-06, "loss": 1.1201, "step": 11643 }, { "epoch": 0.27, "learning_rate": 8.563637171509901e-06, "loss": 1.0018, "step": 11644 }, { "epoch": 0.27, "learning_rate": 8.56337372545259e-06, "loss": 0.8689, "step": 11645 }, { "epoch": 0.27, "learning_rate": 8.563110259290968e-06, "loss": 0.8515, "step": 11646 }, { "epoch": 0.27, "learning_rate": 8.56284677302652e-06, "loss": 0.9286, "step": 11647 }, { "epoch": 0.27, "learning_rate": 8.562583266660732e-06, "loss": 0.9484, "step": 11648 }, { "epoch": 0.27, "learning_rate": 8.562319740195092e-06, "loss": 1.1461, "step": 11649 }, { "epoch": 0.27, "learning_rate": 8.562056193631087e-06, "loss": 0.9034, "step": 11650 }, { "epoch": 0.27, "learning_rate": 8.561792626970203e-06, "loss": 0.7989, "step": 11651 }, { "epoch": 0.27, "learning_rate": 8.561529040213926e-06, "loss": 0.9667, "step": 11652 }, { "epoch": 0.27, "learning_rate": 8.561265433363746e-06, "loss": 0.9295, "step": 11653 }, { "epoch": 0.27, "learning_rate": 8.561001806421147e-06, "loss": 0.8033, "step": 11654 }, { "epoch": 0.27, "learning_rate": 8.56073815938762e-06, "loss": 1.1216, "step": 11655 }, { "epoch": 0.27, "learning_rate": 8.560474492264648e-06, "loss": 0.7516, "step": 11656 }, { "epoch": 0.27, "learning_rate": 8.560210805053724e-06, "loss": 0.8931, "step": 11657 }, { "epoch": 0.27, "learning_rate": 8.559947097756331e-06, "loss": 0.8561, "step": 11658 }, { "epoch": 0.27, "learning_rate": 8.559683370373959e-06, "loss": 0.9948, "step": 11659 }, { "epoch": 0.27, "learning_rate": 8.559419622908096e-06, "loss": 0.9323, "step": 11660 }, { "epoch": 0.27, "learning_rate": 8.559155855360228e-06, "loss": 0.7189, "step": 11661 }, { "epoch": 0.27, "learning_rate": 8.558892067731846e-06, "loss": 1.0849, "step": 11662 }, { "epoch": 0.27, "learning_rate": 8.558628260024437e-06, "loss": 1.1091, "step": 11663 }, { "epoch": 0.27, "learning_rate": 8.558364432239489e-06, "loss": 1.2649, "step": 11664 }, { "epoch": 0.27, "learning_rate": 8.558100584378493e-06, "loss": 0.8709, "step": 11665 }, { "epoch": 0.27, "learning_rate": 8.557836716442933e-06, "loss": 1.1181, "step": 11666 }, { "epoch": 0.27, "learning_rate": 8.557572828434302e-06, "loss": 1.0991, "step": 11667 }, { "epoch": 0.27, "learning_rate": 8.557308920354086e-06, "loss": 0.8494, "step": 11668 }, { "epoch": 0.27, "learning_rate": 8.557044992203774e-06, "loss": 0.9431, "step": 11669 }, { "epoch": 0.27, "learning_rate": 8.556781043984858e-06, "loss": 0.9781, "step": 11670 }, { "epoch": 0.27, "learning_rate": 8.556517075698825e-06, "loss": 0.9786, "step": 11671 }, { "epoch": 0.27, "learning_rate": 8.556253087347164e-06, "loss": 0.8013, "step": 11672 }, { "epoch": 0.27, "learning_rate": 8.555989078931366e-06, "loss": 1.0685, "step": 11673 }, { "epoch": 0.27, "learning_rate": 8.555725050452918e-06, "loss": 0.8564, "step": 11674 }, { "epoch": 0.27, "learning_rate": 8.555461001913312e-06, "loss": 0.8376, "step": 11675 }, { "epoch": 0.27, "learning_rate": 8.555196933314035e-06, "loss": 1.2428, "step": 11676 }, { "epoch": 0.27, "learning_rate": 8.554932844656582e-06, "loss": 0.8431, "step": 11677 }, { "epoch": 0.27, "learning_rate": 8.554668735942437e-06, "loss": 0.909, "step": 11678 }, { "epoch": 0.27, "learning_rate": 8.554404607173095e-06, "loss": 1.2907, "step": 11679 }, { "epoch": 0.27, "learning_rate": 8.554140458350042e-06, "loss": 1.1462, "step": 11680 }, { "epoch": 0.27, "learning_rate": 8.553876289474772e-06, "loss": 0.937, "step": 11681 }, { "epoch": 0.27, "learning_rate": 8.553612100548772e-06, "loss": 0.8591, "step": 11682 }, { "epoch": 0.27, "learning_rate": 8.553347891573536e-06, "loss": 1.1512, "step": 11683 }, { "epoch": 0.27, "learning_rate": 8.553083662550552e-06, "loss": 0.9843, "step": 11684 }, { "epoch": 0.27, "learning_rate": 8.552819413481311e-06, "loss": 0.9143, "step": 11685 }, { "epoch": 0.27, "learning_rate": 8.552555144367305e-06, "loss": 1.0073, "step": 11686 }, { "epoch": 0.27, "learning_rate": 8.552290855210026e-06, "loss": 1.0597, "step": 11687 }, { "epoch": 0.27, "learning_rate": 8.552026546010961e-06, "loss": 0.7847, "step": 11688 }, { "epoch": 0.27, "learning_rate": 8.551762216771606e-06, "loss": 1.1191, "step": 11689 }, { "epoch": 0.27, "learning_rate": 8.55149786749345e-06, "loss": 1.0417, "step": 11690 }, { "epoch": 0.27, "learning_rate": 8.551233498177982e-06, "loss": 1.031, "step": 11691 }, { "epoch": 0.27, "learning_rate": 8.550969108826698e-06, "loss": 1.0639, "step": 11692 }, { "epoch": 0.27, "learning_rate": 8.550704699441089e-06, "loss": 0.7531, "step": 11693 }, { "epoch": 0.27, "learning_rate": 8.550440270022645e-06, "loss": 0.9985, "step": 11694 }, { "epoch": 0.27, "learning_rate": 8.550175820572858e-06, "loss": 0.9275, "step": 11695 }, { "epoch": 0.27, "learning_rate": 8.54991135109322e-06, "loss": 0.9247, "step": 11696 }, { "epoch": 0.27, "learning_rate": 8.549646861585223e-06, "loss": 0.9496, "step": 11697 }, { "epoch": 0.27, "learning_rate": 8.549382352050361e-06, "loss": 0.9697, "step": 11698 }, { "epoch": 0.27, "learning_rate": 8.549117822490124e-06, "loss": 1.003, "step": 11699 }, { "epoch": 0.27, "learning_rate": 8.548853272906008e-06, "loss": 0.958, "step": 11700 }, { "epoch": 0.27, "learning_rate": 8.548588703299503e-06, "loss": 1.1542, "step": 11701 }, { "epoch": 0.27, "learning_rate": 8.5483241136721e-06, "loss": 0.8342, "step": 11702 }, { "epoch": 0.27, "learning_rate": 8.548059504025295e-06, "loss": 1.0575, "step": 11703 }, { "epoch": 0.27, "learning_rate": 8.54779487436058e-06, "loss": 0.7482, "step": 11704 }, { "epoch": 0.27, "learning_rate": 8.547530224679446e-06, "loss": 1.1171, "step": 11705 }, { "epoch": 0.27, "learning_rate": 8.54726555498339e-06, "loss": 1.0421, "step": 11706 }, { "epoch": 0.27, "learning_rate": 8.547000865273901e-06, "loss": 1.0774, "step": 11707 }, { "epoch": 0.27, "learning_rate": 8.546736155552475e-06, "loss": 0.9116, "step": 11708 }, { "epoch": 0.27, "learning_rate": 8.546471425820606e-06, "loss": 1.1404, "step": 11709 }, { "epoch": 0.27, "learning_rate": 8.546206676079785e-06, "loss": 1.0616, "step": 11710 }, { "epoch": 0.27, "learning_rate": 8.545941906331507e-06, "loss": 1.0166, "step": 11711 }, { "epoch": 0.27, "learning_rate": 8.545677116577267e-06, "loss": 0.9871, "step": 11712 }, { "epoch": 0.27, "learning_rate": 8.545412306818558e-06, "loss": 1.0961, "step": 11713 }, { "epoch": 0.27, "learning_rate": 8.545147477056873e-06, "loss": 0.7208, "step": 11714 }, { "epoch": 0.27, "learning_rate": 8.544882627293708e-06, "loss": 1.0241, "step": 11715 }, { "epoch": 0.27, "learning_rate": 8.544617757530556e-06, "loss": 0.8709, "step": 11716 }, { "epoch": 0.27, "learning_rate": 8.54435286776891e-06, "loss": 1.0398, "step": 11717 }, { "epoch": 0.27, "learning_rate": 8.544087958010268e-06, "loss": 0.8347, "step": 11718 }, { "epoch": 0.27, "learning_rate": 8.543823028256124e-06, "loss": 0.843, "step": 11719 }, { "epoch": 0.27, "learning_rate": 8.543558078507968e-06, "loss": 1.1837, "step": 11720 }, { "epoch": 0.27, "learning_rate": 8.543293108767302e-06, "loss": 1.2195, "step": 11721 }, { "epoch": 0.27, "learning_rate": 8.543028119035615e-06, "loss": 1.0501, "step": 11722 }, { "epoch": 0.27, "learning_rate": 8.542763109314406e-06, "loss": 1.2067, "step": 11723 }, { "epoch": 0.27, "learning_rate": 8.542498079605167e-06, "loss": 1.0135, "step": 11724 }, { "epoch": 0.27, "learning_rate": 8.542233029909395e-06, "loss": 0.885, "step": 11725 }, { "epoch": 0.27, "learning_rate": 8.541967960228586e-06, "loss": 0.9312, "step": 11726 }, { "epoch": 0.27, "learning_rate": 8.541702870564233e-06, "loss": 0.8059, "step": 11727 }, { "epoch": 0.27, "learning_rate": 8.541437760917835e-06, "loss": 1.0162, "step": 11728 }, { "epoch": 0.27, "learning_rate": 8.541172631290886e-06, "loss": 0.9309, "step": 11729 }, { "epoch": 0.27, "learning_rate": 8.540907481684881e-06, "loss": 1.0952, "step": 11730 }, { "epoch": 0.27, "learning_rate": 8.540642312101316e-06, "loss": 1.0038, "step": 11731 }, { "epoch": 0.27, "learning_rate": 8.54037712254169e-06, "loss": 1.1989, "step": 11732 }, { "epoch": 0.27, "learning_rate": 8.540111913007498e-06, "loss": 0.9275, "step": 11733 }, { "epoch": 0.27, "learning_rate": 8.539846683500233e-06, "loss": 0.8696, "step": 11734 }, { "epoch": 0.27, "learning_rate": 8.539581434021395e-06, "loss": 0.8997, "step": 11735 }, { "epoch": 0.27, "learning_rate": 8.539316164572478e-06, "loss": 0.8213, "step": 11736 }, { "epoch": 0.27, "learning_rate": 8.539050875154982e-06, "loss": 1.096, "step": 11737 }, { "epoch": 0.27, "learning_rate": 8.5387855657704e-06, "loss": 0.7523, "step": 11738 }, { "epoch": 0.27, "learning_rate": 8.53852023642023e-06, "loss": 0.7146, "step": 11739 }, { "epoch": 0.27, "learning_rate": 8.538254887105971e-06, "loss": 1.0432, "step": 11740 }, { "epoch": 0.27, "learning_rate": 8.537989517829118e-06, "loss": 0.8014, "step": 11741 }, { "epoch": 0.27, "learning_rate": 8.537724128591169e-06, "loss": 1.0685, "step": 11742 }, { "epoch": 0.27, "learning_rate": 8.537458719393621e-06, "loss": 0.9859, "step": 11743 }, { "epoch": 0.27, "learning_rate": 8.537193290237972e-06, "loss": 1.1719, "step": 11744 }, { "epoch": 0.27, "learning_rate": 8.53692784112572e-06, "loss": 0.8641, "step": 11745 }, { "epoch": 0.27, "learning_rate": 8.536662372058358e-06, "loss": 0.7807, "step": 11746 }, { "epoch": 0.27, "learning_rate": 8.53639688303739e-06, "loss": 1.1313, "step": 11747 }, { "epoch": 0.27, "learning_rate": 8.536131374064311e-06, "loss": 1.2162, "step": 11748 }, { "epoch": 0.27, "learning_rate": 8.535865845140621e-06, "loss": 0.9482, "step": 11749 }, { "epoch": 0.27, "learning_rate": 8.535600296267813e-06, "loss": 1.0586, "step": 11750 }, { "epoch": 0.27, "learning_rate": 8.535334727447391e-06, "loss": 1.034, "step": 11751 }, { "epoch": 0.27, "learning_rate": 8.53506913868085e-06, "loss": 1.126, "step": 11752 }, { "epoch": 0.27, "learning_rate": 8.53480352996969e-06, "loss": 0.968, "step": 11753 }, { "epoch": 0.27, "learning_rate": 8.53453790131541e-06, "loss": 0.8914, "step": 11754 }, { "epoch": 0.27, "learning_rate": 8.534272252719504e-06, "loss": 0.9984, "step": 11755 }, { "epoch": 0.27, "learning_rate": 8.534006584183477e-06, "loss": 0.9604, "step": 11756 }, { "epoch": 0.27, "learning_rate": 8.533740895708826e-06, "loss": 1.08, "step": 11757 }, { "epoch": 0.27, "learning_rate": 8.533475187297047e-06, "loss": 1.1465, "step": 11758 }, { "epoch": 0.27, "learning_rate": 8.533209458949643e-06, "loss": 0.8192, "step": 11759 }, { "epoch": 0.27, "learning_rate": 8.53294371066811e-06, "loss": 1.1666, "step": 11760 }, { "epoch": 0.27, "learning_rate": 8.53267794245395e-06, "loss": 0.7603, "step": 11761 }, { "epoch": 0.27, "learning_rate": 8.532412154308662e-06, "loss": 0.9418, "step": 11762 }, { "epoch": 0.27, "learning_rate": 8.532146346233743e-06, "loss": 0.6971, "step": 11763 }, { "epoch": 0.27, "learning_rate": 8.531880518230697e-06, "loss": 0.637, "step": 11764 }, { "epoch": 0.27, "learning_rate": 8.53161467030102e-06, "loss": 0.8879, "step": 11765 }, { "epoch": 0.27, "learning_rate": 8.531348802446212e-06, "loss": 1.0603, "step": 11766 }, { "epoch": 0.27, "learning_rate": 8.531082914667777e-06, "loss": 0.7864, "step": 11767 }, { "epoch": 0.27, "learning_rate": 8.53081700696721e-06, "loss": 1.2085, "step": 11768 }, { "epoch": 0.27, "learning_rate": 8.530551079346015e-06, "loss": 0.905, "step": 11769 }, { "epoch": 0.27, "learning_rate": 8.530285131805692e-06, "loss": 0.9938, "step": 11770 }, { "epoch": 0.27, "learning_rate": 8.530019164347738e-06, "loss": 0.8588, "step": 11771 }, { "epoch": 0.27, "learning_rate": 8.529753176973656e-06, "loss": 0.9781, "step": 11772 }, { "epoch": 0.27, "learning_rate": 8.52948716968495e-06, "loss": 1.0376, "step": 11773 }, { "epoch": 0.27, "learning_rate": 8.529221142483112e-06, "loss": 1.2195, "step": 11774 }, { "epoch": 0.27, "learning_rate": 8.528955095369653e-06, "loss": 0.8604, "step": 11775 }, { "epoch": 0.27, "learning_rate": 8.528689028346066e-06, "loss": 0.7689, "step": 11776 }, { "epoch": 0.27, "learning_rate": 8.528422941413859e-06, "loss": 1.0808, "step": 11777 }, { "epoch": 0.27, "learning_rate": 8.528156834574528e-06, "loss": 0.9351, "step": 11778 }, { "epoch": 0.27, "learning_rate": 8.527890707829575e-06, "loss": 1.0471, "step": 11779 }, { "epoch": 0.27, "learning_rate": 8.527624561180505e-06, "loss": 1.0787, "step": 11780 }, { "epoch": 0.27, "learning_rate": 8.527358394628816e-06, "loss": 1.0474, "step": 11781 }, { "epoch": 0.27, "learning_rate": 8.52709220817601e-06, "loss": 1.2113, "step": 11782 }, { "epoch": 0.27, "learning_rate": 8.526826001823591e-06, "loss": 1.1081, "step": 11783 }, { "epoch": 0.27, "learning_rate": 8.52655977557306e-06, "loss": 0.9822, "step": 11784 }, { "epoch": 0.27, "learning_rate": 8.526293529425917e-06, "loss": 0.7885, "step": 11785 }, { "epoch": 0.27, "learning_rate": 8.526027263383667e-06, "loss": 0.9942, "step": 11786 }, { "epoch": 0.27, "learning_rate": 8.52576097744781e-06, "loss": 1.0324, "step": 11787 }, { "epoch": 0.27, "learning_rate": 8.52549467161985e-06, "loss": 0.7177, "step": 11788 }, { "epoch": 0.27, "learning_rate": 8.525228345901289e-06, "loss": 0.9643, "step": 11789 }, { "epoch": 0.27, "learning_rate": 8.524962000293629e-06, "loss": 0.9298, "step": 11790 }, { "epoch": 0.27, "learning_rate": 8.524695634798374e-06, "loss": 1.0869, "step": 11791 }, { "epoch": 0.27, "learning_rate": 8.524429249417025e-06, "loss": 0.9841, "step": 11792 }, { "epoch": 0.27, "learning_rate": 8.524162844151085e-06, "loss": 0.9344, "step": 11793 }, { "epoch": 0.27, "learning_rate": 8.52389641900206e-06, "loss": 0.9935, "step": 11794 }, { "epoch": 0.27, "learning_rate": 8.523629973971451e-06, "loss": 0.7786, "step": 11795 }, { "epoch": 0.27, "learning_rate": 8.523363509060761e-06, "loss": 1.0424, "step": 11796 }, { "epoch": 0.27, "learning_rate": 8.523097024271494e-06, "loss": 1.2348, "step": 11797 }, { "epoch": 0.27, "learning_rate": 8.522830519605153e-06, "loss": 0.9111, "step": 11798 }, { "epoch": 0.27, "learning_rate": 8.52256399506324e-06, "loss": 1.1011, "step": 11799 }, { "epoch": 0.27, "learning_rate": 8.522297450647262e-06, "loss": 1.0868, "step": 11800 }, { "epoch": 0.27, "learning_rate": 8.522030886358721e-06, "loss": 1.1849, "step": 11801 }, { "epoch": 0.27, "learning_rate": 8.521764302199123e-06, "loss": 1.2569, "step": 11802 }, { "epoch": 0.27, "learning_rate": 8.52149769816997e-06, "loss": 1.1192, "step": 11803 }, { "epoch": 0.27, "learning_rate": 8.521231074272764e-06, "loss": 0.8306, "step": 11804 }, { "epoch": 0.27, "learning_rate": 8.520964430509014e-06, "loss": 0.857, "step": 11805 }, { "epoch": 0.27, "learning_rate": 8.520697766880222e-06, "loss": 1.0354, "step": 11806 }, { "epoch": 0.27, "learning_rate": 8.520431083387892e-06, "loss": 1.0838, "step": 11807 }, { "epoch": 0.27, "learning_rate": 8.520164380033529e-06, "loss": 1.0605, "step": 11808 }, { "epoch": 0.27, "learning_rate": 8.519897656818639e-06, "loss": 1.0482, "step": 11809 }, { "epoch": 0.27, "learning_rate": 8.519630913744726e-06, "loss": 0.9266, "step": 11810 }, { "epoch": 0.27, "learning_rate": 8.519364150813295e-06, "loss": 1.1546, "step": 11811 }, { "epoch": 0.27, "learning_rate": 8.519097368025849e-06, "loss": 1.1633, "step": 11812 }, { "epoch": 0.27, "learning_rate": 8.518830565383895e-06, "loss": 1.0956, "step": 11813 }, { "epoch": 0.27, "learning_rate": 8.51856374288894e-06, "loss": 0.9794, "step": 11814 }, { "epoch": 0.27, "learning_rate": 8.518296900542487e-06, "loss": 1.0029, "step": 11815 }, { "epoch": 0.27, "learning_rate": 8.518030038346043e-06, "loss": 0.7993, "step": 11816 }, { "epoch": 0.27, "learning_rate": 8.517763156301111e-06, "loss": 0.881, "step": 11817 }, { "epoch": 0.27, "learning_rate": 8.5174962544092e-06, "loss": 0.9428, "step": 11818 }, { "epoch": 0.27, "learning_rate": 8.517229332671815e-06, "loss": 0.9666, "step": 11819 }, { "epoch": 0.27, "learning_rate": 8.51696239109046e-06, "loss": 1.1216, "step": 11820 }, { "epoch": 0.27, "learning_rate": 8.516695429666643e-06, "loss": 1.0864, "step": 11821 }, { "epoch": 0.27, "learning_rate": 8.516428448401868e-06, "loss": 0.8644, "step": 11822 }, { "epoch": 0.27, "learning_rate": 8.516161447297647e-06, "loss": 1.0144, "step": 11823 }, { "epoch": 0.27, "learning_rate": 8.515894426355479e-06, "loss": 1.1903, "step": 11824 }, { "epoch": 0.27, "learning_rate": 8.515627385576873e-06, "loss": 0.9919, "step": 11825 }, { "epoch": 0.27, "learning_rate": 8.515360324963337e-06, "loss": 0.9713, "step": 11826 }, { "epoch": 0.27, "learning_rate": 8.515093244516379e-06, "loss": 0.9046, "step": 11827 }, { "epoch": 0.27, "learning_rate": 8.514826144237503e-06, "loss": 0.8662, "step": 11828 }, { "epoch": 0.27, "learning_rate": 8.514559024128217e-06, "loss": 0.761, "step": 11829 }, { "epoch": 0.27, "learning_rate": 8.514291884190027e-06, "loss": 1.1161, "step": 11830 }, { "epoch": 0.27, "learning_rate": 8.514024724424443e-06, "loss": 0.9502, "step": 11831 }, { "epoch": 0.27, "learning_rate": 8.51375754483297e-06, "loss": 1.0691, "step": 11832 }, { "epoch": 0.27, "learning_rate": 8.513490345417115e-06, "loss": 1.0527, "step": 11833 }, { "epoch": 0.27, "learning_rate": 8.513223126178386e-06, "loss": 0.8438, "step": 11834 }, { "epoch": 0.27, "learning_rate": 8.512955887118293e-06, "loss": 0.8176, "step": 11835 }, { "epoch": 0.27, "learning_rate": 8.512688628238341e-06, "loss": 1.1335, "step": 11836 }, { "epoch": 0.27, "learning_rate": 8.51242134954004e-06, "loss": 1.0015, "step": 11837 }, { "epoch": 0.27, "learning_rate": 8.512154051024894e-06, "loss": 0.9692, "step": 11838 }, { "epoch": 0.27, "learning_rate": 8.511886732694417e-06, "loss": 1.0063, "step": 11839 }, { "epoch": 0.27, "learning_rate": 8.511619394550112e-06, "loss": 1.2649, "step": 11840 }, { "epoch": 0.27, "learning_rate": 8.511352036593488e-06, "loss": 0.7989, "step": 11841 }, { "epoch": 0.27, "learning_rate": 8.511084658826057e-06, "loss": 0.8144, "step": 11842 }, { "epoch": 0.27, "learning_rate": 8.510817261249325e-06, "loss": 0.9422, "step": 11843 }, { "epoch": 0.27, "learning_rate": 8.5105498438648e-06, "loss": 0.9476, "step": 11844 }, { "epoch": 0.27, "learning_rate": 8.51028240667399e-06, "loss": 0.7999, "step": 11845 }, { "epoch": 0.27, "learning_rate": 8.510014949678407e-06, "loss": 1.1169, "step": 11846 }, { "epoch": 0.27, "learning_rate": 8.50974747287956e-06, "loss": 0.6305, "step": 11847 }, { "epoch": 0.27, "learning_rate": 8.509479976278953e-06, "loss": 0.8881, "step": 11848 }, { "epoch": 0.27, "learning_rate": 8.509212459878101e-06, "loss": 0.871, "step": 11849 }, { "epoch": 0.27, "learning_rate": 8.508944923678512e-06, "loss": 0.8345, "step": 11850 }, { "epoch": 0.27, "learning_rate": 8.508677367681692e-06, "loss": 0.9579, "step": 11851 }, { "epoch": 0.27, "learning_rate": 8.508409791889154e-06, "loss": 0.8759, "step": 11852 }, { "epoch": 0.27, "learning_rate": 8.508142196302407e-06, "loss": 1.0853, "step": 11853 }, { "epoch": 0.27, "learning_rate": 8.507874580922958e-06, "loss": 0.8448, "step": 11854 }, { "epoch": 0.27, "learning_rate": 8.507606945752323e-06, "loss": 1.1172, "step": 11855 }, { "epoch": 0.27, "learning_rate": 8.507339290792005e-06, "loss": 1.2386, "step": 11856 }, { "epoch": 0.27, "learning_rate": 8.507071616043518e-06, "loss": 0.8747, "step": 11857 }, { "epoch": 0.28, "learning_rate": 8.506803921508373e-06, "loss": 0.9723, "step": 11858 }, { "epoch": 0.28, "learning_rate": 8.506536207188078e-06, "loss": 1.0243, "step": 11859 }, { "epoch": 0.28, "learning_rate": 8.506268473084145e-06, "loss": 0.8783, "step": 11860 }, { "epoch": 0.28, "learning_rate": 8.506000719198082e-06, "loss": 0.983, "step": 11861 }, { "epoch": 0.28, "learning_rate": 8.505732945531401e-06, "loss": 1.0828, "step": 11862 }, { "epoch": 0.28, "learning_rate": 8.505465152085617e-06, "loss": 0.9012, "step": 11863 }, { "epoch": 0.28, "learning_rate": 8.505197338862234e-06, "loss": 0.9401, "step": 11864 }, { "epoch": 0.28, "learning_rate": 8.504929505862767e-06, "loss": 0.9596, "step": 11865 }, { "epoch": 0.28, "learning_rate": 8.504661653088725e-06, "loss": 0.8764, "step": 11866 }, { "epoch": 0.28, "learning_rate": 8.504393780541622e-06, "loss": 0.917, "step": 11867 }, { "epoch": 0.28, "learning_rate": 8.504125888222966e-06, "loss": 0.9525, "step": 11868 }, { "epoch": 0.28, "learning_rate": 8.503857976134271e-06, "loss": 1.1751, "step": 11869 }, { "epoch": 0.28, "learning_rate": 8.503590044277048e-06, "loss": 1.0806, "step": 11870 }, { "epoch": 0.28, "learning_rate": 8.503322092652808e-06, "loss": 0.7203, "step": 11871 }, { "epoch": 0.28, "learning_rate": 8.503054121263062e-06, "loss": 0.884, "step": 11872 }, { "epoch": 0.28, "learning_rate": 8.502786130109324e-06, "loss": 1.0812, "step": 11873 }, { "epoch": 0.28, "learning_rate": 8.502518119193104e-06, "loss": 1.107, "step": 11874 }, { "epoch": 0.28, "learning_rate": 8.502250088515915e-06, "loss": 1.3359, "step": 11875 }, { "epoch": 0.28, "learning_rate": 8.50198203807927e-06, "loss": 0.7995, "step": 11876 }, { "epoch": 0.28, "learning_rate": 8.501713967884682e-06, "loss": 1.1943, "step": 11877 }, { "epoch": 0.28, "learning_rate": 8.50144587793366e-06, "loss": 1.04, "step": 11878 }, { "epoch": 0.28, "learning_rate": 8.501177768227719e-06, "loss": 0.9134, "step": 11879 }, { "epoch": 0.28, "learning_rate": 8.50090963876837e-06, "loss": 0.9105, "step": 11880 }, { "epoch": 0.28, "learning_rate": 8.500641489557129e-06, "loss": 0.6211, "step": 11881 }, { "epoch": 0.28, "learning_rate": 8.500373320595506e-06, "loss": 0.8125, "step": 11882 }, { "epoch": 0.28, "learning_rate": 8.500105131885014e-06, "loss": 1.1665, "step": 11883 }, { "epoch": 0.28, "learning_rate": 8.499836923427167e-06, "loss": 1.2113, "step": 11884 }, { "epoch": 0.28, "learning_rate": 8.49956869522348e-06, "loss": 1.0149, "step": 11885 }, { "epoch": 0.28, "learning_rate": 8.499300447275463e-06, "loss": 0.7353, "step": 11886 }, { "epoch": 0.28, "learning_rate": 8.499032179584633e-06, "loss": 0.9645, "step": 11887 }, { "epoch": 0.28, "learning_rate": 8.498763892152498e-06, "loss": 1.1015, "step": 11888 }, { "epoch": 0.28, "learning_rate": 8.498495584980575e-06, "loss": 1.088, "step": 11889 }, { "epoch": 0.28, "learning_rate": 8.498227258070381e-06, "loss": 1.0809, "step": 11890 }, { "epoch": 0.28, "learning_rate": 8.497958911423425e-06, "loss": 0.9876, "step": 11891 }, { "epoch": 0.28, "learning_rate": 8.497690545041223e-06, "loss": 0.87, "step": 11892 }, { "epoch": 0.28, "learning_rate": 8.49742215892529e-06, "loss": 0.9262, "step": 11893 }, { "epoch": 0.28, "learning_rate": 8.497153753077136e-06, "loss": 1.1907, "step": 11894 }, { "epoch": 0.28, "learning_rate": 8.496885327498281e-06, "loss": 0.7889, "step": 11895 }, { "epoch": 0.28, "learning_rate": 8.496616882190237e-06, "loss": 0.9094, "step": 11896 }, { "epoch": 0.28, "learning_rate": 8.49634841715452e-06, "loss": 1.1205, "step": 11897 }, { "epoch": 0.28, "learning_rate": 8.496079932392637e-06, "loss": 1.2068, "step": 11898 }, { "epoch": 0.28, "learning_rate": 8.495811427906114e-06, "loss": 1.0281, "step": 11899 }, { "epoch": 0.28, "learning_rate": 8.495542903696458e-06, "loss": 0.9506, "step": 11900 }, { "epoch": 0.28, "learning_rate": 8.495274359765188e-06, "loss": 1.0606, "step": 11901 }, { "epoch": 0.28, "learning_rate": 8.49500579611382e-06, "loss": 0.7836, "step": 11902 }, { "epoch": 0.28, "learning_rate": 8.494737212743864e-06, "loss": 0.9064, "step": 11903 }, { "epoch": 0.28, "learning_rate": 8.49446860965684e-06, "loss": 0.9486, "step": 11904 }, { "epoch": 0.28, "learning_rate": 8.49419998685426e-06, "loss": 0.8625, "step": 11905 }, { "epoch": 0.28, "learning_rate": 8.493931344337643e-06, "loss": 1.0296, "step": 11906 }, { "epoch": 0.28, "learning_rate": 8.493662682108501e-06, "loss": 0.7683, "step": 11907 }, { "epoch": 0.28, "learning_rate": 8.493394000168354e-06, "loss": 0.9676, "step": 11908 }, { "epoch": 0.28, "learning_rate": 8.493125298518714e-06, "loss": 0.8108, "step": 11909 }, { "epoch": 0.28, "learning_rate": 8.4928565771611e-06, "loss": 0.8876, "step": 11910 }, { "epoch": 0.28, "learning_rate": 8.492587836097025e-06, "loss": 1.0474, "step": 11911 }, { "epoch": 0.28, "learning_rate": 8.49231907532801e-06, "loss": 0.8009, "step": 11912 }, { "epoch": 0.28, "learning_rate": 8.492050294855567e-06, "loss": 1.1537, "step": 11913 }, { "epoch": 0.28, "learning_rate": 8.491781494681212e-06, "loss": 0.9135, "step": 11914 }, { "epoch": 0.28, "learning_rate": 8.491512674806466e-06, "loss": 1.3407, "step": 11915 }, { "epoch": 0.28, "learning_rate": 8.49124383523284e-06, "loss": 1.0711, "step": 11916 }, { "epoch": 0.28, "learning_rate": 8.490974975961856e-06, "loss": 0.9459, "step": 11917 }, { "epoch": 0.28, "learning_rate": 8.490706096995027e-06, "loss": 0.97, "step": 11918 }, { "epoch": 0.28, "learning_rate": 8.490437198333875e-06, "loss": 1.1172, "step": 11919 }, { "epoch": 0.28, "learning_rate": 8.49016827997991e-06, "loss": 1.2528, "step": 11920 }, { "epoch": 0.28, "learning_rate": 8.489899341934655e-06, "loss": 0.9313, "step": 11921 }, { "epoch": 0.28, "learning_rate": 8.489630384199625e-06, "loss": 0.9308, "step": 11922 }, { "epoch": 0.28, "learning_rate": 8.489361406776337e-06, "loss": 0.8105, "step": 11923 }, { "epoch": 0.28, "learning_rate": 8.489092409666309e-06, "loss": 0.9109, "step": 11924 }, { "epoch": 0.28, "learning_rate": 8.488823392871059e-06, "loss": 0.8405, "step": 11925 }, { "epoch": 0.28, "learning_rate": 8.488554356392107e-06, "loss": 1.2133, "step": 11926 }, { "epoch": 0.28, "learning_rate": 8.488285300230966e-06, "loss": 0.8234, "step": 11927 }, { "epoch": 0.28, "learning_rate": 8.488016224389158e-06, "loss": 1.0255, "step": 11928 }, { "epoch": 0.28, "learning_rate": 8.4877471288682e-06, "loss": 0.9265, "step": 11929 }, { "epoch": 0.28, "learning_rate": 8.487478013669609e-06, "loss": 0.7051, "step": 11930 }, { "epoch": 0.28, "learning_rate": 8.487208878794903e-06, "loss": 0.9545, "step": 11931 }, { "epoch": 0.28, "learning_rate": 8.486939724245605e-06, "loss": 0.9999, "step": 11932 }, { "epoch": 0.28, "learning_rate": 8.486670550023227e-06, "loss": 1.0519, "step": 11933 }, { "epoch": 0.28, "learning_rate": 8.486401356129292e-06, "loss": 0.9877, "step": 11934 }, { "epoch": 0.28, "learning_rate": 8.486132142565319e-06, "loss": 1.0001, "step": 11935 }, { "epoch": 0.28, "learning_rate": 8.485862909332824e-06, "loss": 1.129, "step": 11936 }, { "epoch": 0.28, "learning_rate": 8.485593656433329e-06, "loss": 0.9613, "step": 11937 }, { "epoch": 0.28, "learning_rate": 8.485324383868351e-06, "loss": 0.7839, "step": 11938 }, { "epoch": 0.28, "learning_rate": 8.48505509163941e-06, "loss": 0.8497, "step": 11939 }, { "epoch": 0.28, "learning_rate": 8.484785779748024e-06, "loss": 1.2481, "step": 11940 }, { "epoch": 0.28, "learning_rate": 8.484516448195716e-06, "loss": 0.7942, "step": 11941 }, { "epoch": 0.28, "learning_rate": 8.484247096984001e-06, "loss": 0.9695, "step": 11942 }, { "epoch": 0.28, "learning_rate": 8.483977726114402e-06, "loss": 0.7096, "step": 11943 }, { "epoch": 0.28, "learning_rate": 8.483708335588438e-06, "loss": 0.9236, "step": 11944 }, { "epoch": 0.28, "learning_rate": 8.483438925407628e-06, "loss": 0.925, "step": 11945 }, { "epoch": 0.28, "learning_rate": 8.483169495573492e-06, "loss": 1.0044, "step": 11946 }, { "epoch": 0.28, "learning_rate": 8.48290004608755e-06, "loss": 0.8663, "step": 11947 }, { "epoch": 0.28, "learning_rate": 8.482630576951325e-06, "loss": 1.011, "step": 11948 }, { "epoch": 0.28, "learning_rate": 8.482361088166335e-06, "loss": 0.9752, "step": 11949 }, { "epoch": 0.28, "learning_rate": 8.4820915797341e-06, "loss": 0.8004, "step": 11950 }, { "epoch": 0.28, "learning_rate": 8.48182205165614e-06, "loss": 1.1185, "step": 11951 }, { "epoch": 0.28, "learning_rate": 8.481552503933979e-06, "loss": 0.8892, "step": 11952 }, { "epoch": 0.28, "learning_rate": 8.481282936569133e-06, "loss": 0.8752, "step": 11953 }, { "epoch": 0.28, "learning_rate": 8.481013349563128e-06, "loss": 0.6404, "step": 11954 }, { "epoch": 0.28, "learning_rate": 8.48074374291748e-06, "loss": 0.8137, "step": 11955 }, { "epoch": 0.28, "learning_rate": 8.480474116633715e-06, "loss": 1.0567, "step": 11956 }, { "epoch": 0.28, "learning_rate": 8.48020447071335e-06, "loss": 0.8217, "step": 11957 }, { "epoch": 0.28, "learning_rate": 8.47993480515791e-06, "loss": 0.9395, "step": 11958 }, { "epoch": 0.28, "learning_rate": 8.479665119968912e-06, "loss": 1.2045, "step": 11959 }, { "epoch": 0.28, "learning_rate": 8.479395415147881e-06, "loss": 1.095, "step": 11960 }, { "epoch": 0.28, "learning_rate": 8.479125690696339e-06, "loss": 0.9978, "step": 11961 }, { "epoch": 0.28, "learning_rate": 8.478855946615805e-06, "loss": 0.888, "step": 11962 }, { "epoch": 0.28, "learning_rate": 8.478586182907804e-06, "loss": 0.9062, "step": 11963 }, { "epoch": 0.28, "learning_rate": 8.478316399573854e-06, "loss": 0.9779, "step": 11964 }, { "epoch": 0.28, "learning_rate": 8.47804659661548e-06, "loss": 0.908, "step": 11965 }, { "epoch": 0.28, "learning_rate": 8.477776774034206e-06, "loss": 1.063, "step": 11966 }, { "epoch": 0.28, "learning_rate": 8.47750693183155e-06, "loss": 0.8665, "step": 11967 }, { "epoch": 0.28, "learning_rate": 8.477237070009037e-06, "loss": 0.8137, "step": 11968 }, { "epoch": 0.28, "learning_rate": 8.476967188568187e-06, "loss": 1.2045, "step": 11969 }, { "epoch": 0.28, "learning_rate": 8.476697287510528e-06, "loss": 0.7956, "step": 11970 }, { "epoch": 0.28, "learning_rate": 8.476427366837579e-06, "loss": 1.1139, "step": 11971 }, { "epoch": 0.28, "learning_rate": 8.476157426550862e-06, "loss": 1.0567, "step": 11972 }, { "epoch": 0.28, "learning_rate": 8.4758874666519e-06, "loss": 0.9722, "step": 11973 }, { "epoch": 0.28, "learning_rate": 8.47561748714222e-06, "loss": 1.0038, "step": 11974 }, { "epoch": 0.28, "learning_rate": 8.47534748802334e-06, "loss": 1.1021, "step": 11975 }, { "epoch": 0.28, "learning_rate": 8.475077469296788e-06, "loss": 0.9721, "step": 11976 }, { "epoch": 0.28, "learning_rate": 8.474807430964085e-06, "loss": 0.91, "step": 11977 }, { "epoch": 0.28, "learning_rate": 8.474537373026755e-06, "loss": 0.7277, "step": 11978 }, { "epoch": 0.28, "learning_rate": 8.47426729548632e-06, "loss": 1.2044, "step": 11979 }, { "epoch": 0.28, "learning_rate": 8.473997198344305e-06, "loss": 0.9901, "step": 11980 }, { "epoch": 0.28, "learning_rate": 8.473727081602235e-06, "loss": 0.9051, "step": 11981 }, { "epoch": 0.28, "learning_rate": 8.473456945261633e-06, "loss": 0.7966, "step": 11982 }, { "epoch": 0.28, "learning_rate": 8.473186789324024e-06, "loss": 1.1092, "step": 11983 }, { "epoch": 0.28, "learning_rate": 8.472916613790931e-06, "loss": 0.7303, "step": 11984 }, { "epoch": 0.28, "learning_rate": 8.47264641866388e-06, "loss": 0.8856, "step": 11985 }, { "epoch": 0.28, "learning_rate": 8.47237620394439e-06, "loss": 0.8754, "step": 11986 }, { "epoch": 0.28, "learning_rate": 8.472105969633992e-06, "loss": 1.0694, "step": 11987 }, { "epoch": 0.28, "learning_rate": 8.471835715734209e-06, "loss": 0.9714, "step": 11988 }, { "epoch": 0.28, "learning_rate": 8.471565442246565e-06, "loss": 0.801, "step": 11989 }, { "epoch": 0.28, "learning_rate": 8.471295149172584e-06, "loss": 0.9219, "step": 11990 }, { "epoch": 0.28, "learning_rate": 8.471024836513792e-06, "loss": 1.0164, "step": 11991 }, { "epoch": 0.28, "learning_rate": 8.470754504271715e-06, "loss": 1.0039, "step": 11992 }, { "epoch": 0.28, "learning_rate": 8.470484152447878e-06, "loss": 1.0558, "step": 11993 }, { "epoch": 0.28, "learning_rate": 8.470213781043801e-06, "loss": 0.7579, "step": 11994 }, { "epoch": 0.28, "learning_rate": 8.46994339006102e-06, "loss": 0.8249, "step": 11995 }, { "epoch": 0.28, "learning_rate": 8.46967297950105e-06, "loss": 0.8247, "step": 11996 }, { "epoch": 0.28, "learning_rate": 8.469402549365421e-06, "loss": 0.7478, "step": 11997 }, { "epoch": 0.28, "learning_rate": 8.469132099655662e-06, "loss": 1.1746, "step": 11998 }, { "epoch": 0.28, "learning_rate": 8.468861630373293e-06, "loss": 1.2767, "step": 11999 }, { "epoch": 0.28, "learning_rate": 8.468591141519843e-06, "loss": 1.0246, "step": 12000 }, { "epoch": 0.28, "learning_rate": 8.468320633096838e-06, "loss": 0.8042, "step": 12001 }, { "epoch": 0.28, "learning_rate": 8.468050105105805e-06, "loss": 0.8355, "step": 12002 }, { "epoch": 0.28, "learning_rate": 8.467779557548268e-06, "loss": 0.9851, "step": 12003 }, { "epoch": 0.28, "learning_rate": 8.467508990425754e-06, "loss": 0.6598, "step": 12004 }, { "epoch": 0.28, "learning_rate": 8.467238403739792e-06, "loss": 0.842, "step": 12005 }, { "epoch": 0.28, "learning_rate": 8.466967797491906e-06, "loss": 1.1367, "step": 12006 }, { "epoch": 0.28, "learning_rate": 8.466697171683624e-06, "loss": 1.1261, "step": 12007 }, { "epoch": 0.28, "learning_rate": 8.466426526316472e-06, "loss": 0.9645, "step": 12008 }, { "epoch": 0.28, "learning_rate": 8.466155861391976e-06, "loss": 1.1097, "step": 12009 }, { "epoch": 0.28, "learning_rate": 8.465885176911666e-06, "loss": 1.0274, "step": 12010 }, { "epoch": 0.28, "learning_rate": 8.465614472877067e-06, "loss": 1.2033, "step": 12011 }, { "epoch": 0.28, "learning_rate": 8.465343749289707e-06, "loss": 0.847, "step": 12012 }, { "epoch": 0.28, "learning_rate": 8.465073006151112e-06, "loss": 1.1966, "step": 12013 }, { "epoch": 0.28, "learning_rate": 8.464802243462812e-06, "loss": 1.073, "step": 12014 }, { "epoch": 0.28, "learning_rate": 8.464531461226335e-06, "loss": 1.2968, "step": 12015 }, { "epoch": 0.28, "learning_rate": 8.464260659443205e-06, "loss": 1.0419, "step": 12016 }, { "epoch": 0.28, "learning_rate": 8.463989838114953e-06, "loss": 0.8484, "step": 12017 }, { "epoch": 0.28, "learning_rate": 8.463718997243105e-06, "loss": 1.1589, "step": 12018 }, { "epoch": 0.28, "learning_rate": 8.463448136829188e-06, "loss": 1.0356, "step": 12019 }, { "epoch": 0.28, "learning_rate": 8.463177256874738e-06, "loss": 0.8156, "step": 12020 }, { "epoch": 0.28, "learning_rate": 8.462906357381272e-06, "loss": 0.7554, "step": 12021 }, { "epoch": 0.28, "learning_rate": 8.462635438350326e-06, "loss": 0.7228, "step": 12022 }, { "epoch": 0.28, "learning_rate": 8.462364499783427e-06, "loss": 0.9789, "step": 12023 }, { "epoch": 0.28, "learning_rate": 8.462093541682102e-06, "loss": 0.9108, "step": 12024 }, { "epoch": 0.28, "learning_rate": 8.461822564047882e-06, "loss": 0.7754, "step": 12025 }, { "epoch": 0.28, "learning_rate": 8.461551566882294e-06, "loss": 0.8744, "step": 12026 }, { "epoch": 0.28, "learning_rate": 8.461280550186866e-06, "loss": 0.8028, "step": 12027 }, { "epoch": 0.28, "learning_rate": 8.46100951396313e-06, "loss": 1.0059, "step": 12028 }, { "epoch": 0.28, "learning_rate": 8.460738458212614e-06, "loss": 0.7586, "step": 12029 }, { "epoch": 0.28, "learning_rate": 8.460467382936846e-06, "loss": 0.6952, "step": 12030 }, { "epoch": 0.28, "learning_rate": 8.460196288137357e-06, "loss": 1.0458, "step": 12031 }, { "epoch": 0.28, "learning_rate": 8.459925173815676e-06, "loss": 1.1688, "step": 12032 }, { "epoch": 0.28, "learning_rate": 8.459654039973334e-06, "loss": 1.055, "step": 12033 }, { "epoch": 0.28, "learning_rate": 8.459382886611856e-06, "loss": 0.8704, "step": 12034 }, { "epoch": 0.28, "learning_rate": 8.459111713732777e-06, "loss": 1.0234, "step": 12035 }, { "epoch": 0.28, "learning_rate": 8.458840521337624e-06, "loss": 0.8965, "step": 12036 }, { "epoch": 0.28, "learning_rate": 8.458569309427928e-06, "loss": 0.8014, "step": 12037 }, { "epoch": 0.28, "learning_rate": 8.458298078005222e-06, "loss": 0.7992, "step": 12038 }, { "epoch": 0.28, "learning_rate": 8.45802682707103e-06, "loss": 1.0747, "step": 12039 }, { "epoch": 0.28, "learning_rate": 8.457755556626887e-06, "loss": 0.8053, "step": 12040 }, { "epoch": 0.28, "learning_rate": 8.457484266674323e-06, "loss": 1.0575, "step": 12041 }, { "epoch": 0.28, "learning_rate": 8.457212957214868e-06, "loss": 0.9016, "step": 12042 }, { "epoch": 0.28, "learning_rate": 8.456941628250054e-06, "loss": 0.8635, "step": 12043 }, { "epoch": 0.28, "learning_rate": 8.456670279781408e-06, "loss": 0.7843, "step": 12044 }, { "epoch": 0.28, "learning_rate": 8.456398911810463e-06, "loss": 0.9034, "step": 12045 }, { "epoch": 0.28, "learning_rate": 8.45612752433875e-06, "loss": 1.0151, "step": 12046 }, { "epoch": 0.28, "learning_rate": 8.455856117367805e-06, "loss": 1.0222, "step": 12047 }, { "epoch": 0.28, "learning_rate": 8.45558469089915e-06, "loss": 1.0275, "step": 12048 }, { "epoch": 0.28, "learning_rate": 8.455313244934324e-06, "loss": 1.0594, "step": 12049 }, { "epoch": 0.28, "learning_rate": 8.455041779474855e-06, "loss": 0.9115, "step": 12050 }, { "epoch": 0.28, "learning_rate": 8.454770294522274e-06, "loss": 1.0122, "step": 12051 }, { "epoch": 0.28, "learning_rate": 8.454498790078116e-06, "loss": 1.0178, "step": 12052 }, { "epoch": 0.28, "learning_rate": 8.45422726614391e-06, "loss": 0.9996, "step": 12053 }, { "epoch": 0.28, "learning_rate": 8.45395572272119e-06, "loss": 0.8403, "step": 12054 }, { "epoch": 0.28, "learning_rate": 8.453684159811485e-06, "loss": 0.7234, "step": 12055 }, { "epoch": 0.28, "learning_rate": 8.453412577416328e-06, "loss": 0.9336, "step": 12056 }, { "epoch": 0.28, "learning_rate": 8.453140975537256e-06, "loss": 0.8755, "step": 12057 }, { "epoch": 0.28, "learning_rate": 8.452869354175794e-06, "loss": 0.9762, "step": 12058 }, { "epoch": 0.28, "learning_rate": 8.452597713333478e-06, "loss": 0.8433, "step": 12059 }, { "epoch": 0.28, "learning_rate": 8.452326053011843e-06, "loss": 0.9715, "step": 12060 }, { "epoch": 0.28, "learning_rate": 8.452054373212418e-06, "loss": 0.9469, "step": 12061 }, { "epoch": 0.28, "learning_rate": 8.451782673936737e-06, "loss": 0.8915, "step": 12062 }, { "epoch": 0.28, "learning_rate": 8.45151095518633e-06, "loss": 1.0613, "step": 12063 }, { "epoch": 0.28, "learning_rate": 8.451239216962737e-06, "loss": 0.9478, "step": 12064 }, { "epoch": 0.28, "learning_rate": 8.450967459267487e-06, "loss": 1.1297, "step": 12065 }, { "epoch": 0.28, "learning_rate": 8.450695682102112e-06, "loss": 0.9436, "step": 12066 }, { "epoch": 0.28, "learning_rate": 8.450423885468147e-06, "loss": 1.1477, "step": 12067 }, { "epoch": 0.28, "learning_rate": 8.450152069367124e-06, "loss": 0.5919, "step": 12068 }, { "epoch": 0.28, "learning_rate": 8.449880233800577e-06, "loss": 1.0063, "step": 12069 }, { "epoch": 0.28, "learning_rate": 8.449608378770044e-06, "loss": 0.6891, "step": 12070 }, { "epoch": 0.28, "learning_rate": 8.449336504277053e-06, "loss": 1.0921, "step": 12071 }, { "epoch": 0.28, "learning_rate": 8.44906461032314e-06, "loss": 1.0386, "step": 12072 }, { "epoch": 0.28, "learning_rate": 8.44879269690984e-06, "loss": 0.7575, "step": 12073 }, { "epoch": 0.28, "learning_rate": 8.448520764038686e-06, "loss": 1.063, "step": 12074 }, { "epoch": 0.28, "learning_rate": 8.44824881171121e-06, "loss": 1.0473, "step": 12075 }, { "epoch": 0.28, "learning_rate": 8.447976839928954e-06, "loss": 1.0623, "step": 12076 }, { "epoch": 0.28, "learning_rate": 8.447704848693442e-06, "loss": 0.9582, "step": 12077 }, { "epoch": 0.28, "learning_rate": 8.447432838006216e-06, "loss": 1.1208, "step": 12078 }, { "epoch": 0.28, "learning_rate": 8.447160807868808e-06, "loss": 1.1602, "step": 12079 }, { "epoch": 0.28, "learning_rate": 8.446888758282754e-06, "loss": 1.036, "step": 12080 }, { "epoch": 0.28, "learning_rate": 8.446616689249586e-06, "loss": 0.8672, "step": 12081 }, { "epoch": 0.28, "learning_rate": 8.446344600770843e-06, "loss": 1.0507, "step": 12082 }, { "epoch": 0.28, "learning_rate": 8.446072492848057e-06, "loss": 1.0338, "step": 12083 }, { "epoch": 0.28, "learning_rate": 8.445800365482766e-06, "loss": 0.8648, "step": 12084 }, { "epoch": 0.28, "learning_rate": 8.445528218676503e-06, "loss": 0.9401, "step": 12085 }, { "epoch": 0.28, "learning_rate": 8.445256052430804e-06, "loss": 0.9133, "step": 12086 }, { "epoch": 0.28, "learning_rate": 8.444983866747204e-06, "loss": 1.0169, "step": 12087 }, { "epoch": 0.28, "learning_rate": 8.444711661627238e-06, "loss": 1.2164, "step": 12088 }, { "epoch": 0.28, "learning_rate": 8.444439437072447e-06, "loss": 1.101, "step": 12089 }, { "epoch": 0.28, "learning_rate": 8.44416719308436e-06, "loss": 1.1934, "step": 12090 }, { "epoch": 0.28, "learning_rate": 8.443894929664517e-06, "loss": 0.9678, "step": 12091 }, { "epoch": 0.28, "learning_rate": 8.443622646814454e-06, "loss": 1.1146, "step": 12092 }, { "epoch": 0.28, "learning_rate": 8.443350344535704e-06, "loss": 0.8853, "step": 12093 }, { "epoch": 0.28, "learning_rate": 8.443078022829808e-06, "loss": 0.9604, "step": 12094 }, { "epoch": 0.28, "learning_rate": 8.442805681698298e-06, "loss": 1.1677, "step": 12095 }, { "epoch": 0.28, "learning_rate": 8.442533321142714e-06, "loss": 0.8888, "step": 12096 }, { "epoch": 0.28, "learning_rate": 8.44226094116459e-06, "loss": 1.0926, "step": 12097 }, { "epoch": 0.28, "learning_rate": 8.441988541765465e-06, "loss": 1.074, "step": 12098 }, { "epoch": 0.28, "learning_rate": 8.441716122946874e-06, "loss": 0.9184, "step": 12099 }, { "epoch": 0.28, "learning_rate": 8.441443684710355e-06, "loss": 1.0088, "step": 12100 }, { "epoch": 0.28, "learning_rate": 8.441171227057445e-06, "loss": 1.2735, "step": 12101 }, { "epoch": 0.28, "learning_rate": 8.440898749989682e-06, "loss": 0.818, "step": 12102 }, { "epoch": 0.28, "learning_rate": 8.440626253508602e-06, "loss": 0.7719, "step": 12103 }, { "epoch": 0.28, "learning_rate": 8.440353737615741e-06, "loss": 0.8854, "step": 12104 }, { "epoch": 0.28, "learning_rate": 8.440081202312639e-06, "loss": 1.1738, "step": 12105 }, { "epoch": 0.28, "learning_rate": 8.439808647600834e-06, "loss": 0.968, "step": 12106 }, { "epoch": 0.28, "learning_rate": 8.43953607348186e-06, "loss": 0.9035, "step": 12107 }, { "epoch": 0.28, "learning_rate": 8.43926347995726e-06, "loss": 0.8406, "step": 12108 }, { "epoch": 0.28, "learning_rate": 8.438990867028569e-06, "loss": 1.1911, "step": 12109 }, { "epoch": 0.28, "learning_rate": 8.438718234697322e-06, "loss": 1.0608, "step": 12110 }, { "epoch": 0.28, "learning_rate": 8.438445582965064e-06, "loss": 0.8769, "step": 12111 }, { "epoch": 0.28, "learning_rate": 8.438172911833331e-06, "loss": 1.0731, "step": 12112 }, { "epoch": 0.28, "learning_rate": 8.437900221303659e-06, "loss": 1.1514, "step": 12113 }, { "epoch": 0.28, "learning_rate": 8.437627511377586e-06, "loss": 0.8774, "step": 12114 }, { "epoch": 0.28, "learning_rate": 8.437354782056654e-06, "loss": 1.3696, "step": 12115 }, { "epoch": 0.28, "learning_rate": 8.437082033342402e-06, "loss": 0.8816, "step": 12116 }, { "epoch": 0.28, "learning_rate": 8.436809265236363e-06, "loss": 0.6279, "step": 12117 }, { "epoch": 0.28, "learning_rate": 8.436536477740082e-06, "loss": 0.7116, "step": 12118 }, { "epoch": 0.28, "learning_rate": 8.436263670855096e-06, "loss": 0.983, "step": 12119 }, { "epoch": 0.28, "learning_rate": 8.435990844582945e-06, "loss": 0.7874, "step": 12120 }, { "epoch": 0.28, "learning_rate": 8.435717998925166e-06, "loss": 0.8872, "step": 12121 }, { "epoch": 0.28, "learning_rate": 8.435445133883299e-06, "loss": 1.0444, "step": 12122 }, { "epoch": 0.28, "learning_rate": 8.435172249458886e-06, "loss": 0.9241, "step": 12123 }, { "epoch": 0.28, "learning_rate": 8.434899345653463e-06, "loss": 0.9252, "step": 12124 }, { "epoch": 0.28, "learning_rate": 8.434626422468572e-06, "loss": 1.1054, "step": 12125 }, { "epoch": 0.28, "learning_rate": 8.434353479905754e-06, "loss": 0.9264, "step": 12126 }, { "epoch": 0.28, "learning_rate": 8.434080517966546e-06, "loss": 0.7807, "step": 12127 }, { "epoch": 0.28, "learning_rate": 8.433807536652489e-06, "loss": 1.0046, "step": 12128 }, { "epoch": 0.28, "learning_rate": 8.433534535965125e-06, "loss": 0.9553, "step": 12129 }, { "epoch": 0.28, "learning_rate": 8.43326151590599e-06, "loss": 0.8531, "step": 12130 }, { "epoch": 0.28, "learning_rate": 8.43298847647663e-06, "loss": 1.2116, "step": 12131 }, { "epoch": 0.28, "learning_rate": 8.432715417678581e-06, "loss": 0.7733, "step": 12132 }, { "epoch": 0.28, "learning_rate": 8.432442339513386e-06, "loss": 0.9216, "step": 12133 }, { "epoch": 0.28, "learning_rate": 8.432169241982584e-06, "loss": 0.8595, "step": 12134 }, { "epoch": 0.28, "learning_rate": 8.431896125087717e-06, "loss": 1.1049, "step": 12135 }, { "epoch": 0.28, "learning_rate": 8.431622988830326e-06, "loss": 0.7792, "step": 12136 }, { "epoch": 0.28, "learning_rate": 8.43134983321195e-06, "loss": 0.8577, "step": 12137 }, { "epoch": 0.28, "learning_rate": 8.431076658234132e-06, "loss": 1.0008, "step": 12138 }, { "epoch": 0.28, "learning_rate": 8.430803463898414e-06, "loss": 0.8596, "step": 12139 }, { "epoch": 0.28, "learning_rate": 8.430530250206335e-06, "loss": 0.9801, "step": 12140 }, { "epoch": 0.28, "learning_rate": 8.430257017159438e-06, "loss": 0.769, "step": 12141 }, { "epoch": 0.28, "learning_rate": 8.429983764759264e-06, "loss": 0.9682, "step": 12142 }, { "epoch": 0.28, "learning_rate": 8.429710493007355e-06, "loss": 0.7701, "step": 12143 }, { "epoch": 0.28, "learning_rate": 8.429437201905254e-06, "loss": 0.775, "step": 12144 }, { "epoch": 0.28, "learning_rate": 8.429163891454502e-06, "loss": 0.9593, "step": 12145 }, { "epoch": 0.28, "learning_rate": 8.428890561656637e-06, "loss": 1.1929, "step": 12146 }, { "epoch": 0.28, "learning_rate": 8.428617212513207e-06, "loss": 0.7817, "step": 12147 }, { "epoch": 0.28, "learning_rate": 8.428343844025753e-06, "loss": 0.8166, "step": 12148 }, { "epoch": 0.28, "learning_rate": 8.428070456195814e-06, "loss": 0.9103, "step": 12149 }, { "epoch": 0.28, "learning_rate": 8.427797049024936e-06, "loss": 0.7181, "step": 12150 }, { "epoch": 0.28, "learning_rate": 8.42752362251466e-06, "loss": 0.7392, "step": 12151 }, { "epoch": 0.28, "learning_rate": 8.427250176666529e-06, "loss": 1.1594, "step": 12152 }, { "epoch": 0.28, "learning_rate": 8.426976711482084e-06, "loss": 1.0252, "step": 12153 }, { "epoch": 0.28, "learning_rate": 8.426703226962871e-06, "loss": 1.0339, "step": 12154 }, { "epoch": 0.28, "learning_rate": 8.426429723110432e-06, "loss": 0.9085, "step": 12155 }, { "epoch": 0.28, "learning_rate": 8.426156199926308e-06, "loss": 1.3609, "step": 12156 }, { "epoch": 0.28, "learning_rate": 8.425882657412046e-06, "loss": 1.1234, "step": 12157 }, { "epoch": 0.28, "learning_rate": 8.425609095569185e-06, "loss": 1.2323, "step": 12158 }, { "epoch": 0.28, "learning_rate": 8.425335514399271e-06, "loss": 1.0094, "step": 12159 }, { "epoch": 0.28, "learning_rate": 8.425061913903847e-06, "loss": 1.0059, "step": 12160 }, { "epoch": 0.28, "learning_rate": 8.424788294084457e-06, "loss": 0.9245, "step": 12161 }, { "epoch": 0.28, "learning_rate": 8.424514654942645e-06, "loss": 0.9085, "step": 12162 }, { "epoch": 0.28, "learning_rate": 8.424240996479953e-06, "loss": 1.0267, "step": 12163 }, { "epoch": 0.28, "learning_rate": 8.423967318697928e-06, "loss": 1.0803, "step": 12164 }, { "epoch": 0.28, "learning_rate": 8.42369362159811e-06, "loss": 0.9091, "step": 12165 }, { "epoch": 0.28, "learning_rate": 8.423419905182047e-06, "loss": 0.9088, "step": 12166 }, { "epoch": 0.28, "learning_rate": 8.423146169451282e-06, "loss": 1.058, "step": 12167 }, { "epoch": 0.28, "learning_rate": 8.422872414407356e-06, "loss": 1.161, "step": 12168 }, { "epoch": 0.28, "learning_rate": 8.42259864005182e-06, "loss": 0.7841, "step": 12169 }, { "epoch": 0.28, "learning_rate": 8.422324846386215e-06, "loss": 0.8751, "step": 12170 }, { "epoch": 0.28, "learning_rate": 8.422051033412085e-06, "loss": 0.9624, "step": 12171 }, { "epoch": 0.28, "learning_rate": 8.421777201130977e-06, "loss": 0.9879, "step": 12172 }, { "epoch": 0.28, "learning_rate": 8.421503349544433e-06, "loss": 0.7682, "step": 12173 }, { "epoch": 0.28, "learning_rate": 8.421229478654001e-06, "loss": 0.6303, "step": 12174 }, { "epoch": 0.28, "learning_rate": 8.420955588461225e-06, "loss": 0.9302, "step": 12175 }, { "epoch": 0.28, "learning_rate": 8.42068167896765e-06, "loss": 0.676, "step": 12176 }, { "epoch": 0.28, "learning_rate": 8.420407750174822e-06, "loss": 1.1016, "step": 12177 }, { "epoch": 0.28, "learning_rate": 8.420133802084286e-06, "loss": 1.0607, "step": 12178 }, { "epoch": 0.28, "learning_rate": 8.419859834697588e-06, "loss": 1.0404, "step": 12179 }, { "epoch": 0.28, "learning_rate": 8.419585848016273e-06, "loss": 1.031, "step": 12180 }, { "epoch": 0.28, "learning_rate": 8.419311842041886e-06, "loss": 0.984, "step": 12181 }, { "epoch": 0.28, "learning_rate": 8.419037816775976e-06, "loss": 0.9444, "step": 12182 }, { "epoch": 0.28, "learning_rate": 8.418763772220087e-06, "loss": 1.2448, "step": 12183 }, { "epoch": 0.28, "learning_rate": 8.418489708375764e-06, "loss": 1.1957, "step": 12184 }, { "epoch": 0.28, "learning_rate": 8.418215625244557e-06, "loss": 0.927, "step": 12185 }, { "epoch": 0.28, "learning_rate": 8.417941522828009e-06, "loss": 1.1094, "step": 12186 }, { "epoch": 0.28, "learning_rate": 8.417667401127665e-06, "loss": 0.9622, "step": 12187 }, { "epoch": 0.28, "learning_rate": 8.417393260145076e-06, "loss": 1.0492, "step": 12188 }, { "epoch": 0.28, "learning_rate": 8.417119099881788e-06, "loss": 1.2515, "step": 12189 }, { "epoch": 0.28, "learning_rate": 8.416844920339345e-06, "loss": 1.0082, "step": 12190 }, { "epoch": 0.28, "learning_rate": 8.416570721519295e-06, "loss": 1.2882, "step": 12191 }, { "epoch": 0.28, "learning_rate": 8.416296503423185e-06, "loss": 0.8015, "step": 12192 }, { "epoch": 0.28, "learning_rate": 8.416022266052563e-06, "loss": 0.8914, "step": 12193 }, { "epoch": 0.28, "learning_rate": 8.415748009408977e-06, "loss": 0.7914, "step": 12194 }, { "epoch": 0.28, "learning_rate": 8.415473733493973e-06, "loss": 0.9037, "step": 12195 }, { "epoch": 0.28, "learning_rate": 8.415199438309097e-06, "loss": 0.9634, "step": 12196 }, { "epoch": 0.28, "learning_rate": 8.4149251238559e-06, "loss": 0.8803, "step": 12197 }, { "epoch": 0.28, "learning_rate": 8.414650790135926e-06, "loss": 1.0437, "step": 12198 }, { "epoch": 0.28, "learning_rate": 8.414376437150724e-06, "loss": 0.9486, "step": 12199 }, { "epoch": 0.28, "learning_rate": 8.414102064901843e-06, "loss": 0.858, "step": 12200 }, { "epoch": 0.28, "learning_rate": 8.41382767339083e-06, "loss": 0.9786, "step": 12201 }, { "epoch": 0.28, "learning_rate": 8.413553262619236e-06, "loss": 0.8186, "step": 12202 }, { "epoch": 0.28, "learning_rate": 8.413278832588606e-06, "loss": 0.8151, "step": 12203 }, { "epoch": 0.28, "learning_rate": 8.413004383300488e-06, "loss": 0.8559, "step": 12204 }, { "epoch": 0.28, "learning_rate": 8.41272991475643e-06, "loss": 0.9593, "step": 12205 }, { "epoch": 0.28, "learning_rate": 8.412455426957983e-06, "loss": 0.8517, "step": 12206 }, { "epoch": 0.28, "learning_rate": 8.412180919906696e-06, "loss": 1.1227, "step": 12207 }, { "epoch": 0.28, "learning_rate": 8.411906393604115e-06, "loss": 0.9215, "step": 12208 }, { "epoch": 0.28, "learning_rate": 8.41163184805179e-06, "loss": 0.8908, "step": 12209 }, { "epoch": 0.28, "learning_rate": 8.41135728325127e-06, "loss": 0.9214, "step": 12210 }, { "epoch": 0.28, "learning_rate": 8.411082699204104e-06, "loss": 0.8304, "step": 12211 }, { "epoch": 0.28, "learning_rate": 8.410808095911844e-06, "loss": 0.9265, "step": 12212 }, { "epoch": 0.28, "learning_rate": 8.410533473376035e-06, "loss": 0.7886, "step": 12213 }, { "epoch": 0.28, "learning_rate": 8.410258831598228e-06, "loss": 0.9059, "step": 12214 }, { "epoch": 0.28, "learning_rate": 8.409984170579973e-06, "loss": 1.0049, "step": 12215 }, { "epoch": 0.28, "learning_rate": 8.409709490322817e-06, "loss": 1.3726, "step": 12216 }, { "epoch": 0.28, "learning_rate": 8.409434790828314e-06, "loss": 0.9853, "step": 12217 }, { "epoch": 0.28, "learning_rate": 8.409160072098013e-06, "loss": 0.9191, "step": 12218 }, { "epoch": 0.28, "learning_rate": 8.408885334133462e-06, "loss": 0.9355, "step": 12219 }, { "epoch": 0.28, "learning_rate": 8.40861057693621e-06, "loss": 0.8003, "step": 12220 }, { "epoch": 0.28, "learning_rate": 8.408335800507812e-06, "loss": 0.8229, "step": 12221 }, { "epoch": 0.28, "learning_rate": 8.408061004849814e-06, "loss": 0.8937, "step": 12222 }, { "epoch": 0.28, "learning_rate": 8.407786189963767e-06, "loss": 1.059, "step": 12223 }, { "epoch": 0.28, "learning_rate": 8.407511355851222e-06, "loss": 1.0881, "step": 12224 }, { "epoch": 0.28, "learning_rate": 8.407236502513729e-06, "loss": 1.0047, "step": 12225 }, { "epoch": 0.28, "learning_rate": 8.40696162995284e-06, "loss": 0.788, "step": 12226 }, { "epoch": 0.28, "learning_rate": 8.406686738170107e-06, "loss": 0.6801, "step": 12227 }, { "epoch": 0.28, "learning_rate": 8.406411827167078e-06, "loss": 1.1094, "step": 12228 }, { "epoch": 0.28, "learning_rate": 8.406136896945305e-06, "loss": 0.8707, "step": 12229 }, { "epoch": 0.28, "learning_rate": 8.405861947506339e-06, "loss": 1.1903, "step": 12230 }, { "epoch": 0.28, "learning_rate": 8.405586978851733e-06, "loss": 0.9287, "step": 12231 }, { "epoch": 0.28, "learning_rate": 8.405311990983036e-06, "loss": 0.8529, "step": 12232 }, { "epoch": 0.28, "learning_rate": 8.4050369839018e-06, "loss": 1.151, "step": 12233 }, { "epoch": 0.28, "learning_rate": 8.404761957609578e-06, "loss": 1.0049, "step": 12234 }, { "epoch": 0.28, "learning_rate": 8.40448691210792e-06, "loss": 1.0194, "step": 12235 }, { "epoch": 0.28, "learning_rate": 8.404211847398378e-06, "loss": 0.9246, "step": 12236 }, { "epoch": 0.28, "learning_rate": 8.403936763482503e-06, "loss": 1.0943, "step": 12237 }, { "epoch": 0.28, "learning_rate": 8.40366166036185e-06, "loss": 0.995, "step": 12238 }, { "epoch": 0.28, "learning_rate": 8.403386538037969e-06, "loss": 1.1649, "step": 12239 }, { "epoch": 0.28, "learning_rate": 8.403111396512414e-06, "loss": 1.0257, "step": 12240 }, { "epoch": 0.28, "learning_rate": 8.402836235786736e-06, "loss": 0.9328, "step": 12241 }, { "epoch": 0.28, "learning_rate": 8.402561055862485e-06, "loss": 1.0218, "step": 12242 }, { "epoch": 0.28, "learning_rate": 8.402285856741217e-06, "loss": 1.3869, "step": 12243 }, { "epoch": 0.28, "learning_rate": 8.402010638424485e-06, "loss": 1.1674, "step": 12244 }, { "epoch": 0.28, "learning_rate": 8.401735400913837e-06, "loss": 1.218, "step": 12245 }, { "epoch": 0.28, "learning_rate": 8.401460144210833e-06, "loss": 0.986, "step": 12246 }, { "epoch": 0.28, "learning_rate": 8.40118486831702e-06, "loss": 1.0294, "step": 12247 }, { "epoch": 0.28, "learning_rate": 8.400909573233956e-06, "loss": 0.6514, "step": 12248 }, { "epoch": 0.28, "learning_rate": 8.400634258963188e-06, "loss": 0.9699, "step": 12249 }, { "epoch": 0.28, "learning_rate": 8.400358925506274e-06, "loss": 0.9063, "step": 12250 }, { "epoch": 0.28, "learning_rate": 8.400083572864769e-06, "loss": 0.9411, "step": 12251 }, { "epoch": 0.28, "learning_rate": 8.39980820104022e-06, "loss": 1.0346, "step": 12252 }, { "epoch": 0.28, "learning_rate": 8.399532810034186e-06, "loss": 1.0227, "step": 12253 }, { "epoch": 0.28, "learning_rate": 8.39925739984822e-06, "loss": 1.1358, "step": 12254 }, { "epoch": 0.28, "learning_rate": 8.398981970483873e-06, "loss": 1.0072, "step": 12255 }, { "epoch": 0.28, "learning_rate": 8.398706521942701e-06, "loss": 0.8489, "step": 12256 }, { "epoch": 0.28, "learning_rate": 8.398431054226259e-06, "loss": 0.8395, "step": 12257 }, { "epoch": 0.28, "learning_rate": 8.3981555673361e-06, "loss": 0.9782, "step": 12258 }, { "epoch": 0.28, "learning_rate": 8.397880061273779e-06, "loss": 1.0362, "step": 12259 }, { "epoch": 0.28, "learning_rate": 8.397604536040848e-06, "loss": 0.9939, "step": 12260 }, { "epoch": 0.28, "learning_rate": 8.397328991638866e-06, "loss": 0.9029, "step": 12261 }, { "epoch": 0.28, "learning_rate": 8.397053428069384e-06, "loss": 0.8794, "step": 12262 }, { "epoch": 0.28, "learning_rate": 8.396777845333956e-06, "loss": 0.9495, "step": 12263 }, { "epoch": 0.28, "learning_rate": 8.396502243434139e-06, "loss": 0.9751, "step": 12264 }, { "epoch": 0.28, "learning_rate": 8.396226622371489e-06, "loss": 0.78, "step": 12265 }, { "epoch": 0.28, "learning_rate": 8.395950982147557e-06, "loss": 0.9718, "step": 12266 }, { "epoch": 0.28, "learning_rate": 8.395675322763903e-06, "loss": 1.1068, "step": 12267 }, { "epoch": 0.28, "learning_rate": 8.395399644222079e-06, "loss": 1.0426, "step": 12268 }, { "epoch": 0.28, "learning_rate": 8.39512394652364e-06, "loss": 1.0403, "step": 12269 }, { "epoch": 0.28, "learning_rate": 8.394848229670144e-06, "loss": 0.9311, "step": 12270 }, { "epoch": 0.28, "learning_rate": 8.394572493663144e-06, "loss": 0.7318, "step": 12271 }, { "epoch": 0.28, "learning_rate": 8.394296738504197e-06, "loss": 1.0394, "step": 12272 }, { "epoch": 0.28, "learning_rate": 8.39402096419486e-06, "loss": 1.2382, "step": 12273 }, { "epoch": 0.28, "learning_rate": 8.393745170736687e-06, "loss": 0.9178, "step": 12274 }, { "epoch": 0.28, "learning_rate": 8.393469358131234e-06, "loss": 1.0476, "step": 12275 }, { "epoch": 0.28, "learning_rate": 8.393193526380059e-06, "loss": 0.953, "step": 12276 }, { "epoch": 0.28, "learning_rate": 8.392917675484715e-06, "loss": 1.0973, "step": 12277 }, { "epoch": 0.28, "learning_rate": 8.392641805446762e-06, "loss": 0.9345, "step": 12278 }, { "epoch": 0.28, "learning_rate": 8.392365916267754e-06, "loss": 1.06, "step": 12279 }, { "epoch": 0.28, "learning_rate": 8.39209000794925e-06, "loss": 0.8234, "step": 12280 }, { "epoch": 0.28, "learning_rate": 8.391814080492802e-06, "loss": 0.8768, "step": 12281 }, { "epoch": 0.28, "learning_rate": 8.391538133899971e-06, "loss": 0.9779, "step": 12282 }, { "epoch": 0.28, "learning_rate": 8.391262168172311e-06, "loss": 0.8021, "step": 12283 }, { "epoch": 0.28, "learning_rate": 8.390986183311382e-06, "loss": 1.2984, "step": 12284 }, { "epoch": 0.28, "learning_rate": 8.39071017931874e-06, "loss": 0.8391, "step": 12285 }, { "epoch": 0.28, "learning_rate": 8.390434156195942e-06, "loss": 1.116, "step": 12286 }, { "epoch": 0.28, "learning_rate": 8.390158113944544e-06, "loss": 0.8793, "step": 12287 }, { "epoch": 0.28, "learning_rate": 8.389882052566106e-06, "loss": 0.9154, "step": 12288 }, { "epoch": 0.29, "learning_rate": 8.389605972062182e-06, "loss": 1.2971, "step": 12289 }, { "epoch": 0.29, "learning_rate": 8.389329872434332e-06, "loss": 0.9954, "step": 12290 }, { "epoch": 0.29, "learning_rate": 8.389053753684115e-06, "loss": 0.9044, "step": 12291 }, { "epoch": 0.29, "learning_rate": 8.388777615813085e-06, "loss": 1.0021, "step": 12292 }, { "epoch": 0.29, "learning_rate": 8.388501458822805e-06, "loss": 0.7274, "step": 12293 }, { "epoch": 0.29, "learning_rate": 8.388225282714828e-06, "loss": 1.0143, "step": 12294 }, { "epoch": 0.29, "learning_rate": 8.387949087490715e-06, "loss": 1.1119, "step": 12295 }, { "epoch": 0.29, "learning_rate": 8.387672873152024e-06, "loss": 0.7295, "step": 12296 }, { "epoch": 0.29, "learning_rate": 8.387396639700313e-06, "loss": 0.9799, "step": 12297 }, { "epoch": 0.29, "learning_rate": 8.387120387137141e-06, "loss": 1.225, "step": 12298 }, { "epoch": 0.29, "learning_rate": 8.386844115464066e-06, "loss": 0.893, "step": 12299 }, { "epoch": 0.29, "learning_rate": 8.386567824682645e-06, "loss": 1.009, "step": 12300 }, { "epoch": 0.29, "learning_rate": 8.386291514794442e-06, "loss": 0.7587, "step": 12301 }, { "epoch": 0.29, "learning_rate": 8.38601518580101e-06, "loss": 0.8272, "step": 12302 }, { "epoch": 0.29, "learning_rate": 8.385738837703912e-06, "loss": 0.7476, "step": 12303 }, { "epoch": 0.29, "learning_rate": 8.385462470504705e-06, "loss": 1.0585, "step": 12304 }, { "epoch": 0.29, "learning_rate": 8.38518608420495e-06, "loss": 0.945, "step": 12305 }, { "epoch": 0.29, "learning_rate": 8.384909678806203e-06, "loss": 0.9668, "step": 12306 }, { "epoch": 0.29, "learning_rate": 8.38463325431003e-06, "loss": 1.0765, "step": 12307 }, { "epoch": 0.29, "learning_rate": 8.384356810717984e-06, "loss": 1.1374, "step": 12308 }, { "epoch": 0.29, "learning_rate": 8.384080348031625e-06, "loss": 1.0499, "step": 12309 }, { "epoch": 0.29, "learning_rate": 8.383803866252519e-06, "loss": 0.7925, "step": 12310 }, { "epoch": 0.29, "learning_rate": 8.383527365382218e-06, "loss": 0.916, "step": 12311 }, { "epoch": 0.29, "learning_rate": 8.383250845422288e-06, "loss": 0.9823, "step": 12312 }, { "epoch": 0.29, "learning_rate": 8.382974306374285e-06, "loss": 1.0421, "step": 12313 }, { "epoch": 0.29, "learning_rate": 8.382697748239771e-06, "loss": 1.0185, "step": 12314 }, { "epoch": 0.29, "learning_rate": 8.38242117102031e-06, "loss": 0.8283, "step": 12315 }, { "epoch": 0.29, "learning_rate": 8.382144574717456e-06, "loss": 0.9423, "step": 12316 }, { "epoch": 0.29, "learning_rate": 8.381867959332773e-06, "loss": 1.1035, "step": 12317 }, { "epoch": 0.29, "learning_rate": 8.381591324867821e-06, "loss": 0.9664, "step": 12318 }, { "epoch": 0.29, "learning_rate": 8.38131467132416e-06, "loss": 1.1012, "step": 12319 }, { "epoch": 0.29, "learning_rate": 8.381037998703352e-06, "loss": 0.976, "step": 12320 }, { "epoch": 0.29, "learning_rate": 8.380761307006959e-06, "loss": 1.0312, "step": 12321 }, { "epoch": 0.29, "learning_rate": 8.38048459623654e-06, "loss": 1.1079, "step": 12322 }, { "epoch": 0.29, "learning_rate": 8.380207866393655e-06, "loss": 0.7972, "step": 12323 }, { "epoch": 0.29, "learning_rate": 8.379931117479869e-06, "loss": 1.2228, "step": 12324 }, { "epoch": 0.29, "learning_rate": 8.379654349496742e-06, "loss": 0.9997, "step": 12325 }, { "epoch": 0.29, "learning_rate": 8.379377562445834e-06, "loss": 1.2135, "step": 12326 }, { "epoch": 0.29, "learning_rate": 8.379100756328708e-06, "loss": 0.9122, "step": 12327 }, { "epoch": 0.29, "learning_rate": 8.378823931146924e-06, "loss": 1.0292, "step": 12328 }, { "epoch": 0.29, "learning_rate": 8.378547086902046e-06, "loss": 0.8026, "step": 12329 }, { "epoch": 0.29, "learning_rate": 8.378270223595636e-06, "loss": 1.1267, "step": 12330 }, { "epoch": 0.29, "learning_rate": 8.377993341229255e-06, "loss": 1.123, "step": 12331 }, { "epoch": 0.29, "learning_rate": 8.377716439804465e-06, "loss": 0.9784, "step": 12332 }, { "epoch": 0.29, "learning_rate": 8.37743951932283e-06, "loss": 0.8192, "step": 12333 }, { "epoch": 0.29, "learning_rate": 8.377162579785908e-06, "loss": 1.0639, "step": 12334 }, { "epoch": 0.29, "learning_rate": 8.376885621195266e-06, "loss": 1.2043, "step": 12335 }, { "epoch": 0.29, "learning_rate": 8.376608643552466e-06, "loss": 1.1928, "step": 12336 }, { "epoch": 0.29, "learning_rate": 8.376331646859068e-06, "loss": 0.9606, "step": 12337 }, { "epoch": 0.29, "learning_rate": 8.376054631116636e-06, "loss": 1.301, "step": 12338 }, { "epoch": 0.29, "learning_rate": 8.375777596326737e-06, "loss": 0.853, "step": 12339 }, { "epoch": 0.29, "learning_rate": 8.375500542490926e-06, "loss": 0.8155, "step": 12340 }, { "epoch": 0.29, "learning_rate": 8.375223469610774e-06, "loss": 0.8267, "step": 12341 }, { "epoch": 0.29, "learning_rate": 8.37494637768784e-06, "loss": 0.8856, "step": 12342 }, { "epoch": 0.29, "learning_rate": 8.374669266723687e-06, "loss": 1.2311, "step": 12343 }, { "epoch": 0.29, "learning_rate": 8.37439213671988e-06, "loss": 0.9185, "step": 12344 }, { "epoch": 0.29, "learning_rate": 8.37411498767798e-06, "loss": 1.1661, "step": 12345 }, { "epoch": 0.29, "learning_rate": 8.373837819599556e-06, "loss": 0.897, "step": 12346 }, { "epoch": 0.29, "learning_rate": 8.373560632486169e-06, "loss": 0.8828, "step": 12347 }, { "epoch": 0.29, "learning_rate": 8.37328342633938e-06, "loss": 0.7996, "step": 12348 }, { "epoch": 0.29, "learning_rate": 8.373006201160756e-06, "loss": 0.9519, "step": 12349 }, { "epoch": 0.29, "learning_rate": 8.37272895695186e-06, "loss": 0.993, "step": 12350 }, { "epoch": 0.29, "learning_rate": 8.372451693714257e-06, "loss": 1.0086, "step": 12351 }, { "epoch": 0.29, "learning_rate": 8.372174411449512e-06, "loss": 1.0287, "step": 12352 }, { "epoch": 0.29, "learning_rate": 8.371897110159186e-06, "loss": 1.1169, "step": 12353 }, { "epoch": 0.29, "learning_rate": 8.371619789844849e-06, "loss": 0.7213, "step": 12354 }, { "epoch": 0.29, "learning_rate": 8.37134245050806e-06, "loss": 0.8331, "step": 12355 }, { "epoch": 0.29, "learning_rate": 8.371065092150388e-06, "loss": 0.9328, "step": 12356 }, { "epoch": 0.29, "learning_rate": 8.370787714773395e-06, "loss": 1.0155, "step": 12357 }, { "epoch": 0.29, "learning_rate": 8.370510318378648e-06, "loss": 1.057, "step": 12358 }, { "epoch": 0.29, "learning_rate": 8.37023290296771e-06, "loss": 1.0032, "step": 12359 }, { "epoch": 0.29, "learning_rate": 8.369955468542146e-06, "loss": 0.9315, "step": 12360 }, { "epoch": 0.29, "learning_rate": 8.369678015103524e-06, "loss": 0.8759, "step": 12361 }, { "epoch": 0.29, "learning_rate": 8.369400542653407e-06, "loss": 0.7404, "step": 12362 }, { "epoch": 0.29, "learning_rate": 8.369123051193362e-06, "loss": 0.9243, "step": 12363 }, { "epoch": 0.29, "learning_rate": 8.368845540724954e-06, "loss": 1.1044, "step": 12364 }, { "epoch": 0.29, "learning_rate": 8.368568011249748e-06, "loss": 0.9036, "step": 12365 }, { "epoch": 0.29, "learning_rate": 8.368290462769312e-06, "loss": 0.8972, "step": 12366 }, { "epoch": 0.29, "learning_rate": 8.36801289528521e-06, "loss": 0.8186, "step": 12367 }, { "epoch": 0.29, "learning_rate": 8.367735308799007e-06, "loss": 0.8571, "step": 12368 }, { "epoch": 0.29, "learning_rate": 8.367457703312271e-06, "loss": 1.0227, "step": 12369 }, { "epoch": 0.29, "learning_rate": 8.367180078826569e-06, "loss": 1.0377, "step": 12370 }, { "epoch": 0.29, "learning_rate": 8.366902435343464e-06, "loss": 0.9241, "step": 12371 }, { "epoch": 0.29, "learning_rate": 8.366624772864526e-06, "loss": 0.9322, "step": 12372 }, { "epoch": 0.29, "learning_rate": 8.366347091391318e-06, "loss": 1.0348, "step": 12373 }, { "epoch": 0.29, "learning_rate": 8.36606939092541e-06, "loss": 0.7278, "step": 12374 }, { "epoch": 0.29, "learning_rate": 8.365791671468368e-06, "loss": 1.1431, "step": 12375 }, { "epoch": 0.29, "learning_rate": 8.365513933021759e-06, "loss": 1.2327, "step": 12376 }, { "epoch": 0.29, "learning_rate": 8.365236175587148e-06, "loss": 0.8773, "step": 12377 }, { "epoch": 0.29, "learning_rate": 8.364958399166101e-06, "loss": 1.0217, "step": 12378 }, { "epoch": 0.29, "learning_rate": 8.36468060376019e-06, "loss": 1.0093, "step": 12379 }, { "epoch": 0.29, "learning_rate": 8.364402789370982e-06, "loss": 0.8865, "step": 12380 }, { "epoch": 0.29, "learning_rate": 8.36412495600004e-06, "loss": 1.1611, "step": 12381 }, { "epoch": 0.29, "learning_rate": 8.363847103648935e-06, "loss": 0.7612, "step": 12382 }, { "epoch": 0.29, "learning_rate": 8.36356923231923e-06, "loss": 0.9645, "step": 12383 }, { "epoch": 0.29, "learning_rate": 8.3632913420125e-06, "loss": 0.9747, "step": 12384 }, { "epoch": 0.29, "learning_rate": 8.363013432730308e-06, "loss": 1.1486, "step": 12385 }, { "epoch": 0.29, "learning_rate": 8.362735504474224e-06, "loss": 0.896, "step": 12386 }, { "epoch": 0.29, "learning_rate": 8.362457557245814e-06, "loss": 0.7542, "step": 12387 }, { "epoch": 0.29, "learning_rate": 8.362179591046646e-06, "loss": 0.8108, "step": 12388 }, { "epoch": 0.29, "learning_rate": 8.36190160587829e-06, "loss": 0.8309, "step": 12389 }, { "epoch": 0.29, "learning_rate": 8.361623601742315e-06, "loss": 0.7592, "step": 12390 }, { "epoch": 0.29, "learning_rate": 8.361345578640287e-06, "loss": 0.7792, "step": 12391 }, { "epoch": 0.29, "learning_rate": 8.361067536573776e-06, "loss": 1.1355, "step": 12392 }, { "epoch": 0.29, "learning_rate": 8.36078947554435e-06, "loss": 0.8705, "step": 12393 }, { "epoch": 0.29, "learning_rate": 8.36051139555358e-06, "loss": 1.0198, "step": 12394 }, { "epoch": 0.29, "learning_rate": 8.360233296603034e-06, "loss": 1.0299, "step": 12395 }, { "epoch": 0.29, "learning_rate": 8.359955178694278e-06, "loss": 0.7993, "step": 12396 }, { "epoch": 0.29, "learning_rate": 8.359677041828883e-06, "loss": 0.987, "step": 12397 }, { "epoch": 0.29, "learning_rate": 8.359398886008422e-06, "loss": 1.1154, "step": 12398 }, { "epoch": 0.29, "learning_rate": 8.359120711234459e-06, "loss": 1.0843, "step": 12399 }, { "epoch": 0.29, "learning_rate": 8.358842517508566e-06, "loss": 0.8615, "step": 12400 }, { "epoch": 0.29, "learning_rate": 8.35856430483231e-06, "loss": 0.8859, "step": 12401 }, { "epoch": 0.29, "learning_rate": 8.358286073207265e-06, "loss": 1.0105, "step": 12402 }, { "epoch": 0.29, "learning_rate": 8.358007822634998e-06, "loss": 1.1678, "step": 12403 }, { "epoch": 0.29, "learning_rate": 8.357729553117077e-06, "loss": 1.1159, "step": 12404 }, { "epoch": 0.29, "learning_rate": 8.357451264655077e-06, "loss": 1.0803, "step": 12405 }, { "epoch": 0.29, "learning_rate": 8.357172957250564e-06, "loss": 1.0958, "step": 12406 }, { "epoch": 0.29, "learning_rate": 8.35689463090511e-06, "loss": 0.9249, "step": 12407 }, { "epoch": 0.29, "learning_rate": 8.356616285620285e-06, "loss": 1.1077, "step": 12408 }, { "epoch": 0.29, "learning_rate": 8.356337921397659e-06, "loss": 0.9005, "step": 12409 }, { "epoch": 0.29, "learning_rate": 8.356059538238801e-06, "loss": 0.8492, "step": 12410 }, { "epoch": 0.29, "learning_rate": 8.355781136145286e-06, "loss": 1.0208, "step": 12411 }, { "epoch": 0.29, "learning_rate": 8.355502715118683e-06, "loss": 0.6765, "step": 12412 }, { "epoch": 0.29, "learning_rate": 8.355224275160559e-06, "loss": 0.8406, "step": 12413 }, { "epoch": 0.29, "learning_rate": 8.354945816272488e-06, "loss": 1.2886, "step": 12414 }, { "epoch": 0.29, "learning_rate": 8.354667338456042e-06, "loss": 0.7766, "step": 12415 }, { "epoch": 0.29, "learning_rate": 8.35438884171279e-06, "loss": 0.877, "step": 12416 }, { "epoch": 0.29, "learning_rate": 8.354110326044307e-06, "loss": 0.8281, "step": 12417 }, { "epoch": 0.29, "learning_rate": 8.353831791452159e-06, "loss": 0.9723, "step": 12418 }, { "epoch": 0.29, "learning_rate": 8.353553237937922e-06, "loss": 0.9577, "step": 12419 }, { "epoch": 0.29, "learning_rate": 8.353274665503164e-06, "loss": 0.8612, "step": 12420 }, { "epoch": 0.29, "learning_rate": 8.35299607414946e-06, "loss": 0.974, "step": 12421 }, { "epoch": 0.29, "learning_rate": 8.35271746387838e-06, "loss": 1.187, "step": 12422 }, { "epoch": 0.29, "learning_rate": 8.352438834691495e-06, "loss": 1.0947, "step": 12423 }, { "epoch": 0.29, "learning_rate": 8.352160186590377e-06, "loss": 0.8609, "step": 12424 }, { "epoch": 0.29, "learning_rate": 8.351881519576602e-06, "loss": 0.9603, "step": 12425 }, { "epoch": 0.29, "learning_rate": 8.351602833651738e-06, "loss": 0.8414, "step": 12426 }, { "epoch": 0.29, "learning_rate": 8.35132412881736e-06, "loss": 0.8088, "step": 12427 }, { "epoch": 0.29, "learning_rate": 8.351045405075038e-06, "loss": 0.8282, "step": 12428 }, { "epoch": 0.29, "learning_rate": 8.350766662426347e-06, "loss": 0.9593, "step": 12429 }, { "epoch": 0.29, "learning_rate": 8.350487900872857e-06, "loss": 1.1633, "step": 12430 }, { "epoch": 0.29, "learning_rate": 8.350209120416143e-06, "loss": 0.9637, "step": 12431 }, { "epoch": 0.29, "learning_rate": 8.349930321057776e-06, "loss": 1.1481, "step": 12432 }, { "epoch": 0.29, "learning_rate": 8.349651502799332e-06, "loss": 0.9995, "step": 12433 }, { "epoch": 0.29, "learning_rate": 8.34937266564238e-06, "loss": 1.1919, "step": 12434 }, { "epoch": 0.29, "learning_rate": 8.349093809588497e-06, "loss": 1.1391, "step": 12435 }, { "epoch": 0.29, "learning_rate": 8.348814934639253e-06, "loss": 0.9824, "step": 12436 }, { "epoch": 0.29, "learning_rate": 8.348536040796224e-06, "loss": 0.7388, "step": 12437 }, { "epoch": 0.29, "learning_rate": 8.348257128060982e-06, "loss": 0.9953, "step": 12438 }, { "epoch": 0.29, "learning_rate": 8.347978196435101e-06, "loss": 0.9938, "step": 12439 }, { "epoch": 0.29, "learning_rate": 8.347699245920155e-06, "loss": 1.0452, "step": 12440 }, { "epoch": 0.29, "learning_rate": 8.347420276517718e-06, "loss": 1.1459, "step": 12441 }, { "epoch": 0.29, "learning_rate": 8.347141288229361e-06, "loss": 1.16, "step": 12442 }, { "epoch": 0.29, "learning_rate": 8.346862281056663e-06, "loss": 1.1156, "step": 12443 }, { "epoch": 0.29, "learning_rate": 8.346583255001194e-06, "loss": 0.7088, "step": 12444 }, { "epoch": 0.29, "learning_rate": 8.346304210064533e-06, "loss": 0.9704, "step": 12445 }, { "epoch": 0.29, "learning_rate": 8.346025146248247e-06, "loss": 1.1665, "step": 12446 }, { "epoch": 0.29, "learning_rate": 8.345746063553917e-06, "loss": 1.09, "step": 12447 }, { "epoch": 0.29, "learning_rate": 8.345466961983115e-06, "loss": 0.8243, "step": 12448 }, { "epoch": 0.29, "learning_rate": 8.345187841537417e-06, "loss": 0.9754, "step": 12449 }, { "epoch": 0.29, "learning_rate": 8.344908702218396e-06, "loss": 0.9868, "step": 12450 }, { "epoch": 0.29, "learning_rate": 8.344629544027628e-06, "loss": 1.1904, "step": 12451 }, { "epoch": 0.29, "learning_rate": 8.344350366966686e-06, "loss": 1.0301, "step": 12452 }, { "epoch": 0.29, "learning_rate": 8.34407117103715e-06, "loss": 0.7925, "step": 12453 }, { "epoch": 0.29, "learning_rate": 8.343791956240588e-06, "loss": 1.0899, "step": 12454 }, { "epoch": 0.29, "learning_rate": 8.343512722578581e-06, "loss": 0.744, "step": 12455 }, { "epoch": 0.29, "learning_rate": 8.343233470052703e-06, "loss": 1.1659, "step": 12456 }, { "epoch": 0.29, "learning_rate": 8.34295419866453e-06, "loss": 0.9792, "step": 12457 }, { "epoch": 0.29, "learning_rate": 8.342674908415634e-06, "loss": 1.1639, "step": 12458 }, { "epoch": 0.29, "learning_rate": 8.342395599307596e-06, "loss": 0.9507, "step": 12459 }, { "epoch": 0.29, "learning_rate": 8.342116271341988e-06, "loss": 0.8445, "step": 12460 }, { "epoch": 0.29, "learning_rate": 8.341836924520387e-06, "loss": 1.1521, "step": 12461 }, { "epoch": 0.29, "learning_rate": 8.34155755884437e-06, "loss": 0.9075, "step": 12462 }, { "epoch": 0.29, "learning_rate": 8.341278174315515e-06, "loss": 0.9394, "step": 12463 }, { "epoch": 0.29, "learning_rate": 8.340998770935392e-06, "loss": 1.0067, "step": 12464 }, { "epoch": 0.29, "learning_rate": 8.340719348705583e-06, "loss": 0.9348, "step": 12465 }, { "epoch": 0.29, "learning_rate": 8.340439907627662e-06, "loss": 1.0744, "step": 12466 }, { "epoch": 0.29, "learning_rate": 8.340160447703207e-06, "loss": 1.0066, "step": 12467 }, { "epoch": 0.29, "learning_rate": 8.339880968933794e-06, "loss": 0.9268, "step": 12468 }, { "epoch": 0.29, "learning_rate": 8.339601471320999e-06, "loss": 1.0713, "step": 12469 }, { "epoch": 0.29, "learning_rate": 8.3393219548664e-06, "loss": 1.0441, "step": 12470 }, { "epoch": 0.29, "learning_rate": 8.339042419571574e-06, "loss": 1.0976, "step": 12471 }, { "epoch": 0.29, "learning_rate": 8.338762865438097e-06, "loss": 1.214, "step": 12472 }, { "epoch": 0.29, "learning_rate": 8.33848329246755e-06, "loss": 0.8348, "step": 12473 }, { "epoch": 0.29, "learning_rate": 8.338203700661503e-06, "loss": 1.0245, "step": 12474 }, { "epoch": 0.29, "learning_rate": 8.33792409002154e-06, "loss": 0.6749, "step": 12475 }, { "epoch": 0.29, "learning_rate": 8.337644460549235e-06, "loss": 1.1055, "step": 12476 }, { "epoch": 0.29, "learning_rate": 8.337364812246169e-06, "loss": 0.954, "step": 12477 }, { "epoch": 0.29, "learning_rate": 8.337085145113917e-06, "loss": 0.938, "step": 12478 }, { "epoch": 0.29, "learning_rate": 8.336805459154057e-06, "loss": 1.0313, "step": 12479 }, { "epoch": 0.29, "learning_rate": 8.336525754368167e-06, "loss": 0.8914, "step": 12480 }, { "epoch": 0.29, "learning_rate": 8.336246030757827e-06, "loss": 0.8828, "step": 12481 }, { "epoch": 0.29, "learning_rate": 8.335966288324614e-06, "loss": 1.0262, "step": 12482 }, { "epoch": 0.29, "learning_rate": 8.335686527070104e-06, "loss": 1.1532, "step": 12483 }, { "epoch": 0.29, "learning_rate": 8.33540674699588e-06, "loss": 1.3713, "step": 12484 }, { "epoch": 0.29, "learning_rate": 8.335126948103518e-06, "loss": 1.2325, "step": 12485 }, { "epoch": 0.29, "learning_rate": 8.334847130394594e-06, "loss": 0.7422, "step": 12486 }, { "epoch": 0.29, "learning_rate": 8.334567293870693e-06, "loss": 1.007, "step": 12487 }, { "epoch": 0.29, "learning_rate": 8.334287438533385e-06, "loss": 0.7571, "step": 12488 }, { "epoch": 0.29, "learning_rate": 8.334007564384259e-06, "loss": 0.8425, "step": 12489 }, { "epoch": 0.29, "learning_rate": 8.333727671424887e-06, "loss": 0.996, "step": 12490 }, { "epoch": 0.29, "learning_rate": 8.333447759656851e-06, "loss": 0.8979, "step": 12491 }, { "epoch": 0.29, "learning_rate": 8.333167829081729e-06, "loss": 0.9701, "step": 12492 }, { "epoch": 0.29, "learning_rate": 8.332887879701101e-06, "loss": 1.1844, "step": 12493 }, { "epoch": 0.29, "learning_rate": 8.332607911516545e-06, "loss": 0.9733, "step": 12494 }, { "epoch": 0.29, "learning_rate": 8.332327924529644e-06, "loss": 0.9214, "step": 12495 }, { "epoch": 0.29, "learning_rate": 8.332047918741975e-06, "loss": 0.9824, "step": 12496 }, { "epoch": 0.29, "learning_rate": 8.331767894155117e-06, "loss": 0.8848, "step": 12497 }, { "epoch": 0.29, "learning_rate": 8.331487850770652e-06, "loss": 0.9776, "step": 12498 }, { "epoch": 0.29, "learning_rate": 8.331207788590159e-06, "loss": 1.0921, "step": 12499 }, { "epoch": 0.29, "learning_rate": 8.330927707615218e-06, "loss": 0.9505, "step": 12500 }, { "epoch": 0.29, "learning_rate": 8.330647607847409e-06, "loss": 0.7948, "step": 12501 }, { "epoch": 0.29, "learning_rate": 8.330367489288315e-06, "loss": 1.0268, "step": 12502 }, { "epoch": 0.29, "learning_rate": 8.330087351939512e-06, "loss": 1.1741, "step": 12503 }, { "epoch": 0.29, "learning_rate": 8.329807195802584e-06, "loss": 0.9333, "step": 12504 }, { "epoch": 0.29, "learning_rate": 8.329527020879109e-06, "loss": 1.2459, "step": 12505 }, { "epoch": 0.29, "learning_rate": 8.329246827170669e-06, "loss": 1.1295, "step": 12506 }, { "epoch": 0.29, "learning_rate": 8.328966614678847e-06, "loss": 0.7652, "step": 12507 }, { "epoch": 0.29, "learning_rate": 8.32868638340522e-06, "loss": 1.016, "step": 12508 }, { "epoch": 0.29, "learning_rate": 8.328406133351371e-06, "loss": 1.0314, "step": 12509 }, { "epoch": 0.29, "learning_rate": 8.328125864518881e-06, "loss": 0.9294, "step": 12510 }, { "epoch": 0.29, "learning_rate": 8.327845576909333e-06, "loss": 1.1375, "step": 12511 }, { "epoch": 0.29, "learning_rate": 8.327565270524303e-06, "loss": 0.8226, "step": 12512 }, { "epoch": 0.29, "learning_rate": 8.327284945365378e-06, "loss": 1.0819, "step": 12513 }, { "epoch": 0.29, "learning_rate": 8.32700460143414e-06, "loss": 0.8762, "step": 12514 }, { "epoch": 0.29, "learning_rate": 8.326724238732164e-06, "loss": 0.9287, "step": 12515 }, { "epoch": 0.29, "learning_rate": 8.32644385726104e-06, "loss": 1.1108, "step": 12516 }, { "epoch": 0.29, "learning_rate": 8.326163457022343e-06, "loss": 0.7924, "step": 12517 }, { "epoch": 0.29, "learning_rate": 8.325883038017659e-06, "loss": 0.9199, "step": 12518 }, { "epoch": 0.29, "learning_rate": 8.32560260024857e-06, "loss": 0.8961, "step": 12519 }, { "epoch": 0.29, "learning_rate": 8.325322143716656e-06, "loss": 0.799, "step": 12520 }, { "epoch": 0.29, "learning_rate": 8.325041668423502e-06, "loss": 0.9509, "step": 12521 }, { "epoch": 0.29, "learning_rate": 8.324761174370687e-06, "loss": 0.8074, "step": 12522 }, { "epoch": 0.29, "learning_rate": 8.324480661559798e-06, "loss": 0.8654, "step": 12523 }, { "epoch": 0.29, "learning_rate": 8.324200129992414e-06, "loss": 0.9847, "step": 12524 }, { "epoch": 0.29, "learning_rate": 8.32391957967012e-06, "loss": 1.0831, "step": 12525 }, { "epoch": 0.29, "learning_rate": 8.323639010594498e-06, "loss": 0.9038, "step": 12526 }, { "epoch": 0.29, "learning_rate": 8.32335842276713e-06, "loss": 0.907, "step": 12527 }, { "epoch": 0.29, "learning_rate": 8.323077816189598e-06, "loss": 1.0125, "step": 12528 }, { "epoch": 0.29, "learning_rate": 8.32279719086349e-06, "loss": 0.9932, "step": 12529 }, { "epoch": 0.29, "learning_rate": 8.322516546790385e-06, "loss": 0.895, "step": 12530 }, { "epoch": 0.29, "learning_rate": 8.322235883971868e-06, "loss": 0.9568, "step": 12531 }, { "epoch": 0.29, "learning_rate": 8.321955202409522e-06, "loss": 0.8694, "step": 12532 }, { "epoch": 0.29, "learning_rate": 8.321674502104928e-06, "loss": 1.1636, "step": 12533 }, { "epoch": 0.29, "learning_rate": 8.321393783059677e-06, "loss": 0.9108, "step": 12534 }, { "epoch": 0.29, "learning_rate": 8.321113045275345e-06, "loss": 1.0165, "step": 12535 }, { "epoch": 0.29, "learning_rate": 8.32083228875352e-06, "loss": 0.9243, "step": 12536 }, { "epoch": 0.29, "learning_rate": 8.320551513495786e-06, "loss": 1.2241, "step": 12537 }, { "epoch": 0.29, "learning_rate": 8.320270719503725e-06, "loss": 0.962, "step": 12538 }, { "epoch": 0.29, "learning_rate": 8.319989906778924e-06, "loss": 0.8435, "step": 12539 }, { "epoch": 0.29, "learning_rate": 8.319709075322964e-06, "loss": 0.7674, "step": 12540 }, { "epoch": 0.29, "learning_rate": 8.31942822513743e-06, "loss": 0.815, "step": 12541 }, { "epoch": 0.29, "learning_rate": 8.31914735622391e-06, "loss": 1.1545, "step": 12542 }, { "epoch": 0.29, "learning_rate": 8.318866468583988e-06, "loss": 0.6242, "step": 12543 }, { "epoch": 0.29, "learning_rate": 8.318585562219246e-06, "loss": 1.0915, "step": 12544 }, { "epoch": 0.29, "learning_rate": 8.318304637131267e-06, "loss": 1.0004, "step": 12545 }, { "epoch": 0.29, "learning_rate": 8.318023693321641e-06, "loss": 1.0738, "step": 12546 }, { "epoch": 0.29, "learning_rate": 8.317742730791953e-06, "loss": 1.1523, "step": 12547 }, { "epoch": 0.29, "learning_rate": 8.317461749543783e-06, "loss": 1.1638, "step": 12548 }, { "epoch": 0.29, "learning_rate": 8.317180749578721e-06, "loss": 1.0392, "step": 12549 }, { "epoch": 0.29, "learning_rate": 8.316899730898351e-06, "loss": 1.1049, "step": 12550 }, { "epoch": 0.29, "learning_rate": 8.316618693504258e-06, "loss": 1.0729, "step": 12551 }, { "epoch": 0.29, "learning_rate": 8.316337637398027e-06, "loss": 0.9739, "step": 12552 }, { "epoch": 0.29, "learning_rate": 8.316056562581248e-06, "loss": 0.7407, "step": 12553 }, { "epoch": 0.29, "learning_rate": 8.3157754690555e-06, "loss": 0.6098, "step": 12554 }, { "epoch": 0.29, "learning_rate": 8.315494356822374e-06, "loss": 0.89, "step": 12555 }, { "epoch": 0.29, "learning_rate": 8.315213225883452e-06, "loss": 0.8305, "step": 12556 }, { "epoch": 0.29, "learning_rate": 8.314932076240326e-06, "loss": 0.8422, "step": 12557 }, { "epoch": 0.29, "learning_rate": 8.314650907894575e-06, "loss": 0.9481, "step": 12558 }, { "epoch": 0.29, "learning_rate": 8.314369720847791e-06, "loss": 0.8479, "step": 12559 }, { "epoch": 0.29, "learning_rate": 8.31408851510156e-06, "loss": 1.0384, "step": 12560 }, { "epoch": 0.29, "learning_rate": 8.313807290657464e-06, "loss": 1.0247, "step": 12561 }, { "epoch": 0.29, "learning_rate": 8.313526047517094e-06, "loss": 0.6805, "step": 12562 }, { "epoch": 0.29, "learning_rate": 8.313244785682036e-06, "loss": 0.7965, "step": 12563 }, { "epoch": 0.29, "learning_rate": 8.312963505153875e-06, "loss": 0.8765, "step": 12564 }, { "epoch": 0.29, "learning_rate": 8.312682205934201e-06, "loss": 1.1027, "step": 12565 }, { "epoch": 0.29, "learning_rate": 8.312400888024599e-06, "loss": 1.0285, "step": 12566 }, { "epoch": 0.29, "learning_rate": 8.312119551426655e-06, "loss": 0.9497, "step": 12567 }, { "epoch": 0.29, "learning_rate": 8.31183819614196e-06, "loss": 0.864, "step": 12568 }, { "epoch": 0.29, "learning_rate": 8.311556822172095e-06, "loss": 0.9352, "step": 12569 }, { "epoch": 0.29, "learning_rate": 8.311275429518657e-06, "loss": 1.1898, "step": 12570 }, { "epoch": 0.29, "learning_rate": 8.310994018183225e-06, "loss": 1.1505, "step": 12571 }, { "epoch": 0.29, "learning_rate": 8.31071258816739e-06, "loss": 0.9562, "step": 12572 }, { "epoch": 0.29, "learning_rate": 8.31043113947274e-06, "loss": 0.5883, "step": 12573 }, { "epoch": 0.29, "learning_rate": 8.310149672100865e-06, "loss": 1.0518, "step": 12574 }, { "epoch": 0.29, "learning_rate": 8.309868186053349e-06, "loss": 0.9206, "step": 12575 }, { "epoch": 0.29, "learning_rate": 8.30958668133178e-06, "loss": 1.2729, "step": 12576 }, { "epoch": 0.29, "learning_rate": 8.30930515793775e-06, "loss": 0.8554, "step": 12577 }, { "epoch": 0.29, "learning_rate": 8.309023615872846e-06, "loss": 0.9865, "step": 12578 }, { "epoch": 0.29, "learning_rate": 8.308742055138654e-06, "loss": 0.9268, "step": 12579 }, { "epoch": 0.29, "learning_rate": 8.308460475736765e-06, "loss": 1.2239, "step": 12580 }, { "epoch": 0.29, "learning_rate": 8.30817887766877e-06, "loss": 1.2987, "step": 12581 }, { "epoch": 0.29, "learning_rate": 8.30789726093625e-06, "loss": 1.0878, "step": 12582 }, { "epoch": 0.29, "learning_rate": 8.307615625540802e-06, "loss": 1.1841, "step": 12583 }, { "epoch": 0.29, "learning_rate": 8.30733397148401e-06, "loss": 0.9035, "step": 12584 }, { "epoch": 0.29, "learning_rate": 8.307052298767464e-06, "loss": 1.1991, "step": 12585 }, { "epoch": 0.29, "learning_rate": 8.306770607392755e-06, "loss": 0.9753, "step": 12586 }, { "epoch": 0.29, "learning_rate": 8.306488897361473e-06, "loss": 0.8415, "step": 12587 }, { "epoch": 0.29, "learning_rate": 8.306207168675203e-06, "loss": 0.8635, "step": 12588 }, { "epoch": 0.29, "learning_rate": 8.305925421335538e-06, "loss": 0.9262, "step": 12589 }, { "epoch": 0.29, "learning_rate": 8.305643655344067e-06, "loss": 0.75, "step": 12590 }, { "epoch": 0.29, "learning_rate": 8.305361870702377e-06, "loss": 1.0454, "step": 12591 }, { "epoch": 0.29, "learning_rate": 8.305080067412064e-06, "loss": 1.0485, "step": 12592 }, { "epoch": 0.29, "learning_rate": 8.304798245474712e-06, "loss": 0.9347, "step": 12593 }, { "epoch": 0.29, "learning_rate": 8.304516404891912e-06, "loss": 1.0621, "step": 12594 }, { "epoch": 0.29, "learning_rate": 8.304234545665257e-06, "loss": 0.735, "step": 12595 }, { "epoch": 0.29, "learning_rate": 8.303952667796335e-06, "loss": 0.9465, "step": 12596 }, { "epoch": 0.29, "learning_rate": 8.303670771286736e-06, "loss": 1.1205, "step": 12597 }, { "epoch": 0.29, "learning_rate": 8.303388856138053e-06, "loss": 1.2844, "step": 12598 }, { "epoch": 0.29, "learning_rate": 8.303106922351872e-06, "loss": 0.8565, "step": 12599 }, { "epoch": 0.29, "learning_rate": 8.302824969929788e-06, "loss": 1.1674, "step": 12600 }, { "epoch": 0.29, "learning_rate": 8.30254299887339e-06, "loss": 0.8872, "step": 12601 }, { "epoch": 0.29, "learning_rate": 8.30226100918427e-06, "loss": 0.8777, "step": 12602 }, { "epoch": 0.29, "learning_rate": 8.301979000864018e-06, "loss": 1.0643, "step": 12603 }, { "epoch": 0.29, "learning_rate": 8.301696973914223e-06, "loss": 1.067, "step": 12604 }, { "epoch": 0.29, "learning_rate": 8.30141492833648e-06, "loss": 1.1065, "step": 12605 }, { "epoch": 0.29, "learning_rate": 8.301132864132378e-06, "loss": 1.0933, "step": 12606 }, { "epoch": 0.29, "learning_rate": 8.30085078130351e-06, "loss": 0.812, "step": 12607 }, { "epoch": 0.29, "learning_rate": 8.300568679851465e-06, "loss": 0.815, "step": 12608 }, { "epoch": 0.29, "learning_rate": 8.300286559777836e-06, "loss": 1.0347, "step": 12609 }, { "epoch": 0.29, "learning_rate": 8.300004421084216e-06, "loss": 0.9389, "step": 12610 }, { "epoch": 0.29, "learning_rate": 8.299722263772194e-06, "loss": 0.9583, "step": 12611 }, { "epoch": 0.29, "learning_rate": 8.299440087843364e-06, "loss": 1.0225, "step": 12612 }, { "epoch": 0.29, "learning_rate": 8.299157893299317e-06, "loss": 1.0572, "step": 12613 }, { "epoch": 0.29, "learning_rate": 8.298875680141647e-06, "loss": 1.0979, "step": 12614 }, { "epoch": 0.29, "learning_rate": 8.298593448371944e-06, "loss": 0.9205, "step": 12615 }, { "epoch": 0.29, "learning_rate": 8.298311197991802e-06, "loss": 0.9461, "step": 12616 }, { "epoch": 0.29, "learning_rate": 8.29802892900281e-06, "loss": 0.8953, "step": 12617 }, { "epoch": 0.29, "learning_rate": 8.297746641406566e-06, "loss": 1.0625, "step": 12618 }, { "epoch": 0.29, "learning_rate": 8.297464335204657e-06, "loss": 0.9738, "step": 12619 }, { "epoch": 0.29, "learning_rate": 8.297182010398681e-06, "loss": 0.6201, "step": 12620 }, { "epoch": 0.29, "learning_rate": 8.296899666990229e-06, "loss": 1.1152, "step": 12621 }, { "epoch": 0.29, "learning_rate": 8.29661730498089e-06, "loss": 0.9498, "step": 12622 }, { "epoch": 0.29, "learning_rate": 8.296334924372263e-06, "loss": 0.8088, "step": 12623 }, { "epoch": 0.29, "learning_rate": 8.296052525165937e-06, "loss": 1.0002, "step": 12624 }, { "epoch": 0.29, "learning_rate": 8.295770107363507e-06, "loss": 1.0587, "step": 12625 }, { "epoch": 0.29, "learning_rate": 8.295487670966566e-06, "loss": 0.8686, "step": 12626 }, { "epoch": 0.29, "learning_rate": 8.29520521597671e-06, "loss": 0.9024, "step": 12627 }, { "epoch": 0.29, "learning_rate": 8.29492274239553e-06, "loss": 0.7582, "step": 12628 }, { "epoch": 0.29, "learning_rate": 8.294640250224618e-06, "loss": 1.0335, "step": 12629 }, { "epoch": 0.29, "learning_rate": 8.29435773946557e-06, "loss": 0.8163, "step": 12630 }, { "epoch": 0.29, "learning_rate": 8.294075210119981e-06, "loss": 0.7627, "step": 12631 }, { "epoch": 0.29, "learning_rate": 8.293792662189443e-06, "loss": 1.0235, "step": 12632 }, { "epoch": 0.29, "learning_rate": 8.293510095675551e-06, "loss": 0.9152, "step": 12633 }, { "epoch": 0.29, "learning_rate": 8.2932275105799e-06, "loss": 1.1449, "step": 12634 }, { "epoch": 0.29, "learning_rate": 8.29294490690408e-06, "loss": 1.0409, "step": 12635 }, { "epoch": 0.29, "learning_rate": 8.292662284649693e-06, "loss": 0.8774, "step": 12636 }, { "epoch": 0.29, "learning_rate": 8.292379643818327e-06, "loss": 0.8453, "step": 12637 }, { "epoch": 0.29, "learning_rate": 8.29209698441158e-06, "loss": 0.9279, "step": 12638 }, { "epoch": 0.29, "learning_rate": 8.291814306431046e-06, "loss": 1.1957, "step": 12639 }, { "epoch": 0.29, "learning_rate": 8.291531609878318e-06, "loss": 1.0837, "step": 12640 }, { "epoch": 0.29, "learning_rate": 8.291248894754993e-06, "loss": 1.1144, "step": 12641 }, { "epoch": 0.29, "learning_rate": 8.290966161062667e-06, "loss": 0.9536, "step": 12642 }, { "epoch": 0.29, "learning_rate": 8.290683408802934e-06, "loss": 0.8366, "step": 12643 }, { "epoch": 0.29, "learning_rate": 8.290400637977387e-06, "loss": 1.2711, "step": 12644 }, { "epoch": 0.29, "learning_rate": 8.290117848587624e-06, "loss": 0.8451, "step": 12645 }, { "epoch": 0.29, "learning_rate": 8.289835040635239e-06, "loss": 0.9502, "step": 12646 }, { "epoch": 0.29, "learning_rate": 8.289552214121831e-06, "loss": 0.8294, "step": 12647 }, { "epoch": 0.29, "learning_rate": 8.289269369048991e-06, "loss": 1.1821, "step": 12648 }, { "epoch": 0.29, "learning_rate": 8.28898650541832e-06, "loss": 0.9262, "step": 12649 }, { "epoch": 0.29, "learning_rate": 8.288703623231407e-06, "loss": 0.905, "step": 12650 }, { "epoch": 0.29, "learning_rate": 8.288420722489854e-06, "loss": 0.8927, "step": 12651 }, { "epoch": 0.29, "learning_rate": 8.288137803195254e-06, "loss": 0.8986, "step": 12652 }, { "epoch": 0.29, "learning_rate": 8.287854865349205e-06, "loss": 1.0465, "step": 12653 }, { "epoch": 0.29, "learning_rate": 8.287571908953303e-06, "loss": 0.9821, "step": 12654 }, { "epoch": 0.29, "learning_rate": 8.287288934009143e-06, "loss": 0.9546, "step": 12655 }, { "epoch": 0.29, "learning_rate": 8.287005940518321e-06, "loss": 0.9038, "step": 12656 }, { "epoch": 0.29, "learning_rate": 8.286722928482438e-06, "loss": 0.9469, "step": 12657 }, { "epoch": 0.29, "learning_rate": 8.286439897903084e-06, "loss": 0.8692, "step": 12658 }, { "epoch": 0.29, "learning_rate": 8.286156848781864e-06, "loss": 0.9345, "step": 12659 }, { "epoch": 0.29, "learning_rate": 8.285873781120368e-06, "loss": 1.1656, "step": 12660 }, { "epoch": 0.29, "learning_rate": 8.285590694920196e-06, "loss": 1.0902, "step": 12661 }, { "epoch": 0.29, "learning_rate": 8.285307590182945e-06, "loss": 1.1397, "step": 12662 }, { "epoch": 0.29, "learning_rate": 8.285024466910212e-06, "loss": 1.0325, "step": 12663 }, { "epoch": 0.29, "learning_rate": 8.284741325103596e-06, "loss": 1.2371, "step": 12664 }, { "epoch": 0.29, "learning_rate": 8.28445816476469e-06, "loss": 0.9695, "step": 12665 }, { "epoch": 0.29, "learning_rate": 8.284174985895097e-06, "loss": 0.9897, "step": 12666 }, { "epoch": 0.29, "learning_rate": 8.28389178849641e-06, "loss": 1.0644, "step": 12667 }, { "epoch": 0.29, "learning_rate": 8.28360857257023e-06, "loss": 1.0676, "step": 12668 }, { "epoch": 0.29, "learning_rate": 8.283325338118154e-06, "loss": 0.9187, "step": 12669 }, { "epoch": 0.29, "learning_rate": 8.283042085141778e-06, "loss": 1.0216, "step": 12670 }, { "epoch": 0.29, "learning_rate": 8.282758813642703e-06, "loss": 0.9539, "step": 12671 }, { "epoch": 0.29, "learning_rate": 8.282475523622526e-06, "loss": 1.1904, "step": 12672 }, { "epoch": 0.29, "learning_rate": 8.282192215082846e-06, "loss": 0.7766, "step": 12673 }, { "epoch": 0.29, "learning_rate": 8.28190888802526e-06, "loss": 1.1158, "step": 12674 }, { "epoch": 0.29, "learning_rate": 8.281625542451369e-06, "loss": 1.0248, "step": 12675 }, { "epoch": 0.29, "learning_rate": 8.281342178362768e-06, "loss": 0.9915, "step": 12676 }, { "epoch": 0.29, "learning_rate": 8.281058795761058e-06, "loss": 0.9099, "step": 12677 }, { "epoch": 0.29, "learning_rate": 8.280775394647838e-06, "loss": 0.8873, "step": 12678 }, { "epoch": 0.29, "learning_rate": 8.280491975024706e-06, "loss": 1.0933, "step": 12679 }, { "epoch": 0.29, "learning_rate": 8.280208536893261e-06, "loss": 0.7789, "step": 12680 }, { "epoch": 0.29, "learning_rate": 8.279925080255105e-06, "loss": 0.8536, "step": 12681 }, { "epoch": 0.29, "learning_rate": 8.279641605111832e-06, "loss": 0.8696, "step": 12682 }, { "epoch": 0.29, "learning_rate": 8.279358111465044e-06, "loss": 0.7161, "step": 12683 }, { "epoch": 0.29, "learning_rate": 8.279074599316343e-06, "loss": 1.1156, "step": 12684 }, { "epoch": 0.29, "learning_rate": 8.278791068667324e-06, "loss": 1.0301, "step": 12685 }, { "epoch": 0.29, "learning_rate": 8.278507519519589e-06, "loss": 0.8937, "step": 12686 }, { "epoch": 0.29, "learning_rate": 8.27822395187474e-06, "loss": 0.909, "step": 12687 }, { "epoch": 0.29, "learning_rate": 8.277940365734371e-06, "loss": 1.2473, "step": 12688 }, { "epoch": 0.29, "learning_rate": 8.277656761100088e-06, "loss": 1.1576, "step": 12689 }, { "epoch": 0.29, "learning_rate": 8.277373137973487e-06, "loss": 0.9095, "step": 12690 }, { "epoch": 0.29, "learning_rate": 8.27708949635617e-06, "loss": 0.82, "step": 12691 }, { "epoch": 0.29, "learning_rate": 8.276805836249737e-06, "loss": 0.7818, "step": 12692 }, { "epoch": 0.29, "learning_rate": 8.276522157655789e-06, "loss": 0.9931, "step": 12693 }, { "epoch": 0.29, "learning_rate": 8.276238460575925e-06, "loss": 1.2038, "step": 12694 }, { "epoch": 0.29, "learning_rate": 8.275954745011748e-06, "loss": 0.8527, "step": 12695 }, { "epoch": 0.29, "learning_rate": 8.275671010964857e-06, "loss": 0.7981, "step": 12696 }, { "epoch": 0.29, "learning_rate": 8.27538725843685e-06, "loss": 0.9983, "step": 12697 }, { "epoch": 0.29, "learning_rate": 8.275103487429334e-06, "loss": 1.0296, "step": 12698 }, { "epoch": 0.29, "learning_rate": 8.274819697943906e-06, "loss": 1.1361, "step": 12699 }, { "epoch": 0.29, "learning_rate": 8.274535889982167e-06, "loss": 0.9047, "step": 12700 }, { "epoch": 0.29, "learning_rate": 8.27425206354572e-06, "loss": 0.7626, "step": 12701 }, { "epoch": 0.29, "learning_rate": 8.273968218636166e-06, "loss": 1.3138, "step": 12702 }, { "epoch": 0.29, "learning_rate": 8.273684355255104e-06, "loss": 1.0534, "step": 12703 }, { "epoch": 0.29, "learning_rate": 8.27340047340414e-06, "loss": 0.9622, "step": 12704 }, { "epoch": 0.29, "learning_rate": 8.273116573084871e-06, "loss": 0.8189, "step": 12705 }, { "epoch": 0.29, "learning_rate": 8.272832654298903e-06, "loss": 1.1439, "step": 12706 }, { "epoch": 0.29, "learning_rate": 8.272548717047834e-06, "loss": 0.8007, "step": 12707 }, { "epoch": 0.29, "learning_rate": 8.272264761333271e-06, "loss": 0.9187, "step": 12708 }, { "epoch": 0.29, "learning_rate": 8.27198078715681e-06, "loss": 0.7108, "step": 12709 }, { "epoch": 0.29, "learning_rate": 8.271696794520057e-06, "loss": 0.9023, "step": 12710 }, { "epoch": 0.29, "learning_rate": 8.271412783424613e-06, "loss": 1.2293, "step": 12711 }, { "epoch": 0.29, "learning_rate": 8.27112875387208e-06, "loss": 1.1228, "step": 12712 }, { "epoch": 0.29, "learning_rate": 8.27084470586406e-06, "loss": 0.8862, "step": 12713 }, { "epoch": 0.29, "learning_rate": 8.270560639402159e-06, "loss": 0.87, "step": 12714 }, { "epoch": 0.29, "learning_rate": 8.270276554487976e-06, "loss": 0.9899, "step": 12715 }, { "epoch": 0.29, "learning_rate": 8.269992451123117e-06, "loss": 0.7301, "step": 12716 }, { "epoch": 0.29, "learning_rate": 8.269708329309181e-06, "loss": 0.9425, "step": 12717 }, { "epoch": 0.29, "learning_rate": 8.269424189047774e-06, "loss": 1.105, "step": 12718 }, { "epoch": 0.29, "learning_rate": 8.269140030340496e-06, "loss": 1.1185, "step": 12719 }, { "epoch": 0.29, "learning_rate": 8.268855853188956e-06, "loss": 0.9894, "step": 12720 }, { "epoch": 0.3, "learning_rate": 8.26857165759475e-06, "loss": 0.8445, "step": 12721 }, { "epoch": 0.3, "learning_rate": 8.268287443559487e-06, "loss": 0.9178, "step": 12722 }, { "epoch": 0.3, "learning_rate": 8.268003211084769e-06, "loss": 0.8508, "step": 12723 }, { "epoch": 0.3, "learning_rate": 8.267718960172198e-06, "loss": 0.7514, "step": 12724 }, { "epoch": 0.3, "learning_rate": 8.26743469082338e-06, "loss": 1.0418, "step": 12725 }, { "epoch": 0.3, "learning_rate": 8.267150403039916e-06, "loss": 0.9883, "step": 12726 }, { "epoch": 0.3, "learning_rate": 8.266866096823412e-06, "loss": 0.7828, "step": 12727 }, { "epoch": 0.3, "learning_rate": 8.266581772175473e-06, "loss": 0.8334, "step": 12728 }, { "epoch": 0.3, "learning_rate": 8.266297429097702e-06, "loss": 1.1808, "step": 12729 }, { "epoch": 0.3, "learning_rate": 8.266013067591704e-06, "loss": 1.0613, "step": 12730 }, { "epoch": 0.3, "learning_rate": 8.265728687659078e-06, "loss": 0.8475, "step": 12731 }, { "epoch": 0.3, "learning_rate": 8.265444289301436e-06, "loss": 1.1014, "step": 12732 }, { "epoch": 0.3, "learning_rate": 8.265159872520378e-06, "loss": 1.2287, "step": 12733 }, { "epoch": 0.3, "learning_rate": 8.264875437317513e-06, "loss": 0.8262, "step": 12734 }, { "epoch": 0.3, "learning_rate": 8.26459098369444e-06, "loss": 0.9218, "step": 12735 }, { "epoch": 0.3, "learning_rate": 8.264306511652769e-06, "loss": 0.9435, "step": 12736 }, { "epoch": 0.3, "learning_rate": 8.2640220211941e-06, "loss": 0.9651, "step": 12737 }, { "epoch": 0.3, "learning_rate": 8.263737512320043e-06, "loss": 1.0463, "step": 12738 }, { "epoch": 0.3, "learning_rate": 8.263452985032199e-06, "loss": 0.7415, "step": 12739 }, { "epoch": 0.3, "learning_rate": 8.263168439332178e-06, "loss": 1.2033, "step": 12740 }, { "epoch": 0.3, "learning_rate": 8.26288387522158e-06, "loss": 0.7518, "step": 12741 }, { "epoch": 0.3, "learning_rate": 8.262599292702013e-06, "loss": 1.0364, "step": 12742 }, { "epoch": 0.3, "learning_rate": 8.262314691775085e-06, "loss": 1.0256, "step": 12743 }, { "epoch": 0.3, "learning_rate": 8.262030072442398e-06, "loss": 1.0806, "step": 12744 }, { "epoch": 0.3, "learning_rate": 8.26174543470556e-06, "loss": 0.9402, "step": 12745 }, { "epoch": 0.3, "learning_rate": 8.261460778566176e-06, "loss": 0.7478, "step": 12746 }, { "epoch": 0.3, "learning_rate": 8.261176104025852e-06, "loss": 1.0875, "step": 12747 }, { "epoch": 0.3, "learning_rate": 8.260891411086193e-06, "loss": 0.9388, "step": 12748 }, { "epoch": 0.3, "learning_rate": 8.260606699748808e-06, "loss": 0.6984, "step": 12749 }, { "epoch": 0.3, "learning_rate": 8.260321970015301e-06, "loss": 0.8124, "step": 12750 }, { "epoch": 0.3, "learning_rate": 8.260037221887279e-06, "loss": 0.8467, "step": 12751 }, { "epoch": 0.3, "learning_rate": 8.25975245536635e-06, "loss": 0.9568, "step": 12752 }, { "epoch": 0.3, "learning_rate": 8.259467670454117e-06, "loss": 0.7146, "step": 12753 }, { "epoch": 0.3, "learning_rate": 8.259182867152192e-06, "loss": 0.82, "step": 12754 }, { "epoch": 0.3, "learning_rate": 8.258898045462177e-06, "loss": 1.0808, "step": 12755 }, { "epoch": 0.3, "learning_rate": 8.25861320538568e-06, "loss": 0.8588, "step": 12756 }, { "epoch": 0.3, "learning_rate": 8.258328346924312e-06, "loss": 0.9821, "step": 12757 }, { "epoch": 0.3, "learning_rate": 8.258043470079676e-06, "loss": 1.0924, "step": 12758 }, { "epoch": 0.3, "learning_rate": 8.25775857485338e-06, "loss": 0.9783, "step": 12759 }, { "epoch": 0.3, "learning_rate": 8.257473661247032e-06, "loss": 0.7344, "step": 12760 }, { "epoch": 0.3, "learning_rate": 8.257188729262238e-06, "loss": 1.158, "step": 12761 }, { "epoch": 0.3, "learning_rate": 8.256903778900607e-06, "loss": 0.9402, "step": 12762 }, { "epoch": 0.3, "learning_rate": 8.256618810163749e-06, "loss": 1.011, "step": 12763 }, { "epoch": 0.3, "learning_rate": 8.256333823053264e-06, "loss": 0.8893, "step": 12764 }, { "epoch": 0.3, "learning_rate": 8.25604881757077e-06, "loss": 0.9105, "step": 12765 }, { "epoch": 0.3, "learning_rate": 8.255763793717868e-06, "loss": 1.1561, "step": 12766 }, { "epoch": 0.3, "learning_rate": 8.25547875149617e-06, "loss": 1.0309, "step": 12767 }, { "epoch": 0.3, "learning_rate": 8.25519369090728e-06, "loss": 1.0617, "step": 12768 }, { "epoch": 0.3, "learning_rate": 8.254908611952808e-06, "loss": 0.8173, "step": 12769 }, { "epoch": 0.3, "learning_rate": 8.254623514634366e-06, "loss": 1.0606, "step": 12770 }, { "epoch": 0.3, "learning_rate": 8.254338398953557e-06, "loss": 0.853, "step": 12771 }, { "epoch": 0.3, "learning_rate": 8.254053264911993e-06, "loss": 0.898, "step": 12772 }, { "epoch": 0.3, "learning_rate": 8.253768112511283e-06, "loss": 0.9501, "step": 12773 }, { "epoch": 0.3, "learning_rate": 8.253482941753032e-06, "loss": 1.16, "step": 12774 }, { "epoch": 0.3, "learning_rate": 8.253197752638853e-06, "loss": 1.1767, "step": 12775 }, { "epoch": 0.3, "learning_rate": 8.252912545170352e-06, "loss": 0.797, "step": 12776 }, { "epoch": 0.3, "learning_rate": 8.252627319349143e-06, "loss": 0.865, "step": 12777 }, { "epoch": 0.3, "learning_rate": 8.252342075176829e-06, "loss": 0.8291, "step": 12778 }, { "epoch": 0.3, "learning_rate": 8.252056812655026e-06, "loss": 0.8146, "step": 12779 }, { "epoch": 0.3, "learning_rate": 8.251771531785335e-06, "loss": 1.0228, "step": 12780 }, { "epoch": 0.3, "learning_rate": 8.251486232569373e-06, "loss": 0.6876, "step": 12781 }, { "epoch": 0.3, "learning_rate": 8.251200915008746e-06, "loss": 0.7695, "step": 12782 }, { "epoch": 0.3, "learning_rate": 8.250915579105064e-06, "loss": 0.9942, "step": 12783 }, { "epoch": 0.3, "learning_rate": 8.25063022485994e-06, "loss": 0.792, "step": 12784 }, { "epoch": 0.3, "learning_rate": 8.250344852274978e-06, "loss": 0.8008, "step": 12785 }, { "epoch": 0.3, "learning_rate": 8.250059461351792e-06, "loss": 0.8289, "step": 12786 }, { "epoch": 0.3, "learning_rate": 8.249774052091993e-06, "loss": 0.9175, "step": 12787 }, { "epoch": 0.3, "learning_rate": 8.24948862449719e-06, "loss": 1.3057, "step": 12788 }, { "epoch": 0.3, "learning_rate": 8.249203178568993e-06, "loss": 0.934, "step": 12789 }, { "epoch": 0.3, "learning_rate": 8.248917714309012e-06, "loss": 0.922, "step": 12790 }, { "epoch": 0.3, "learning_rate": 8.248632231718858e-06, "loss": 0.9274, "step": 12791 }, { "epoch": 0.3, "learning_rate": 8.248346730800143e-06, "loss": 1.1491, "step": 12792 }, { "epoch": 0.3, "learning_rate": 8.248061211554476e-06, "loss": 1.2396, "step": 12793 }, { "epoch": 0.3, "learning_rate": 8.24777567398347e-06, "loss": 0.649, "step": 12794 }, { "epoch": 0.3, "learning_rate": 8.247490118088732e-06, "loss": 1.2028, "step": 12795 }, { "epoch": 0.3, "learning_rate": 8.247204543871877e-06, "loss": 1.0459, "step": 12796 }, { "epoch": 0.3, "learning_rate": 8.246918951334516e-06, "loss": 0.8695, "step": 12797 }, { "epoch": 0.3, "learning_rate": 8.246633340478256e-06, "loss": 1.174, "step": 12798 }, { "epoch": 0.3, "learning_rate": 8.246347711304714e-06, "loss": 0.9332, "step": 12799 }, { "epoch": 0.3, "learning_rate": 8.246062063815498e-06, "loss": 0.8419, "step": 12800 }, { "epoch": 0.3, "learning_rate": 8.245776398012221e-06, "loss": 0.6467, "step": 12801 }, { "epoch": 0.3, "learning_rate": 8.245490713896495e-06, "loss": 0.7509, "step": 12802 }, { "epoch": 0.3, "learning_rate": 8.24520501146993e-06, "loss": 1.1399, "step": 12803 }, { "epoch": 0.3, "learning_rate": 8.244919290734139e-06, "loss": 1.0971, "step": 12804 }, { "epoch": 0.3, "learning_rate": 8.244633551690735e-06, "loss": 1.1091, "step": 12805 }, { "epoch": 0.3, "learning_rate": 8.24434779434133e-06, "loss": 0.8629, "step": 12806 }, { "epoch": 0.3, "learning_rate": 8.244062018687533e-06, "loss": 1.0409, "step": 12807 }, { "epoch": 0.3, "learning_rate": 8.24377622473096e-06, "loss": 0.8404, "step": 12808 }, { "epoch": 0.3, "learning_rate": 8.243490412473223e-06, "loss": 1.1698, "step": 12809 }, { "epoch": 0.3, "learning_rate": 8.243204581915933e-06, "loss": 1.1583, "step": 12810 }, { "epoch": 0.3, "learning_rate": 8.242918733060703e-06, "loss": 0.9813, "step": 12811 }, { "epoch": 0.3, "learning_rate": 8.242632865909146e-06, "loss": 1.0065, "step": 12812 }, { "epoch": 0.3, "learning_rate": 8.242346980462876e-06, "loss": 0.8879, "step": 12813 }, { "epoch": 0.3, "learning_rate": 8.242061076723504e-06, "loss": 0.8579, "step": 12814 }, { "epoch": 0.3, "learning_rate": 8.241775154692644e-06, "loss": 1.0668, "step": 12815 }, { "epoch": 0.3, "learning_rate": 8.24148921437191e-06, "loss": 1.1164, "step": 12816 }, { "epoch": 0.3, "learning_rate": 8.241203255762913e-06, "loss": 0.8927, "step": 12817 }, { "epoch": 0.3, "learning_rate": 8.240917278867269e-06, "loss": 1.0043, "step": 12818 }, { "epoch": 0.3, "learning_rate": 8.24063128368659e-06, "loss": 0.7449, "step": 12819 }, { "epoch": 0.3, "learning_rate": 8.240345270222487e-06, "loss": 1.0999, "step": 12820 }, { "epoch": 0.3, "learning_rate": 8.240059238476579e-06, "loss": 0.9788, "step": 12821 }, { "epoch": 0.3, "learning_rate": 8.239773188450477e-06, "loss": 0.9327, "step": 12822 }, { "epoch": 0.3, "learning_rate": 8.239487120145795e-06, "loss": 0.8619, "step": 12823 }, { "epoch": 0.3, "learning_rate": 8.239201033564146e-06, "loss": 0.8784, "step": 12824 }, { "epoch": 0.3, "learning_rate": 8.238914928707147e-06, "loss": 0.8015, "step": 12825 }, { "epoch": 0.3, "learning_rate": 8.23862880557641e-06, "loss": 1.0325, "step": 12826 }, { "epoch": 0.3, "learning_rate": 8.238342664173547e-06, "loss": 1.2964, "step": 12827 }, { "epoch": 0.3, "learning_rate": 8.238056504500177e-06, "loss": 0.8932, "step": 12828 }, { "epoch": 0.3, "learning_rate": 8.237770326557912e-06, "loss": 1.3082, "step": 12829 }, { "epoch": 0.3, "learning_rate": 8.237484130348367e-06, "loss": 1.1881, "step": 12830 }, { "epoch": 0.3, "learning_rate": 8.237197915873158e-06, "loss": 0.8077, "step": 12831 }, { "epoch": 0.3, "learning_rate": 8.236911683133897e-06, "loss": 1.1811, "step": 12832 }, { "epoch": 0.3, "learning_rate": 8.236625432132201e-06, "loss": 1.0136, "step": 12833 }, { "epoch": 0.3, "learning_rate": 8.236339162869685e-06, "loss": 0.868, "step": 12834 }, { "epoch": 0.3, "learning_rate": 8.236052875347962e-06, "loss": 1.0742, "step": 12835 }, { "epoch": 0.3, "learning_rate": 8.23576656956865e-06, "loss": 1.0935, "step": 12836 }, { "epoch": 0.3, "learning_rate": 8.235480245533364e-06, "loss": 0.9747, "step": 12837 }, { "epoch": 0.3, "learning_rate": 8.235193903243717e-06, "loss": 0.9674, "step": 12838 }, { "epoch": 0.3, "learning_rate": 8.234907542701327e-06, "loss": 0.9572, "step": 12839 }, { "epoch": 0.3, "learning_rate": 8.234621163907807e-06, "loss": 0.9215, "step": 12840 }, { "epoch": 0.3, "learning_rate": 8.234334766864775e-06, "loss": 0.7993, "step": 12841 }, { "epoch": 0.3, "learning_rate": 8.234048351573848e-06, "loss": 1.0985, "step": 12842 }, { "epoch": 0.3, "learning_rate": 8.233761918036638e-06, "loss": 0.8636, "step": 12843 }, { "epoch": 0.3, "learning_rate": 8.233475466254766e-06, "loss": 0.8078, "step": 12844 }, { "epoch": 0.3, "learning_rate": 8.233188996229842e-06, "loss": 1.1343, "step": 12845 }, { "epoch": 0.3, "learning_rate": 8.232902507963488e-06, "loss": 1.2572, "step": 12846 }, { "epoch": 0.3, "learning_rate": 8.232616001457317e-06, "loss": 1.0888, "step": 12847 }, { "epoch": 0.3, "learning_rate": 8.232329476712946e-06, "loss": 0.8218, "step": 12848 }, { "epoch": 0.3, "learning_rate": 8.232042933731994e-06, "loss": 1.0211, "step": 12849 }, { "epoch": 0.3, "learning_rate": 8.231756372516074e-06, "loss": 0.9323, "step": 12850 }, { "epoch": 0.3, "learning_rate": 8.231469793066804e-06, "loss": 0.9811, "step": 12851 }, { "epoch": 0.3, "learning_rate": 8.231183195385802e-06, "loss": 1.169, "step": 12852 }, { "epoch": 0.3, "learning_rate": 8.230896579474684e-06, "loss": 1.0185, "step": 12853 }, { "epoch": 0.3, "learning_rate": 8.230609945335068e-06, "loss": 1.3104, "step": 12854 }, { "epoch": 0.3, "learning_rate": 8.230323292968569e-06, "loss": 0.7873, "step": 12855 }, { "epoch": 0.3, "learning_rate": 8.230036622376807e-06, "loss": 1.1475, "step": 12856 }, { "epoch": 0.3, "learning_rate": 8.229749933561396e-06, "loss": 0.7749, "step": 12857 }, { "epoch": 0.3, "learning_rate": 8.229463226523958e-06, "loss": 0.81, "step": 12858 }, { "epoch": 0.3, "learning_rate": 8.229176501266107e-06, "loss": 0.7483, "step": 12859 }, { "epoch": 0.3, "learning_rate": 8.228889757789461e-06, "loss": 0.9572, "step": 12860 }, { "epoch": 0.3, "learning_rate": 8.22860299609564e-06, "loss": 1.2049, "step": 12861 }, { "epoch": 0.3, "learning_rate": 8.22831621618626e-06, "loss": 1.1916, "step": 12862 }, { "epoch": 0.3, "learning_rate": 8.22802941806294e-06, "loss": 0.8079, "step": 12863 }, { "epoch": 0.3, "learning_rate": 8.227742601727297e-06, "loss": 1.0606, "step": 12864 }, { "epoch": 0.3, "learning_rate": 8.227455767180951e-06, "loss": 0.868, "step": 12865 }, { "epoch": 0.3, "learning_rate": 8.227168914425517e-06, "loss": 1.0652, "step": 12866 }, { "epoch": 0.3, "learning_rate": 8.226882043462616e-06, "loss": 1.1964, "step": 12867 }, { "epoch": 0.3, "learning_rate": 8.226595154293868e-06, "loss": 0.9763, "step": 12868 }, { "epoch": 0.3, "learning_rate": 8.226308246920888e-06, "loss": 1.2865, "step": 12869 }, { "epoch": 0.3, "learning_rate": 8.226021321345297e-06, "loss": 1.0315, "step": 12870 }, { "epoch": 0.3, "learning_rate": 8.225734377568712e-06, "loss": 1.0464, "step": 12871 }, { "epoch": 0.3, "learning_rate": 8.225447415592753e-06, "loss": 0.8973, "step": 12872 }, { "epoch": 0.3, "learning_rate": 8.225160435419041e-06, "loss": 0.9664, "step": 12873 }, { "epoch": 0.3, "learning_rate": 8.224873437049191e-06, "loss": 0.9852, "step": 12874 }, { "epoch": 0.3, "learning_rate": 8.224586420484825e-06, "loss": 0.9554, "step": 12875 }, { "epoch": 0.3, "learning_rate": 8.224299385727563e-06, "loss": 0.8613, "step": 12876 }, { "epoch": 0.3, "learning_rate": 8.224012332779022e-06, "loss": 0.7884, "step": 12877 }, { "epoch": 0.3, "learning_rate": 8.223725261640823e-06, "loss": 1.0821, "step": 12878 }, { "epoch": 0.3, "learning_rate": 8.223438172314586e-06, "loss": 1.1444, "step": 12879 }, { "epoch": 0.3, "learning_rate": 8.223151064801929e-06, "loss": 0.988, "step": 12880 }, { "epoch": 0.3, "learning_rate": 8.222863939104472e-06, "loss": 1.2943, "step": 12881 }, { "epoch": 0.3, "learning_rate": 8.222576795223839e-06, "loss": 1.0312, "step": 12882 }, { "epoch": 0.3, "learning_rate": 8.222289633161645e-06, "loss": 0.7714, "step": 12883 }, { "epoch": 0.3, "learning_rate": 8.222002452919514e-06, "loss": 0.889, "step": 12884 }, { "epoch": 0.3, "learning_rate": 8.221715254499061e-06, "loss": 0.9824, "step": 12885 }, { "epoch": 0.3, "learning_rate": 8.221428037901911e-06, "loss": 1.0792, "step": 12886 }, { "epoch": 0.3, "learning_rate": 8.221140803129684e-06, "loss": 0.8709, "step": 12887 }, { "epoch": 0.3, "learning_rate": 8.220853550183999e-06, "loss": 0.8228, "step": 12888 }, { "epoch": 0.3, "learning_rate": 8.220566279066478e-06, "loss": 1.2087, "step": 12889 }, { "epoch": 0.3, "learning_rate": 8.22027898977874e-06, "loss": 0.9727, "step": 12890 }, { "epoch": 0.3, "learning_rate": 8.219991682322408e-06, "loss": 0.7648, "step": 12891 }, { "epoch": 0.3, "learning_rate": 8.219704356699102e-06, "loss": 1.0006, "step": 12892 }, { "epoch": 0.3, "learning_rate": 8.219417012910442e-06, "loss": 1.0488, "step": 12893 }, { "epoch": 0.3, "learning_rate": 8.21912965095805e-06, "loss": 1.0508, "step": 12894 }, { "epoch": 0.3, "learning_rate": 8.21884227084355e-06, "loss": 1.1614, "step": 12895 }, { "epoch": 0.3, "learning_rate": 8.218554872568558e-06, "loss": 0.8899, "step": 12896 }, { "epoch": 0.3, "learning_rate": 8.2182674561347e-06, "loss": 0.9237, "step": 12897 }, { "epoch": 0.3, "learning_rate": 8.217980021543594e-06, "loss": 0.9669, "step": 12898 }, { "epoch": 0.3, "learning_rate": 8.217692568796865e-06, "loss": 0.9558, "step": 12899 }, { "epoch": 0.3, "learning_rate": 8.217405097896133e-06, "loss": 1.3313, "step": 12900 }, { "epoch": 0.3, "learning_rate": 8.217117608843021e-06, "loss": 0.9159, "step": 12901 }, { "epoch": 0.3, "learning_rate": 8.21683010163915e-06, "loss": 1.1062, "step": 12902 }, { "epoch": 0.3, "learning_rate": 8.216542576286143e-06, "loss": 1.0971, "step": 12903 }, { "epoch": 0.3, "learning_rate": 8.216255032785621e-06, "loss": 1.0636, "step": 12904 }, { "epoch": 0.3, "learning_rate": 8.215967471139207e-06, "loss": 0.7938, "step": 12905 }, { "epoch": 0.3, "learning_rate": 8.215679891348523e-06, "loss": 0.9978, "step": 12906 }, { "epoch": 0.3, "learning_rate": 8.215392293415192e-06, "loss": 1.0086, "step": 12907 }, { "epoch": 0.3, "learning_rate": 8.215104677340834e-06, "loss": 0.9712, "step": 12908 }, { "epoch": 0.3, "learning_rate": 8.214817043127077e-06, "loss": 0.9508, "step": 12909 }, { "epoch": 0.3, "learning_rate": 8.21452939077554e-06, "loss": 0.8965, "step": 12910 }, { "epoch": 0.3, "learning_rate": 8.214241720287847e-06, "loss": 0.8833, "step": 12911 }, { "epoch": 0.3, "learning_rate": 8.213954031665622e-06, "loss": 0.7898, "step": 12912 }, { "epoch": 0.3, "learning_rate": 8.213666324910486e-06, "loss": 0.9304, "step": 12913 }, { "epoch": 0.3, "learning_rate": 8.213378600024062e-06, "loss": 1.0736, "step": 12914 }, { "epoch": 0.3, "learning_rate": 8.213090857007977e-06, "loss": 0.8867, "step": 12915 }, { "epoch": 0.3, "learning_rate": 8.21280309586385e-06, "loss": 0.9166, "step": 12916 }, { "epoch": 0.3, "learning_rate": 8.212515316593307e-06, "loss": 1.1392, "step": 12917 }, { "epoch": 0.3, "learning_rate": 8.21222751919797e-06, "loss": 0.8538, "step": 12918 }, { "epoch": 0.3, "learning_rate": 8.211939703679465e-06, "loss": 0.8899, "step": 12919 }, { "epoch": 0.3, "learning_rate": 8.211651870039416e-06, "loss": 0.9173, "step": 12920 }, { "epoch": 0.3, "learning_rate": 8.211364018279444e-06, "loss": 0.8712, "step": 12921 }, { "epoch": 0.3, "learning_rate": 8.211076148401175e-06, "loss": 1.0764, "step": 12922 }, { "epoch": 0.3, "learning_rate": 8.210788260406232e-06, "loss": 0.7331, "step": 12923 }, { "epoch": 0.3, "learning_rate": 8.210500354296242e-06, "loss": 1.3612, "step": 12924 }, { "epoch": 0.3, "learning_rate": 8.210212430072825e-06, "loss": 1.1075, "step": 12925 }, { "epoch": 0.3, "learning_rate": 8.209924487737609e-06, "loss": 1.1781, "step": 12926 }, { "epoch": 0.3, "learning_rate": 8.209636527292218e-06, "loss": 1.4715, "step": 12927 }, { "epoch": 0.3, "learning_rate": 8.209348548738275e-06, "loss": 0.9261, "step": 12928 }, { "epoch": 0.3, "learning_rate": 8.209060552077406e-06, "loss": 0.821, "step": 12929 }, { "epoch": 0.3, "learning_rate": 8.208772537311235e-06, "loss": 0.9327, "step": 12930 }, { "epoch": 0.3, "learning_rate": 8.208484504441387e-06, "loss": 0.9536, "step": 12931 }, { "epoch": 0.3, "learning_rate": 8.208196453469491e-06, "loss": 0.9037, "step": 12932 }, { "epoch": 0.3, "learning_rate": 8.207908384397165e-06, "loss": 0.9166, "step": 12933 }, { "epoch": 0.3, "learning_rate": 8.20762029722604e-06, "loss": 1.0364, "step": 12934 }, { "epoch": 0.3, "learning_rate": 8.20733219195774e-06, "loss": 0.8995, "step": 12935 }, { "epoch": 0.3, "learning_rate": 8.207044068593888e-06, "loss": 0.8054, "step": 12936 }, { "epoch": 0.3, "learning_rate": 8.206755927136114e-06, "loss": 0.8425, "step": 12937 }, { "epoch": 0.3, "learning_rate": 8.206467767586039e-06, "loss": 0.9319, "step": 12938 }, { "epoch": 0.3, "learning_rate": 8.206179589945294e-06, "loss": 0.9361, "step": 12939 }, { "epoch": 0.3, "learning_rate": 8.205891394215499e-06, "loss": 0.829, "step": 12940 }, { "epoch": 0.3, "learning_rate": 8.205603180398283e-06, "loss": 0.7581, "step": 12941 }, { "epoch": 0.3, "learning_rate": 8.205314948495272e-06, "loss": 0.9854, "step": 12942 }, { "epoch": 0.3, "learning_rate": 8.205026698508095e-06, "loss": 0.9888, "step": 12943 }, { "epoch": 0.3, "learning_rate": 8.204738430438373e-06, "loss": 0.9071, "step": 12944 }, { "epoch": 0.3, "learning_rate": 8.204450144287733e-06, "loss": 0.9024, "step": 12945 }, { "epoch": 0.3, "learning_rate": 8.204161840057806e-06, "loss": 1.1301, "step": 12946 }, { "epoch": 0.3, "learning_rate": 8.203873517750214e-06, "loss": 1.037, "step": 12947 }, { "epoch": 0.3, "learning_rate": 8.203585177366586e-06, "loss": 0.9417, "step": 12948 }, { "epoch": 0.3, "learning_rate": 8.20329681890855e-06, "loss": 0.9691, "step": 12949 }, { "epoch": 0.3, "learning_rate": 8.203008442377728e-06, "loss": 1.019, "step": 12950 }, { "epoch": 0.3, "learning_rate": 8.202720047775753e-06, "loss": 0.8235, "step": 12951 }, { "epoch": 0.3, "learning_rate": 8.20243163510425e-06, "loss": 0.9304, "step": 12952 }, { "epoch": 0.3, "learning_rate": 8.202143204364844e-06, "loss": 1.1151, "step": 12953 }, { "epoch": 0.3, "learning_rate": 8.201854755559165e-06, "loss": 0.8443, "step": 12954 }, { "epoch": 0.3, "learning_rate": 8.201566288688835e-06, "loss": 0.8458, "step": 12955 }, { "epoch": 0.3, "learning_rate": 8.20127780375549e-06, "loss": 0.753, "step": 12956 }, { "epoch": 0.3, "learning_rate": 8.200989300760754e-06, "loss": 0.9546, "step": 12957 }, { "epoch": 0.3, "learning_rate": 8.200700779706251e-06, "loss": 0.652, "step": 12958 }, { "epoch": 0.3, "learning_rate": 8.200412240593613e-06, "loss": 0.9041, "step": 12959 }, { "epoch": 0.3, "learning_rate": 8.200123683424469e-06, "loss": 0.6583, "step": 12960 }, { "epoch": 0.3, "learning_rate": 8.199835108200442e-06, "loss": 0.8066, "step": 12961 }, { "epoch": 0.3, "learning_rate": 8.199546514923164e-06, "loss": 0.8535, "step": 12962 }, { "epoch": 0.3, "learning_rate": 8.199257903594262e-06, "loss": 1.1719, "step": 12963 }, { "epoch": 0.3, "learning_rate": 8.198969274215366e-06, "loss": 0.8022, "step": 12964 }, { "epoch": 0.3, "learning_rate": 8.1986806267881e-06, "loss": 1.1422, "step": 12965 }, { "epoch": 0.3, "learning_rate": 8.198391961314099e-06, "loss": 0.9525, "step": 12966 }, { "epoch": 0.3, "learning_rate": 8.198103277794984e-06, "loss": 0.9441, "step": 12967 }, { "epoch": 0.3, "learning_rate": 8.19781457623239e-06, "loss": 0.7604, "step": 12968 }, { "epoch": 0.3, "learning_rate": 8.197525856627944e-06, "loss": 0.9599, "step": 12969 }, { "epoch": 0.3, "learning_rate": 8.197237118983275e-06, "loss": 1.106, "step": 12970 }, { "epoch": 0.3, "learning_rate": 8.196948363300011e-06, "loss": 0.9197, "step": 12971 }, { "epoch": 0.3, "learning_rate": 8.196659589579782e-06, "loss": 0.8877, "step": 12972 }, { "epoch": 0.3, "learning_rate": 8.196370797824215e-06, "loss": 0.8529, "step": 12973 }, { "epoch": 0.3, "learning_rate": 8.196081988034945e-06, "loss": 0.9775, "step": 12974 }, { "epoch": 0.3, "learning_rate": 8.195793160213596e-06, "loss": 0.7541, "step": 12975 }, { "epoch": 0.3, "learning_rate": 8.1955043143618e-06, "loss": 1.0136, "step": 12976 }, { "epoch": 0.3, "learning_rate": 8.195215450481185e-06, "loss": 0.8597, "step": 12977 }, { "epoch": 0.3, "learning_rate": 8.194926568573383e-06, "loss": 1.1654, "step": 12978 }, { "epoch": 0.3, "learning_rate": 8.194637668640022e-06, "loss": 0.8469, "step": 12979 }, { "epoch": 0.3, "learning_rate": 8.194348750682731e-06, "loss": 0.8244, "step": 12980 }, { "epoch": 0.3, "learning_rate": 8.194059814703144e-06, "loss": 1.2244, "step": 12981 }, { "epoch": 0.3, "learning_rate": 8.193770860702887e-06, "loss": 1.0125, "step": 12982 }, { "epoch": 0.3, "learning_rate": 8.193481888683594e-06, "loss": 0.7636, "step": 12983 }, { "epoch": 0.3, "learning_rate": 8.193192898646891e-06, "loss": 0.8642, "step": 12984 }, { "epoch": 0.3, "learning_rate": 8.192903890594412e-06, "loss": 0.5747, "step": 12985 }, { "epoch": 0.3, "learning_rate": 8.192614864527788e-06, "loss": 0.9427, "step": 12986 }, { "epoch": 0.3, "learning_rate": 8.192325820448645e-06, "loss": 1.0159, "step": 12987 }, { "epoch": 0.3, "learning_rate": 8.19203675835862e-06, "loss": 0.9155, "step": 12988 }, { "epoch": 0.3, "learning_rate": 8.191747678259339e-06, "loss": 1.1718, "step": 12989 }, { "epoch": 0.3, "learning_rate": 8.191458580152433e-06, "loss": 0.9593, "step": 12990 }, { "epoch": 0.3, "learning_rate": 8.191169464039538e-06, "loss": 0.9348, "step": 12991 }, { "epoch": 0.3, "learning_rate": 8.190880329922282e-06, "loss": 1.0926, "step": 12992 }, { "epoch": 0.3, "learning_rate": 8.190591177802293e-06, "loss": 1.1272, "step": 12993 }, { "epoch": 0.3, "learning_rate": 8.190302007681209e-06, "loss": 0.7996, "step": 12994 }, { "epoch": 0.3, "learning_rate": 8.190012819560656e-06, "loss": 1.0271, "step": 12995 }, { "epoch": 0.3, "learning_rate": 8.189723613442269e-06, "loss": 1.1839, "step": 12996 }, { "epoch": 0.3, "learning_rate": 8.189434389327677e-06, "loss": 0.8824, "step": 12997 }, { "epoch": 0.3, "learning_rate": 8.189145147218513e-06, "loss": 1.0792, "step": 12998 }, { "epoch": 0.3, "learning_rate": 8.18885588711641e-06, "loss": 0.8649, "step": 12999 }, { "epoch": 0.3, "learning_rate": 8.188566609022998e-06, "loss": 0.8546, "step": 13000 }, { "epoch": 0.3, "learning_rate": 8.188277312939912e-06, "loss": 0.9077, "step": 13001 }, { "epoch": 0.3, "learning_rate": 8.18798799886878e-06, "loss": 0.9603, "step": 13002 }, { "epoch": 0.3, "learning_rate": 8.187698666811239e-06, "loss": 0.9279, "step": 13003 }, { "epoch": 0.3, "learning_rate": 8.187409316768918e-06, "loss": 1.1562, "step": 13004 }, { "epoch": 0.3, "learning_rate": 8.18711994874345e-06, "loss": 0.931, "step": 13005 }, { "epoch": 0.3, "learning_rate": 8.186830562736467e-06, "loss": 0.9198, "step": 13006 }, { "epoch": 0.3, "learning_rate": 8.186541158749603e-06, "loss": 0.877, "step": 13007 }, { "epoch": 0.3, "learning_rate": 8.186251736784492e-06, "loss": 0.8018, "step": 13008 }, { "epoch": 0.3, "learning_rate": 8.185962296842764e-06, "loss": 1.0237, "step": 13009 }, { "epoch": 0.3, "learning_rate": 8.185672838926055e-06, "loss": 1.1827, "step": 13010 }, { "epoch": 0.3, "learning_rate": 8.185383363035995e-06, "loss": 1.0118, "step": 13011 }, { "epoch": 0.3, "learning_rate": 8.18509386917422e-06, "loss": 0.8131, "step": 13012 }, { "epoch": 0.3, "learning_rate": 8.184804357342363e-06, "loss": 1.1247, "step": 13013 }, { "epoch": 0.3, "learning_rate": 8.184514827542054e-06, "loss": 1.0652, "step": 13014 }, { "epoch": 0.3, "learning_rate": 8.18422527977493e-06, "loss": 0.9253, "step": 13015 }, { "epoch": 0.3, "learning_rate": 8.183935714042624e-06, "loss": 1.0106, "step": 13016 }, { "epoch": 0.3, "learning_rate": 8.183646130346768e-06, "loss": 0.8028, "step": 13017 }, { "epoch": 0.3, "learning_rate": 8.183356528688999e-06, "loss": 1.1864, "step": 13018 }, { "epoch": 0.3, "learning_rate": 8.183066909070946e-06, "loss": 0.6589, "step": 13019 }, { "epoch": 0.3, "learning_rate": 8.182777271494249e-06, "loss": 1.1293, "step": 13020 }, { "epoch": 0.3, "learning_rate": 8.182487615960538e-06, "loss": 0.8756, "step": 13021 }, { "epoch": 0.3, "learning_rate": 8.182197942471449e-06, "loss": 1.2019, "step": 13022 }, { "epoch": 0.3, "learning_rate": 8.181908251028614e-06, "loss": 0.8809, "step": 13023 }, { "epoch": 0.3, "learning_rate": 8.181618541633669e-06, "loss": 0.99, "step": 13024 }, { "epoch": 0.3, "learning_rate": 8.18132881428825e-06, "loss": 1.2674, "step": 13025 }, { "epoch": 0.3, "learning_rate": 8.18103906899399e-06, "loss": 1.0712, "step": 13026 }, { "epoch": 0.3, "learning_rate": 8.180749305752524e-06, "loss": 0.9325, "step": 13027 }, { "epoch": 0.3, "learning_rate": 8.180459524565487e-06, "loss": 0.9975, "step": 13028 }, { "epoch": 0.3, "learning_rate": 8.180169725434512e-06, "loss": 1.0212, "step": 13029 }, { "epoch": 0.3, "learning_rate": 8.179879908361238e-06, "loss": 0.8283, "step": 13030 }, { "epoch": 0.3, "learning_rate": 8.179590073347297e-06, "loss": 1.0406, "step": 13031 }, { "epoch": 0.3, "learning_rate": 8.179300220394324e-06, "loss": 0.8754, "step": 13032 }, { "epoch": 0.3, "learning_rate": 8.179010349503958e-06, "loss": 0.9455, "step": 13033 }, { "epoch": 0.3, "learning_rate": 8.17872046067783e-06, "loss": 0.8097, "step": 13034 }, { "epoch": 0.3, "learning_rate": 8.178430553917577e-06, "loss": 1.0293, "step": 13035 }, { "epoch": 0.3, "learning_rate": 8.178140629224835e-06, "loss": 1.1103, "step": 13036 }, { "epoch": 0.3, "learning_rate": 8.177850686601241e-06, "loss": 1.2496, "step": 13037 }, { "epoch": 0.3, "learning_rate": 8.177560726048428e-06, "loss": 0.9243, "step": 13038 }, { "epoch": 0.3, "learning_rate": 8.177270747568035e-06, "loss": 1.1107, "step": 13039 }, { "epoch": 0.3, "learning_rate": 8.176980751161696e-06, "loss": 0.9902, "step": 13040 }, { "epoch": 0.3, "learning_rate": 8.176690736831047e-06, "loss": 1.3682, "step": 13041 }, { "epoch": 0.3, "learning_rate": 8.176400704577727e-06, "loss": 1.0254, "step": 13042 }, { "epoch": 0.3, "learning_rate": 8.17611065440337e-06, "loss": 0.8358, "step": 13043 }, { "epoch": 0.3, "learning_rate": 8.17582058630961e-06, "loss": 0.7935, "step": 13044 }, { "epoch": 0.3, "learning_rate": 8.175530500298088e-06, "loss": 1.1273, "step": 13045 }, { "epoch": 0.3, "learning_rate": 8.175240396370439e-06, "loss": 1.034, "step": 13046 }, { "epoch": 0.3, "learning_rate": 8.1749502745283e-06, "loss": 1.0777, "step": 13047 }, { "epoch": 0.3, "learning_rate": 8.174660134773307e-06, "loss": 0.9561, "step": 13048 }, { "epoch": 0.3, "learning_rate": 8.174369977107097e-06, "loss": 0.8773, "step": 13049 }, { "epoch": 0.3, "learning_rate": 8.174079801531307e-06, "loss": 1.0781, "step": 13050 }, { "epoch": 0.3, "learning_rate": 8.173789608047576e-06, "loss": 0.9464, "step": 13051 }, { "epoch": 0.3, "learning_rate": 8.173499396657541e-06, "loss": 0.8331, "step": 13052 }, { "epoch": 0.3, "learning_rate": 8.173209167362837e-06, "loss": 0.8902, "step": 13053 }, { "epoch": 0.3, "learning_rate": 8.172918920165101e-06, "loss": 1.0005, "step": 13054 }, { "epoch": 0.3, "learning_rate": 8.172628655065974e-06, "loss": 0.8873, "step": 13055 }, { "epoch": 0.3, "learning_rate": 8.172338372067093e-06, "loss": 0.9032, "step": 13056 }, { "epoch": 0.3, "learning_rate": 8.172048071170094e-06, "loss": 0.9499, "step": 13057 }, { "epoch": 0.3, "learning_rate": 8.171757752376613e-06, "loss": 0.9519, "step": 13058 }, { "epoch": 0.3, "learning_rate": 8.171467415688293e-06, "loss": 0.9127, "step": 13059 }, { "epoch": 0.3, "learning_rate": 8.17117706110677e-06, "loss": 0.9985, "step": 13060 }, { "epoch": 0.3, "learning_rate": 8.17088668863368e-06, "loss": 1.266, "step": 13061 }, { "epoch": 0.3, "learning_rate": 8.170596298270664e-06, "loss": 0.9231, "step": 13062 }, { "epoch": 0.3, "learning_rate": 8.170305890019358e-06, "loss": 0.9526, "step": 13063 }, { "epoch": 0.3, "learning_rate": 8.170015463881403e-06, "loss": 0.8683, "step": 13064 }, { "epoch": 0.3, "learning_rate": 8.169725019858436e-06, "loss": 1.1154, "step": 13065 }, { "epoch": 0.3, "learning_rate": 8.169434557952096e-06, "loss": 1.0027, "step": 13066 }, { "epoch": 0.3, "learning_rate": 8.169144078164024e-06, "loss": 0.7255, "step": 13067 }, { "epoch": 0.3, "learning_rate": 8.168853580495855e-06, "loss": 0.8833, "step": 13068 }, { "epoch": 0.3, "learning_rate": 8.168563064949228e-06, "loss": 1.0063, "step": 13069 }, { "epoch": 0.3, "learning_rate": 8.168272531525786e-06, "loss": 0.8388, "step": 13070 }, { "epoch": 0.3, "learning_rate": 8.167981980227164e-06, "loss": 1.253, "step": 13071 }, { "epoch": 0.3, "learning_rate": 8.167691411055005e-06, "loss": 0.8747, "step": 13072 }, { "epoch": 0.3, "learning_rate": 8.167400824010945e-06, "loss": 0.9808, "step": 13073 }, { "epoch": 0.3, "learning_rate": 8.167110219096626e-06, "loss": 0.9652, "step": 13074 }, { "epoch": 0.3, "learning_rate": 8.166819596313687e-06, "loss": 1.0227, "step": 13075 }, { "epoch": 0.3, "learning_rate": 8.166528955663766e-06, "loss": 0.9633, "step": 13076 }, { "epoch": 0.3, "learning_rate": 8.166238297148506e-06, "loss": 0.893, "step": 13077 }, { "epoch": 0.3, "learning_rate": 8.165947620769543e-06, "loss": 1.0253, "step": 13078 }, { "epoch": 0.3, "learning_rate": 8.16565692652852e-06, "loss": 0.8955, "step": 13079 }, { "epoch": 0.3, "learning_rate": 8.165366214427075e-06, "loss": 1.1014, "step": 13080 }, { "epoch": 0.3, "learning_rate": 8.16507548446685e-06, "loss": 0.8496, "step": 13081 }, { "epoch": 0.3, "learning_rate": 8.164784736649482e-06, "loss": 1.1879, "step": 13082 }, { "epoch": 0.3, "learning_rate": 8.164493970976617e-06, "loss": 0.8499, "step": 13083 }, { "epoch": 0.3, "learning_rate": 8.164203187449891e-06, "loss": 1.0535, "step": 13084 }, { "epoch": 0.3, "learning_rate": 8.163912386070944e-06, "loss": 0.9371, "step": 13085 }, { "epoch": 0.3, "learning_rate": 8.163621566841421e-06, "loss": 1.1039, "step": 13086 }, { "epoch": 0.3, "learning_rate": 8.16333072976296e-06, "loss": 0.8092, "step": 13087 }, { "epoch": 0.3, "learning_rate": 8.163039874837201e-06, "loss": 0.7975, "step": 13088 }, { "epoch": 0.3, "learning_rate": 8.162749002065788e-06, "loss": 0.5899, "step": 13089 }, { "epoch": 0.3, "learning_rate": 8.16245811145036e-06, "loss": 0.9506, "step": 13090 }, { "epoch": 0.3, "learning_rate": 8.162167202992556e-06, "loss": 0.8928, "step": 13091 }, { "epoch": 0.3, "learning_rate": 8.161876276694022e-06, "loss": 0.7145, "step": 13092 }, { "epoch": 0.3, "learning_rate": 8.161585332556396e-06, "loss": 0.711, "step": 13093 }, { "epoch": 0.3, "learning_rate": 8.161294370581322e-06, "loss": 1.1184, "step": 13094 }, { "epoch": 0.3, "learning_rate": 8.16100339077044e-06, "loss": 0.9967, "step": 13095 }, { "epoch": 0.3, "learning_rate": 8.16071239312539e-06, "loss": 0.7965, "step": 13096 }, { "epoch": 0.3, "learning_rate": 8.160421377647816e-06, "loss": 1.0231, "step": 13097 }, { "epoch": 0.3, "learning_rate": 8.160130344339361e-06, "loss": 0.8446, "step": 13098 }, { "epoch": 0.3, "learning_rate": 8.159839293201665e-06, "loss": 0.9107, "step": 13099 }, { "epoch": 0.3, "learning_rate": 8.15954822423637e-06, "loss": 1.2819, "step": 13100 }, { "epoch": 0.3, "learning_rate": 8.15925713744512e-06, "loss": 1.1043, "step": 13101 }, { "epoch": 0.3, "learning_rate": 8.158966032829557e-06, "loss": 0.9725, "step": 13102 }, { "epoch": 0.3, "learning_rate": 8.15867491039132e-06, "loss": 1.1256, "step": 13103 }, { "epoch": 0.3, "learning_rate": 8.158383770132054e-06, "loss": 0.9268, "step": 13104 }, { "epoch": 0.3, "learning_rate": 8.158092612053403e-06, "loss": 0.8202, "step": 13105 }, { "epoch": 0.3, "learning_rate": 8.157801436157008e-06, "loss": 0.9367, "step": 13106 }, { "epoch": 0.3, "learning_rate": 8.157510242444513e-06, "loss": 1.0694, "step": 13107 }, { "epoch": 0.3, "learning_rate": 8.157219030917559e-06, "loss": 0.8302, "step": 13108 }, { "epoch": 0.3, "learning_rate": 8.15692780157779e-06, "loss": 1.0593, "step": 13109 }, { "epoch": 0.3, "learning_rate": 8.156636554426848e-06, "loss": 0.9074, "step": 13110 }, { "epoch": 0.3, "learning_rate": 8.15634528946638e-06, "loss": 0.8982, "step": 13111 }, { "epoch": 0.3, "learning_rate": 8.156054006698024e-06, "loss": 0.9358, "step": 13112 }, { "epoch": 0.3, "learning_rate": 8.155762706123426e-06, "loss": 0.9101, "step": 13113 }, { "epoch": 0.3, "learning_rate": 8.155471387744232e-06, "loss": 0.9778, "step": 13114 }, { "epoch": 0.3, "learning_rate": 8.155180051562082e-06, "loss": 0.9158, "step": 13115 }, { "epoch": 0.3, "learning_rate": 8.15488869757862e-06, "loss": 0.9227, "step": 13116 }, { "epoch": 0.3, "learning_rate": 8.15459732579549e-06, "loss": 1.2248, "step": 13117 }, { "epoch": 0.3, "learning_rate": 8.154305936214337e-06, "loss": 1.1262, "step": 13118 }, { "epoch": 0.3, "learning_rate": 8.154014528836806e-06, "loss": 1.2579, "step": 13119 }, { "epoch": 0.3, "learning_rate": 8.153723103664536e-06, "loss": 0.8232, "step": 13120 }, { "epoch": 0.3, "learning_rate": 8.153431660699179e-06, "loss": 1.0957, "step": 13121 }, { "epoch": 0.3, "learning_rate": 8.153140199942374e-06, "loss": 0.8641, "step": 13122 }, { "epoch": 0.3, "learning_rate": 8.152848721395764e-06, "loss": 0.9322, "step": 13123 }, { "epoch": 0.3, "learning_rate": 8.152557225060997e-06, "loss": 0.9838, "step": 13124 }, { "epoch": 0.3, "learning_rate": 8.152265710939717e-06, "loss": 1.0022, "step": 13125 }, { "epoch": 0.3, "learning_rate": 8.151974179033571e-06, "loss": 0.7527, "step": 13126 }, { "epoch": 0.3, "learning_rate": 8.151682629344197e-06, "loss": 0.9627, "step": 13127 }, { "epoch": 0.3, "learning_rate": 8.151391061873246e-06, "loss": 1.0452, "step": 13128 }, { "epoch": 0.3, "learning_rate": 8.151099476622359e-06, "loss": 0.7612, "step": 13129 }, { "epoch": 0.3, "learning_rate": 8.150807873593186e-06, "loss": 1.0318, "step": 13130 }, { "epoch": 0.3, "learning_rate": 8.150516252787369e-06, "loss": 0.8937, "step": 13131 }, { "epoch": 0.3, "learning_rate": 8.15022461420655e-06, "loss": 0.9204, "step": 13132 }, { "epoch": 0.3, "learning_rate": 8.149932957852382e-06, "loss": 1.1845, "step": 13133 }, { "epoch": 0.3, "learning_rate": 8.149641283726504e-06, "loss": 0.8677, "step": 13134 }, { "epoch": 0.3, "learning_rate": 8.149349591830564e-06, "loss": 1.0101, "step": 13135 }, { "epoch": 0.3, "learning_rate": 8.14905788216621e-06, "loss": 0.9382, "step": 13136 }, { "epoch": 0.3, "learning_rate": 8.148766154735084e-06, "loss": 1.0339, "step": 13137 }, { "epoch": 0.3, "learning_rate": 8.148474409538836e-06, "loss": 1.0216, "step": 13138 }, { "epoch": 0.3, "learning_rate": 8.148182646579106e-06, "loss": 0.8586, "step": 13139 }, { "epoch": 0.3, "learning_rate": 8.147890865857546e-06, "loss": 0.959, "step": 13140 }, { "epoch": 0.3, "learning_rate": 8.1475990673758e-06, "loss": 1.0809, "step": 13141 }, { "epoch": 0.3, "learning_rate": 8.147307251135513e-06, "loss": 0.8802, "step": 13142 }, { "epoch": 0.3, "learning_rate": 8.147015417138332e-06, "loss": 1.0193, "step": 13143 }, { "epoch": 0.3, "learning_rate": 8.146723565385906e-06, "loss": 1.0045, "step": 13144 }, { "epoch": 0.3, "learning_rate": 8.146431695879877e-06, "loss": 0.8091, "step": 13145 }, { "epoch": 0.3, "learning_rate": 8.146139808621897e-06, "loss": 1.0657, "step": 13146 }, { "epoch": 0.3, "learning_rate": 8.145847903613609e-06, "loss": 0.8362, "step": 13147 }, { "epoch": 0.3, "learning_rate": 8.14555598085666e-06, "loss": 0.9778, "step": 13148 }, { "epoch": 0.3, "learning_rate": 8.1452640403527e-06, "loss": 0.6473, "step": 13149 }, { "epoch": 0.3, "learning_rate": 8.144972082103374e-06, "loss": 0.8779, "step": 13150 }, { "epoch": 0.3, "learning_rate": 8.14468010611033e-06, "loss": 0.8984, "step": 13151 }, { "epoch": 0.31, "learning_rate": 8.144388112375214e-06, "loss": 0.8483, "step": 13152 }, { "epoch": 0.31, "learning_rate": 8.144096100899674e-06, "loss": 0.9938, "step": 13153 }, { "epoch": 0.31, "learning_rate": 8.143804071685358e-06, "loss": 1.0188, "step": 13154 }, { "epoch": 0.31, "learning_rate": 8.143512024733913e-06, "loss": 0.8305, "step": 13155 }, { "epoch": 0.31, "learning_rate": 8.143219960046986e-06, "loss": 1.0421, "step": 13156 }, { "epoch": 0.31, "learning_rate": 8.142927877626226e-06, "loss": 0.705, "step": 13157 }, { "epoch": 0.31, "learning_rate": 8.142635777473282e-06, "loss": 0.8079, "step": 13158 }, { "epoch": 0.31, "learning_rate": 8.1423436595898e-06, "loss": 0.6539, "step": 13159 }, { "epoch": 0.31, "learning_rate": 8.14205152397743e-06, "loss": 0.9673, "step": 13160 }, { "epoch": 0.31, "learning_rate": 8.141759370637816e-06, "loss": 0.8206, "step": 13161 }, { "epoch": 0.31, "learning_rate": 8.141467199572612e-06, "loss": 1.1269, "step": 13162 }, { "epoch": 0.31, "learning_rate": 8.141175010783464e-06, "loss": 1.0152, "step": 13163 }, { "epoch": 0.31, "learning_rate": 8.14088280427202e-06, "loss": 1.1318, "step": 13164 }, { "epoch": 0.31, "learning_rate": 8.140590580039926e-06, "loss": 0.7209, "step": 13165 }, { "epoch": 0.31, "learning_rate": 8.140298338088837e-06, "loss": 1.0302, "step": 13166 }, { "epoch": 0.31, "learning_rate": 8.140006078420395e-06, "loss": 0.9661, "step": 13167 }, { "epoch": 0.31, "learning_rate": 8.139713801036256e-06, "loss": 1.0244, "step": 13168 }, { "epoch": 0.31, "learning_rate": 8.139421505938063e-06, "loss": 1.0473, "step": 13169 }, { "epoch": 0.31, "learning_rate": 8.139129193127468e-06, "loss": 0.9959, "step": 13170 }, { "epoch": 0.31, "learning_rate": 8.13883686260612e-06, "loss": 0.7811, "step": 13171 }, { "epoch": 0.31, "learning_rate": 8.138544514375669e-06, "loss": 0.866, "step": 13172 }, { "epoch": 0.31, "learning_rate": 8.13825214843776e-06, "loss": 0.9988, "step": 13173 }, { "epoch": 0.31, "learning_rate": 8.137959764794048e-06, "loss": 0.9071, "step": 13174 }, { "epoch": 0.31, "learning_rate": 8.137667363446181e-06, "loss": 1.08, "step": 13175 }, { "epoch": 0.31, "learning_rate": 8.137374944395807e-06, "loss": 1.0139, "step": 13176 }, { "epoch": 0.31, "learning_rate": 8.137082507644577e-06, "loss": 0.8073, "step": 13177 }, { "epoch": 0.31, "learning_rate": 8.13679005319414e-06, "loss": 1.0193, "step": 13178 }, { "epoch": 0.31, "learning_rate": 8.13649758104615e-06, "loss": 0.8394, "step": 13179 }, { "epoch": 0.31, "learning_rate": 8.136205091202252e-06, "loss": 0.8002, "step": 13180 }, { "epoch": 0.31, "learning_rate": 8.135912583664099e-06, "loss": 1.2455, "step": 13181 }, { "epoch": 0.31, "learning_rate": 8.135620058433339e-06, "loss": 0.7818, "step": 13182 }, { "epoch": 0.31, "learning_rate": 8.135327515511625e-06, "loss": 1.0639, "step": 13183 }, { "epoch": 0.31, "learning_rate": 8.135034954900607e-06, "loss": 1.0554, "step": 13184 }, { "epoch": 0.31, "learning_rate": 8.134742376601934e-06, "loss": 1.1755, "step": 13185 }, { "epoch": 0.31, "learning_rate": 8.134449780617257e-06, "loss": 0.8039, "step": 13186 }, { "epoch": 0.31, "learning_rate": 8.134157166948229e-06, "loss": 0.7149, "step": 13187 }, { "epoch": 0.31, "learning_rate": 8.133864535596498e-06, "loss": 0.7829, "step": 13188 }, { "epoch": 0.31, "learning_rate": 8.133571886563718e-06, "loss": 0.949, "step": 13189 }, { "epoch": 0.31, "learning_rate": 8.133279219851538e-06, "loss": 1.0373, "step": 13190 }, { "epoch": 0.31, "learning_rate": 8.132986535461608e-06, "loss": 1.2251, "step": 13191 }, { "epoch": 0.31, "learning_rate": 8.132693833395585e-06, "loss": 0.9643, "step": 13192 }, { "epoch": 0.31, "learning_rate": 8.132401113655114e-06, "loss": 0.8371, "step": 13193 }, { "epoch": 0.31, "learning_rate": 8.132108376241849e-06, "loss": 0.9572, "step": 13194 }, { "epoch": 0.31, "learning_rate": 8.131815621157441e-06, "loss": 0.916, "step": 13195 }, { "epoch": 0.31, "learning_rate": 8.131522848403543e-06, "loss": 0.9284, "step": 13196 }, { "epoch": 0.31, "learning_rate": 8.131230057981807e-06, "loss": 0.8962, "step": 13197 }, { "epoch": 0.31, "learning_rate": 8.130937249893883e-06, "loss": 0.7915, "step": 13198 }, { "epoch": 0.31, "learning_rate": 8.130644424141425e-06, "loss": 0.9244, "step": 13199 }, { "epoch": 0.31, "learning_rate": 8.130351580726084e-06, "loss": 0.8841, "step": 13200 }, { "epoch": 0.31, "learning_rate": 8.13005871964951e-06, "loss": 0.7568, "step": 13201 }, { "epoch": 0.31, "learning_rate": 8.12976584091336e-06, "loss": 1.4159, "step": 13202 }, { "epoch": 0.31, "learning_rate": 8.129472944519283e-06, "loss": 0.687, "step": 13203 }, { "epoch": 0.31, "learning_rate": 8.129180030468932e-06, "loss": 1.1236, "step": 13204 }, { "epoch": 0.31, "learning_rate": 8.128887098763963e-06, "loss": 0.9379, "step": 13205 }, { "epoch": 0.31, "learning_rate": 8.128594149406023e-06, "loss": 1.0198, "step": 13206 }, { "epoch": 0.31, "learning_rate": 8.128301182396767e-06, "loss": 0.6885, "step": 13207 }, { "epoch": 0.31, "learning_rate": 8.12800819773785e-06, "loss": 1.434, "step": 13208 }, { "epoch": 0.31, "learning_rate": 8.127715195430924e-06, "loss": 0.9368, "step": 13209 }, { "epoch": 0.31, "learning_rate": 8.127422175477642e-06, "loss": 0.7321, "step": 13210 }, { "epoch": 0.31, "learning_rate": 8.127129137879655e-06, "loss": 1.0841, "step": 13211 }, { "epoch": 0.31, "learning_rate": 8.126836082638618e-06, "loss": 0.9983, "step": 13212 }, { "epoch": 0.31, "learning_rate": 8.126543009756187e-06, "loss": 1.0445, "step": 13213 }, { "epoch": 0.31, "learning_rate": 8.126249919234011e-06, "loss": 0.7845, "step": 13214 }, { "epoch": 0.31, "learning_rate": 8.125956811073745e-06, "loss": 1.0285, "step": 13215 }, { "epoch": 0.31, "learning_rate": 8.125663685277045e-06, "loss": 1.2075, "step": 13216 }, { "epoch": 0.31, "learning_rate": 8.125370541845563e-06, "loss": 0.8234, "step": 13217 }, { "epoch": 0.31, "learning_rate": 8.125077380780953e-06, "loss": 0.7561, "step": 13218 }, { "epoch": 0.31, "learning_rate": 8.124784202084868e-06, "loss": 1.3871, "step": 13219 }, { "epoch": 0.31, "learning_rate": 8.124491005758964e-06, "loss": 1.3385, "step": 13220 }, { "epoch": 0.31, "learning_rate": 8.124197791804892e-06, "loss": 0.8484, "step": 13221 }, { "epoch": 0.31, "learning_rate": 8.123904560224311e-06, "loss": 1.1666, "step": 13222 }, { "epoch": 0.31, "learning_rate": 8.123611311018872e-06, "loss": 1.1241, "step": 13223 }, { "epoch": 0.31, "learning_rate": 8.123318044190232e-06, "loss": 1.049, "step": 13224 }, { "epoch": 0.31, "learning_rate": 8.123024759740041e-06, "loss": 1.25, "step": 13225 }, { "epoch": 0.31, "learning_rate": 8.12273145766996e-06, "loss": 1.1352, "step": 13226 }, { "epoch": 0.31, "learning_rate": 8.12243813798164e-06, "loss": 1.0028, "step": 13227 }, { "epoch": 0.31, "learning_rate": 8.122144800676733e-06, "loss": 0.8251, "step": 13228 }, { "epoch": 0.31, "learning_rate": 8.121851445756901e-06, "loss": 1.078, "step": 13229 }, { "epoch": 0.31, "learning_rate": 8.121558073223795e-06, "loss": 0.933, "step": 13230 }, { "epoch": 0.31, "learning_rate": 8.12126468307907e-06, "loss": 1.0528, "step": 13231 }, { "epoch": 0.31, "learning_rate": 8.120971275324381e-06, "loss": 0.6973, "step": 13232 }, { "epoch": 0.31, "learning_rate": 8.120677849961385e-06, "loss": 1.0352, "step": 13233 }, { "epoch": 0.31, "learning_rate": 8.120384406991737e-06, "loss": 1.194, "step": 13234 }, { "epoch": 0.31, "learning_rate": 8.120090946417093e-06, "loss": 0.9204, "step": 13235 }, { "epoch": 0.31, "learning_rate": 8.119797468239108e-06, "loss": 0.8183, "step": 13236 }, { "epoch": 0.31, "learning_rate": 8.119503972459437e-06, "loss": 0.8628, "step": 13237 }, { "epoch": 0.31, "learning_rate": 8.119210459079739e-06, "loss": 0.8945, "step": 13238 }, { "epoch": 0.31, "learning_rate": 8.118916928101666e-06, "loss": 0.7912, "step": 13239 }, { "epoch": 0.31, "learning_rate": 8.118623379526875e-06, "loss": 1.0335, "step": 13240 }, { "epoch": 0.31, "learning_rate": 8.118329813357024e-06, "loss": 0.9613, "step": 13241 }, { "epoch": 0.31, "learning_rate": 8.118036229593768e-06, "loss": 0.9278, "step": 13242 }, { "epoch": 0.31, "learning_rate": 8.117742628238765e-06, "loss": 0.9443, "step": 13243 }, { "epoch": 0.31, "learning_rate": 8.117449009293668e-06, "loss": 1.1298, "step": 13244 }, { "epoch": 0.31, "learning_rate": 8.117155372760138e-06, "loss": 1.006, "step": 13245 }, { "epoch": 0.31, "learning_rate": 8.116861718639829e-06, "loss": 1.0627, "step": 13246 }, { "epoch": 0.31, "learning_rate": 8.116568046934396e-06, "loss": 0.8513, "step": 13247 }, { "epoch": 0.31, "learning_rate": 8.116274357645499e-06, "loss": 0.857, "step": 13248 }, { "epoch": 0.31, "learning_rate": 8.115980650774795e-06, "loss": 1.1408, "step": 13249 }, { "epoch": 0.31, "learning_rate": 8.11568692632394e-06, "loss": 0.9174, "step": 13250 }, { "epoch": 0.31, "learning_rate": 8.11539318429459e-06, "loss": 0.8289, "step": 13251 }, { "epoch": 0.31, "learning_rate": 8.115099424688407e-06, "loss": 1.0002, "step": 13252 }, { "epoch": 0.31, "learning_rate": 8.11480564750704e-06, "loss": 1.0023, "step": 13253 }, { "epoch": 0.31, "learning_rate": 8.114511852752156e-06, "loss": 0.9458, "step": 13254 }, { "epoch": 0.31, "learning_rate": 8.114218040425405e-06, "loss": 0.921, "step": 13255 }, { "epoch": 0.31, "learning_rate": 8.11392421052845e-06, "loss": 0.9565, "step": 13256 }, { "epoch": 0.31, "learning_rate": 8.113630363062943e-06, "loss": 0.8722, "step": 13257 }, { "epoch": 0.31, "learning_rate": 8.113336498030547e-06, "loss": 1.2212, "step": 13258 }, { "epoch": 0.31, "learning_rate": 8.11304261543292e-06, "loss": 1.0407, "step": 13259 }, { "epoch": 0.31, "learning_rate": 8.112748715271716e-06, "loss": 1.2001, "step": 13260 }, { "epoch": 0.31, "learning_rate": 8.112454797548596e-06, "loss": 1.4706, "step": 13261 }, { "epoch": 0.31, "learning_rate": 8.11216086226522e-06, "loss": 0.9846, "step": 13262 }, { "epoch": 0.31, "learning_rate": 8.11186690942324e-06, "loss": 0.7337, "step": 13263 }, { "epoch": 0.31, "learning_rate": 8.11157293902432e-06, "loss": 0.9396, "step": 13264 }, { "epoch": 0.31, "learning_rate": 8.11127895107012e-06, "loss": 0.7588, "step": 13265 }, { "epoch": 0.31, "learning_rate": 8.110984945562292e-06, "loss": 1.0197, "step": 13266 }, { "epoch": 0.31, "learning_rate": 8.110690922502501e-06, "loss": 0.9407, "step": 13267 }, { "epoch": 0.31, "learning_rate": 8.110396881892402e-06, "loss": 0.9942, "step": 13268 }, { "epoch": 0.31, "learning_rate": 8.110102823733657e-06, "loss": 0.7203, "step": 13269 }, { "epoch": 0.31, "learning_rate": 8.109808748027921e-06, "loss": 1.1941, "step": 13270 }, { "epoch": 0.31, "learning_rate": 8.109514654776857e-06, "loss": 0.7417, "step": 13271 }, { "epoch": 0.31, "learning_rate": 8.109220543982124e-06, "loss": 1.1497, "step": 13272 }, { "epoch": 0.31, "learning_rate": 8.10892641564538e-06, "loss": 0.9337, "step": 13273 }, { "epoch": 0.31, "learning_rate": 8.108632269768282e-06, "loss": 0.7572, "step": 13274 }, { "epoch": 0.31, "learning_rate": 8.108338106352493e-06, "loss": 0.9401, "step": 13275 }, { "epoch": 0.31, "learning_rate": 8.108043925399673e-06, "loss": 1.0726, "step": 13276 }, { "epoch": 0.31, "learning_rate": 8.10774972691148e-06, "loss": 0.7812, "step": 13277 }, { "epoch": 0.31, "learning_rate": 8.107455510889574e-06, "loss": 0.8693, "step": 13278 }, { "epoch": 0.31, "learning_rate": 8.107161277335618e-06, "loss": 0.8557, "step": 13279 }, { "epoch": 0.31, "learning_rate": 8.106867026251265e-06, "loss": 0.9042, "step": 13280 }, { "epoch": 0.31, "learning_rate": 8.106572757638184e-06, "loss": 0.8786, "step": 13281 }, { "epoch": 0.31, "learning_rate": 8.106278471498028e-06, "loss": 0.9427, "step": 13282 }, { "epoch": 0.31, "learning_rate": 8.105984167832461e-06, "loss": 0.9458, "step": 13283 }, { "epoch": 0.31, "learning_rate": 8.105689846643144e-06, "loss": 0.8606, "step": 13284 }, { "epoch": 0.31, "learning_rate": 8.105395507931733e-06, "loss": 1.3262, "step": 13285 }, { "epoch": 0.31, "learning_rate": 8.105101151699895e-06, "loss": 0.9209, "step": 13286 }, { "epoch": 0.31, "learning_rate": 8.104806777949284e-06, "loss": 0.81, "step": 13287 }, { "epoch": 0.31, "learning_rate": 8.104512386681568e-06, "loss": 1.0462, "step": 13288 }, { "epoch": 0.31, "learning_rate": 8.104217977898402e-06, "loss": 0.9768, "step": 13289 }, { "epoch": 0.31, "learning_rate": 8.103923551601448e-06, "loss": 1.0311, "step": 13290 }, { "epoch": 0.31, "learning_rate": 8.103629107792372e-06, "loss": 1.0368, "step": 13291 }, { "epoch": 0.31, "learning_rate": 8.103334646472829e-06, "loss": 0.7913, "step": 13292 }, { "epoch": 0.31, "learning_rate": 8.103040167644484e-06, "loss": 0.7566, "step": 13293 }, { "epoch": 0.31, "learning_rate": 8.102745671308997e-06, "loss": 0.9183, "step": 13294 }, { "epoch": 0.31, "learning_rate": 8.102451157468033e-06, "loss": 0.821, "step": 13295 }, { "epoch": 0.31, "learning_rate": 8.102156626123248e-06, "loss": 0.7768, "step": 13296 }, { "epoch": 0.31, "learning_rate": 8.101862077276305e-06, "loss": 1.0807, "step": 13297 }, { "epoch": 0.31, "learning_rate": 8.10156751092887e-06, "loss": 0.7206, "step": 13298 }, { "epoch": 0.31, "learning_rate": 8.101272927082599e-06, "loss": 1.0881, "step": 13299 }, { "epoch": 0.31, "learning_rate": 8.10097832573916e-06, "loss": 1.0672, "step": 13300 }, { "epoch": 0.31, "learning_rate": 8.10068370690021e-06, "loss": 0.6978, "step": 13301 }, { "epoch": 0.31, "learning_rate": 8.100389070567414e-06, "loss": 0.7078, "step": 13302 }, { "epoch": 0.31, "learning_rate": 8.100094416742435e-06, "loss": 0.9927, "step": 13303 }, { "epoch": 0.31, "learning_rate": 8.099799745426933e-06, "loss": 0.5581, "step": 13304 }, { "epoch": 0.31, "learning_rate": 8.099505056622572e-06, "loss": 1.2386, "step": 13305 }, { "epoch": 0.31, "learning_rate": 8.099210350331015e-06, "loss": 0.9623, "step": 13306 }, { "epoch": 0.31, "learning_rate": 8.098915626553923e-06, "loss": 1.3645, "step": 13307 }, { "epoch": 0.31, "learning_rate": 8.09862088529296e-06, "loss": 0.9379, "step": 13308 }, { "epoch": 0.31, "learning_rate": 8.09832612654979e-06, "loss": 1.0029, "step": 13309 }, { "epoch": 0.31, "learning_rate": 8.098031350326072e-06, "loss": 0.9855, "step": 13310 }, { "epoch": 0.31, "learning_rate": 8.097736556623473e-06, "loss": 0.7738, "step": 13311 }, { "epoch": 0.31, "learning_rate": 8.097441745443655e-06, "loss": 1.1348, "step": 13312 }, { "epoch": 0.31, "learning_rate": 8.097146916788284e-06, "loss": 1.2185, "step": 13313 }, { "epoch": 0.31, "learning_rate": 8.096852070659017e-06, "loss": 0.9704, "step": 13314 }, { "epoch": 0.31, "learning_rate": 8.096557207057525e-06, "loss": 0.9742, "step": 13315 }, { "epoch": 0.31, "learning_rate": 8.096262325985465e-06, "loss": 0.5669, "step": 13316 }, { "epoch": 0.31, "learning_rate": 8.095967427444502e-06, "loss": 0.733, "step": 13317 }, { "epoch": 0.31, "learning_rate": 8.095672511436306e-06, "loss": 0.9794, "step": 13318 }, { "epoch": 0.31, "learning_rate": 8.095377577962533e-06, "loss": 1.009, "step": 13319 }, { "epoch": 0.31, "learning_rate": 8.09508262702485e-06, "loss": 0.8037, "step": 13320 }, { "epoch": 0.31, "learning_rate": 8.094787658624922e-06, "loss": 1.1601, "step": 13321 }, { "epoch": 0.31, "learning_rate": 8.094492672764414e-06, "loss": 0.9836, "step": 13322 }, { "epoch": 0.31, "learning_rate": 8.094197669444988e-06, "loss": 0.7819, "step": 13323 }, { "epoch": 0.31, "learning_rate": 8.09390264866831e-06, "loss": 1.0881, "step": 13324 }, { "epoch": 0.31, "learning_rate": 8.093607610436043e-06, "loss": 0.9233, "step": 13325 }, { "epoch": 0.31, "learning_rate": 8.093312554749852e-06, "loss": 0.9429, "step": 13326 }, { "epoch": 0.31, "learning_rate": 8.0930174816114e-06, "loss": 1.2071, "step": 13327 }, { "epoch": 0.31, "learning_rate": 8.092722391022357e-06, "loss": 0.8409, "step": 13328 }, { "epoch": 0.31, "learning_rate": 8.092427282984383e-06, "loss": 1.0574, "step": 13329 }, { "epoch": 0.31, "learning_rate": 8.092132157499147e-06, "loss": 0.9157, "step": 13330 }, { "epoch": 0.31, "learning_rate": 8.091837014568308e-06, "loss": 0.7852, "step": 13331 }, { "epoch": 0.31, "learning_rate": 8.091541854193538e-06, "loss": 0.8629, "step": 13332 }, { "epoch": 0.31, "learning_rate": 8.091246676376497e-06, "loss": 1.1497, "step": 13333 }, { "epoch": 0.31, "learning_rate": 8.090951481118855e-06, "loss": 0.8792, "step": 13334 }, { "epoch": 0.31, "learning_rate": 8.090656268422273e-06, "loss": 0.9285, "step": 13335 }, { "epoch": 0.31, "learning_rate": 8.090361038288416e-06, "loss": 0.9713, "step": 13336 }, { "epoch": 0.31, "learning_rate": 8.090065790718958e-06, "loss": 1.0202, "step": 13337 }, { "epoch": 0.31, "learning_rate": 8.089770525715555e-06, "loss": 0.924, "step": 13338 }, { "epoch": 0.31, "learning_rate": 8.089475243279878e-06, "loss": 1.0332, "step": 13339 }, { "epoch": 0.31, "learning_rate": 8.089179943413592e-06, "loss": 1.0893, "step": 13340 }, { "epoch": 0.31, "learning_rate": 8.088884626118363e-06, "loss": 0.7039, "step": 13341 }, { "epoch": 0.31, "learning_rate": 8.088589291395857e-06, "loss": 0.8963, "step": 13342 }, { "epoch": 0.31, "learning_rate": 8.08829393924774e-06, "loss": 1.1605, "step": 13343 }, { "epoch": 0.31, "learning_rate": 8.087998569675677e-06, "loss": 0.9723, "step": 13344 }, { "epoch": 0.31, "learning_rate": 8.08770318268134e-06, "loss": 0.9019, "step": 13345 }, { "epoch": 0.31, "learning_rate": 8.087407778266387e-06, "loss": 0.8262, "step": 13346 }, { "epoch": 0.31, "learning_rate": 8.087112356432495e-06, "loss": 1.242, "step": 13347 }, { "epoch": 0.31, "learning_rate": 8.08681691718132e-06, "loss": 1.0004, "step": 13348 }, { "epoch": 0.31, "learning_rate": 8.086521460514534e-06, "loss": 1.1568, "step": 13349 }, { "epoch": 0.31, "learning_rate": 8.086225986433807e-06, "loss": 0.9474, "step": 13350 }, { "epoch": 0.31, "learning_rate": 8.085930494940801e-06, "loss": 0.9352, "step": 13351 }, { "epoch": 0.31, "learning_rate": 8.085634986037187e-06, "loss": 0.7911, "step": 13352 }, { "epoch": 0.31, "learning_rate": 8.085339459724629e-06, "loss": 0.9184, "step": 13353 }, { "epoch": 0.31, "learning_rate": 8.085043916004793e-06, "loss": 0.9692, "step": 13354 }, { "epoch": 0.31, "learning_rate": 8.084748354879353e-06, "loss": 1.0501, "step": 13355 }, { "epoch": 0.31, "learning_rate": 8.084452776349971e-06, "loss": 0.9875, "step": 13356 }, { "epoch": 0.31, "learning_rate": 8.084157180418318e-06, "loss": 0.7442, "step": 13357 }, { "epoch": 0.31, "learning_rate": 8.083861567086058e-06, "loss": 0.8153, "step": 13358 }, { "epoch": 0.31, "learning_rate": 8.08356593635486e-06, "loss": 0.9306, "step": 13359 }, { "epoch": 0.31, "learning_rate": 8.083270288226395e-06, "loss": 0.7516, "step": 13360 }, { "epoch": 0.31, "learning_rate": 8.082974622702327e-06, "loss": 0.7597, "step": 13361 }, { "epoch": 0.31, "learning_rate": 8.082678939784327e-06, "loss": 0.8401, "step": 13362 }, { "epoch": 0.31, "learning_rate": 8.08238323947406e-06, "loss": 1.0722, "step": 13363 }, { "epoch": 0.31, "learning_rate": 8.0820875217732e-06, "loss": 0.8838, "step": 13364 }, { "epoch": 0.31, "learning_rate": 8.08179178668341e-06, "loss": 0.8086, "step": 13365 }, { "epoch": 0.31, "learning_rate": 8.08149603420636e-06, "loss": 1.1194, "step": 13366 }, { "epoch": 0.31, "learning_rate": 8.081200264343719e-06, "loss": 0.912, "step": 13367 }, { "epoch": 0.31, "learning_rate": 8.080904477097156e-06, "loss": 1.2457, "step": 13368 }, { "epoch": 0.31, "learning_rate": 8.08060867246834e-06, "loss": 1.0835, "step": 13369 }, { "epoch": 0.31, "learning_rate": 8.080312850458937e-06, "loss": 0.9429, "step": 13370 }, { "epoch": 0.31, "learning_rate": 8.080017011070623e-06, "loss": 0.916, "step": 13371 }, { "epoch": 0.31, "learning_rate": 8.079721154305058e-06, "loss": 1.0163, "step": 13372 }, { "epoch": 0.31, "learning_rate": 8.079425280163919e-06, "loss": 0.7794, "step": 13373 }, { "epoch": 0.31, "learning_rate": 8.07912938864887e-06, "loss": 1.0076, "step": 13374 }, { "epoch": 0.31, "learning_rate": 8.078833479761584e-06, "loss": 1.1885, "step": 13375 }, { "epoch": 0.31, "learning_rate": 8.078537553503727e-06, "loss": 1.0317, "step": 13376 }, { "epoch": 0.31, "learning_rate": 8.078241609876972e-06, "loss": 1.0042, "step": 13377 }, { "epoch": 0.31, "learning_rate": 8.077945648882985e-06, "loss": 1.2377, "step": 13378 }, { "epoch": 0.31, "learning_rate": 8.077649670523442e-06, "loss": 0.879, "step": 13379 }, { "epoch": 0.31, "learning_rate": 8.077353674800005e-06, "loss": 0.8648, "step": 13380 }, { "epoch": 0.31, "learning_rate": 8.07705766171435e-06, "loss": 0.9725, "step": 13381 }, { "epoch": 0.31, "learning_rate": 8.076761631268145e-06, "loss": 0.9323, "step": 13382 }, { "epoch": 0.31, "learning_rate": 8.076465583463061e-06, "loss": 0.9518, "step": 13383 }, { "epoch": 0.31, "learning_rate": 8.076169518300764e-06, "loss": 1.2488, "step": 13384 }, { "epoch": 0.31, "learning_rate": 8.07587343578293e-06, "loss": 0.8854, "step": 13385 }, { "epoch": 0.31, "learning_rate": 8.075577335911227e-06, "loss": 0.9347, "step": 13386 }, { "epoch": 0.31, "learning_rate": 8.075281218687327e-06, "loss": 0.71, "step": 13387 }, { "epoch": 0.31, "learning_rate": 8.074985084112898e-06, "loss": 0.7259, "step": 13388 }, { "epoch": 0.31, "learning_rate": 8.074688932189614e-06, "loss": 1.1396, "step": 13389 }, { "epoch": 0.31, "learning_rate": 8.074392762919143e-06, "loss": 0.9742, "step": 13390 }, { "epoch": 0.31, "learning_rate": 8.074096576303157e-06, "loss": 0.6548, "step": 13391 }, { "epoch": 0.31, "learning_rate": 8.073800372343328e-06, "loss": 0.817, "step": 13392 }, { "epoch": 0.31, "learning_rate": 8.073504151041325e-06, "loss": 0.8427, "step": 13393 }, { "epoch": 0.31, "learning_rate": 8.073207912398822e-06, "loss": 0.816, "step": 13394 }, { "epoch": 0.31, "learning_rate": 8.072911656417488e-06, "loss": 1.1007, "step": 13395 }, { "epoch": 0.31, "learning_rate": 8.072615383098996e-06, "loss": 1.0266, "step": 13396 }, { "epoch": 0.31, "learning_rate": 8.072319092445018e-06, "loss": 1.0825, "step": 13397 }, { "epoch": 0.31, "learning_rate": 8.072022784457223e-06, "loss": 0.8074, "step": 13398 }, { "epoch": 0.31, "learning_rate": 8.071726459137286e-06, "loss": 0.7878, "step": 13399 }, { "epoch": 0.31, "learning_rate": 8.071430116486875e-06, "loss": 1.026, "step": 13400 }, { "epoch": 0.31, "learning_rate": 8.071133756507666e-06, "loss": 0.8367, "step": 13401 }, { "epoch": 0.31, "learning_rate": 8.070837379201328e-06, "loss": 0.8332, "step": 13402 }, { "epoch": 0.31, "learning_rate": 8.070540984569535e-06, "loss": 0.8363, "step": 13403 }, { "epoch": 0.31, "learning_rate": 8.07024457261396e-06, "loss": 1.0021, "step": 13404 }, { "epoch": 0.31, "learning_rate": 8.069948143336272e-06, "loss": 1.003, "step": 13405 }, { "epoch": 0.31, "learning_rate": 8.069651696738146e-06, "loss": 1.1303, "step": 13406 }, { "epoch": 0.31, "learning_rate": 8.069355232821254e-06, "loss": 1.064, "step": 13407 }, { "epoch": 0.31, "learning_rate": 8.06905875158727e-06, "loss": 1.0911, "step": 13408 }, { "epoch": 0.31, "learning_rate": 8.068762253037863e-06, "loss": 1.088, "step": 13409 }, { "epoch": 0.31, "learning_rate": 8.068465737174709e-06, "loss": 0.9373, "step": 13410 }, { "epoch": 0.31, "learning_rate": 8.068169203999481e-06, "loss": 0.9104, "step": 13411 }, { "epoch": 0.31, "learning_rate": 8.06787265351385e-06, "loss": 1.0049, "step": 13412 }, { "epoch": 0.31, "learning_rate": 8.06757608571949e-06, "loss": 0.9861, "step": 13413 }, { "epoch": 0.31, "learning_rate": 8.067279500618075e-06, "loss": 1.3195, "step": 13414 }, { "epoch": 0.31, "learning_rate": 8.066982898211276e-06, "loss": 0.9783, "step": 13415 }, { "epoch": 0.31, "learning_rate": 8.06668627850077e-06, "loss": 0.9739, "step": 13416 }, { "epoch": 0.31, "learning_rate": 8.066389641488228e-06, "loss": 0.8555, "step": 13417 }, { "epoch": 0.31, "learning_rate": 8.066092987175325e-06, "loss": 0.7579, "step": 13418 }, { "epoch": 0.31, "learning_rate": 8.065796315563733e-06, "loss": 0.6895, "step": 13419 }, { "epoch": 0.31, "learning_rate": 8.065499626655127e-06, "loss": 1.0315, "step": 13420 }, { "epoch": 0.31, "learning_rate": 8.06520292045118e-06, "loss": 1.2299, "step": 13421 }, { "epoch": 0.31, "learning_rate": 8.064906196953567e-06, "loss": 0.6718, "step": 13422 }, { "epoch": 0.31, "learning_rate": 8.064609456163963e-06, "loss": 0.9745, "step": 13423 }, { "epoch": 0.31, "learning_rate": 8.06431269808404e-06, "loss": 0.7842, "step": 13424 }, { "epoch": 0.31, "learning_rate": 8.064015922715472e-06, "loss": 0.9051, "step": 13425 }, { "epoch": 0.31, "learning_rate": 8.063719130059934e-06, "loss": 0.6778, "step": 13426 }, { "epoch": 0.31, "learning_rate": 8.063422320119102e-06, "loss": 0.9133, "step": 13427 }, { "epoch": 0.31, "learning_rate": 8.063125492894653e-06, "loss": 0.7073, "step": 13428 }, { "epoch": 0.31, "learning_rate": 8.062828648388254e-06, "loss": 0.7089, "step": 13429 }, { "epoch": 0.31, "learning_rate": 8.062531786601586e-06, "loss": 0.975, "step": 13430 }, { "epoch": 0.31, "learning_rate": 8.062234907536321e-06, "loss": 1.0295, "step": 13431 }, { "epoch": 0.31, "learning_rate": 8.061938011194137e-06, "loss": 1.1166, "step": 13432 }, { "epoch": 0.31, "learning_rate": 8.061641097576706e-06, "loss": 1.0843, "step": 13433 }, { "epoch": 0.31, "learning_rate": 8.061344166685703e-06, "loss": 0.8205, "step": 13434 }, { "epoch": 0.31, "learning_rate": 8.061047218522804e-06, "loss": 0.8721, "step": 13435 }, { "epoch": 0.31, "learning_rate": 8.060750253089688e-06, "loss": 0.7942, "step": 13436 }, { "epoch": 0.31, "learning_rate": 8.060453270388024e-06, "loss": 1.0705, "step": 13437 }, { "epoch": 0.31, "learning_rate": 8.060156270419493e-06, "loss": 0.9918, "step": 13438 }, { "epoch": 0.31, "learning_rate": 8.059859253185768e-06, "loss": 1.0094, "step": 13439 }, { "epoch": 0.31, "learning_rate": 8.059562218688524e-06, "loss": 1.0623, "step": 13440 }, { "epoch": 0.31, "learning_rate": 8.05926516692944e-06, "loss": 0.9043, "step": 13441 }, { "epoch": 0.31, "learning_rate": 8.058968097910188e-06, "loss": 1.0692, "step": 13442 }, { "epoch": 0.31, "learning_rate": 8.058671011632448e-06, "loss": 0.787, "step": 13443 }, { "epoch": 0.31, "learning_rate": 8.058373908097892e-06, "loss": 1.0452, "step": 13444 }, { "epoch": 0.31, "learning_rate": 8.0580767873082e-06, "loss": 0.7488, "step": 13445 }, { "epoch": 0.31, "learning_rate": 8.057779649265047e-06, "loss": 0.8272, "step": 13446 }, { "epoch": 0.31, "learning_rate": 8.057482493970109e-06, "loss": 1.0041, "step": 13447 }, { "epoch": 0.31, "learning_rate": 8.057185321425062e-06, "loss": 0.8631, "step": 13448 }, { "epoch": 0.31, "learning_rate": 8.056888131631583e-06, "loss": 0.9807, "step": 13449 }, { "epoch": 0.31, "learning_rate": 8.056590924591349e-06, "loss": 0.9611, "step": 13450 }, { "epoch": 0.31, "learning_rate": 8.05629370030604e-06, "loss": 0.9136, "step": 13451 }, { "epoch": 0.31, "learning_rate": 8.055996458777326e-06, "loss": 1.035, "step": 13452 }, { "epoch": 0.31, "learning_rate": 8.05569920000689e-06, "loss": 0.9673, "step": 13453 }, { "epoch": 0.31, "learning_rate": 8.055401923996406e-06, "loss": 0.882, "step": 13454 }, { "epoch": 0.31, "learning_rate": 8.055104630747553e-06, "loss": 1.2461, "step": 13455 }, { "epoch": 0.31, "learning_rate": 8.054807320262006e-06, "loss": 0.8705, "step": 13456 }, { "epoch": 0.31, "learning_rate": 8.054509992541444e-06, "loss": 0.7736, "step": 13457 }, { "epoch": 0.31, "learning_rate": 8.054212647587547e-06, "loss": 0.8946, "step": 13458 }, { "epoch": 0.31, "learning_rate": 8.053915285401987e-06, "loss": 0.7392, "step": 13459 }, { "epoch": 0.31, "learning_rate": 8.053617905986447e-06, "loss": 0.9186, "step": 13460 }, { "epoch": 0.31, "learning_rate": 8.053320509342601e-06, "loss": 0.9382, "step": 13461 }, { "epoch": 0.31, "learning_rate": 8.05302309547213e-06, "loss": 0.8505, "step": 13462 }, { "epoch": 0.31, "learning_rate": 8.052725664376708e-06, "loss": 1.2937, "step": 13463 }, { "epoch": 0.31, "learning_rate": 8.052428216058018e-06, "loss": 0.8418, "step": 13464 }, { "epoch": 0.31, "learning_rate": 8.052130750517733e-06, "loss": 0.8165, "step": 13465 }, { "epoch": 0.31, "learning_rate": 8.051833267757537e-06, "loss": 0.836, "step": 13466 }, { "epoch": 0.31, "learning_rate": 8.051535767779101e-06, "loss": 0.9536, "step": 13467 }, { "epoch": 0.31, "learning_rate": 8.051238250584112e-06, "loss": 0.9765, "step": 13468 }, { "epoch": 0.31, "learning_rate": 8.050940716174243e-06, "loss": 0.7897, "step": 13469 }, { "epoch": 0.31, "learning_rate": 8.050643164551173e-06, "loss": 0.7496, "step": 13470 }, { "epoch": 0.31, "learning_rate": 8.050345595716582e-06, "loss": 1.1022, "step": 13471 }, { "epoch": 0.31, "learning_rate": 8.05004800967215e-06, "loss": 0.7385, "step": 13472 }, { "epoch": 0.31, "learning_rate": 8.049750406419553e-06, "loss": 1.1363, "step": 13473 }, { "epoch": 0.31, "learning_rate": 8.049452785960473e-06, "loss": 0.8964, "step": 13474 }, { "epoch": 0.31, "learning_rate": 8.049155148296586e-06, "loss": 0.9066, "step": 13475 }, { "epoch": 0.31, "learning_rate": 8.048857493429574e-06, "loss": 0.8395, "step": 13476 }, { "epoch": 0.31, "learning_rate": 8.048559821361116e-06, "loss": 0.8971, "step": 13477 }, { "epoch": 0.31, "learning_rate": 8.04826213209289e-06, "loss": 0.8116, "step": 13478 }, { "epoch": 0.31, "learning_rate": 8.047964425626575e-06, "loss": 0.915, "step": 13479 }, { "epoch": 0.31, "learning_rate": 8.047666701963855e-06, "loss": 0.9904, "step": 13480 }, { "epoch": 0.31, "learning_rate": 8.047368961106406e-06, "loss": 0.8939, "step": 13481 }, { "epoch": 0.31, "learning_rate": 8.047071203055909e-06, "loss": 1.0196, "step": 13482 }, { "epoch": 0.31, "learning_rate": 8.046773427814043e-06, "loss": 1.2028, "step": 13483 }, { "epoch": 0.31, "learning_rate": 8.046475635382487e-06, "loss": 0.9428, "step": 13484 }, { "epoch": 0.31, "learning_rate": 8.046177825762925e-06, "loss": 0.5472, "step": 13485 }, { "epoch": 0.31, "learning_rate": 8.045879998957032e-06, "loss": 1.2083, "step": 13486 }, { "epoch": 0.31, "learning_rate": 8.045582154966494e-06, "loss": 0.9188, "step": 13487 }, { "epoch": 0.31, "learning_rate": 8.045284293792988e-06, "loss": 1.0143, "step": 13488 }, { "epoch": 0.31, "learning_rate": 8.044986415438193e-06, "loss": 1.0114, "step": 13489 }, { "epoch": 0.31, "learning_rate": 8.044688519903795e-06, "loss": 0.9392, "step": 13490 }, { "epoch": 0.31, "learning_rate": 8.04439060719147e-06, "loss": 0.7912, "step": 13491 }, { "epoch": 0.31, "learning_rate": 8.044092677302901e-06, "loss": 1.0986, "step": 13492 }, { "epoch": 0.31, "learning_rate": 8.043794730239766e-06, "loss": 0.9191, "step": 13493 }, { "epoch": 0.31, "learning_rate": 8.04349676600375e-06, "loss": 0.9169, "step": 13494 }, { "epoch": 0.31, "learning_rate": 8.043198784596533e-06, "loss": 0.6631, "step": 13495 }, { "epoch": 0.31, "learning_rate": 8.042900786019794e-06, "loss": 0.724, "step": 13496 }, { "epoch": 0.31, "learning_rate": 8.042602770275217e-06, "loss": 0.7417, "step": 13497 }, { "epoch": 0.31, "learning_rate": 8.042304737364481e-06, "loss": 0.9111, "step": 13498 }, { "epoch": 0.31, "learning_rate": 8.042006687289269e-06, "loss": 0.8287, "step": 13499 }, { "epoch": 0.31, "learning_rate": 8.041708620051262e-06, "loss": 1.2264, "step": 13500 }, { "epoch": 0.31, "learning_rate": 8.041410535652143e-06, "loss": 1.0378, "step": 13501 }, { "epoch": 0.31, "learning_rate": 8.04111243409359e-06, "loss": 1.0666, "step": 13502 }, { "epoch": 0.31, "learning_rate": 8.04081431537729e-06, "loss": 0.9066, "step": 13503 }, { "epoch": 0.31, "learning_rate": 8.04051617950492e-06, "loss": 0.9061, "step": 13504 }, { "epoch": 0.31, "learning_rate": 8.040218026478168e-06, "loss": 0.9801, "step": 13505 }, { "epoch": 0.31, "learning_rate": 8.03991985629871e-06, "loss": 0.9081, "step": 13506 }, { "epoch": 0.31, "learning_rate": 8.039621668968232e-06, "loss": 0.7544, "step": 13507 }, { "epoch": 0.31, "learning_rate": 8.039323464488415e-06, "loss": 0.9692, "step": 13508 }, { "epoch": 0.31, "learning_rate": 8.039025242860942e-06, "loss": 1.1348, "step": 13509 }, { "epoch": 0.31, "learning_rate": 8.038727004087495e-06, "loss": 0.9532, "step": 13510 }, { "epoch": 0.31, "learning_rate": 8.038428748169758e-06, "loss": 0.9452, "step": 13511 }, { "epoch": 0.31, "learning_rate": 8.038130475109412e-06, "loss": 0.9542, "step": 13512 }, { "epoch": 0.31, "learning_rate": 8.037832184908138e-06, "loss": 0.7514, "step": 13513 }, { "epoch": 0.31, "learning_rate": 8.037533877567625e-06, "loss": 1.0424, "step": 13514 }, { "epoch": 0.31, "learning_rate": 8.03723555308955e-06, "loss": 1.124, "step": 13515 }, { "epoch": 0.31, "learning_rate": 8.0369372114756e-06, "loss": 1.0286, "step": 13516 }, { "epoch": 0.31, "learning_rate": 8.036638852727457e-06, "loss": 0.9699, "step": 13517 }, { "epoch": 0.31, "learning_rate": 8.036340476846804e-06, "loss": 1.0922, "step": 13518 }, { "epoch": 0.31, "learning_rate": 8.036042083835325e-06, "loss": 0.7708, "step": 13519 }, { "epoch": 0.31, "learning_rate": 8.035743673694701e-06, "loss": 1.0529, "step": 13520 }, { "epoch": 0.31, "learning_rate": 8.035445246426619e-06, "loss": 1.2205, "step": 13521 }, { "epoch": 0.31, "learning_rate": 8.035146802032763e-06, "loss": 1.0265, "step": 13522 }, { "epoch": 0.31, "learning_rate": 8.034848340514813e-06, "loss": 1.0928, "step": 13523 }, { "epoch": 0.31, "learning_rate": 8.034549861874455e-06, "loss": 1.2016, "step": 13524 }, { "epoch": 0.31, "learning_rate": 8.034251366113374e-06, "loss": 1.1543, "step": 13525 }, { "epoch": 0.31, "learning_rate": 8.033952853233254e-06, "loss": 0.8703, "step": 13526 }, { "epoch": 0.31, "learning_rate": 8.033654323235777e-06, "loss": 1.0021, "step": 13527 }, { "epoch": 0.31, "learning_rate": 8.033355776122629e-06, "loss": 0.9745, "step": 13528 }, { "epoch": 0.31, "learning_rate": 8.033057211895494e-06, "loss": 1.0228, "step": 13529 }, { "epoch": 0.31, "learning_rate": 8.032758630556056e-06, "loss": 1.1015, "step": 13530 }, { "epoch": 0.31, "learning_rate": 8.032460032106002e-06, "loss": 0.8082, "step": 13531 }, { "epoch": 0.31, "learning_rate": 8.032161416547013e-06, "loss": 0.8808, "step": 13532 }, { "epoch": 0.31, "learning_rate": 8.031862783880776e-06, "loss": 1.0155, "step": 13533 }, { "epoch": 0.31, "learning_rate": 8.031564134108976e-06, "loss": 1.209, "step": 13534 }, { "epoch": 0.31, "learning_rate": 8.031265467233296e-06, "loss": 0.7806, "step": 13535 }, { "epoch": 0.31, "learning_rate": 8.030966783255422e-06, "loss": 0.8311, "step": 13536 }, { "epoch": 0.31, "learning_rate": 8.030668082177043e-06, "loss": 0.9906, "step": 13537 }, { "epoch": 0.31, "learning_rate": 8.030369363999838e-06, "loss": 0.9237, "step": 13538 }, { "epoch": 0.31, "learning_rate": 8.030070628725495e-06, "loss": 0.9531, "step": 13539 }, { "epoch": 0.31, "learning_rate": 8.029771876355701e-06, "loss": 0.9766, "step": 13540 }, { "epoch": 0.31, "learning_rate": 8.029473106892139e-06, "loss": 1.165, "step": 13541 }, { "epoch": 0.31, "learning_rate": 8.029174320336497e-06, "loss": 0.8878, "step": 13542 }, { "epoch": 0.31, "learning_rate": 8.028875516690457e-06, "loss": 0.8952, "step": 13543 }, { "epoch": 0.31, "learning_rate": 8.028576695955711e-06, "loss": 1.1389, "step": 13544 }, { "epoch": 0.31, "learning_rate": 8.028277858133939e-06, "loss": 0.8438, "step": 13545 }, { "epoch": 0.31, "learning_rate": 8.02797900322683e-06, "loss": 1.2047, "step": 13546 }, { "epoch": 0.31, "learning_rate": 8.02768013123607e-06, "loss": 1.0739, "step": 13547 }, { "epoch": 0.31, "learning_rate": 8.027381242163342e-06, "loss": 1.0978, "step": 13548 }, { "epoch": 0.31, "learning_rate": 8.027082336010337e-06, "loss": 0.9528, "step": 13549 }, { "epoch": 0.31, "learning_rate": 8.02678341277874e-06, "loss": 0.9469, "step": 13550 }, { "epoch": 0.31, "learning_rate": 8.026484472470236e-06, "loss": 0.9162, "step": 13551 }, { "epoch": 0.31, "learning_rate": 8.026185515086514e-06, "loss": 0.8663, "step": 13552 }, { "epoch": 0.31, "learning_rate": 8.025886540629255e-06, "loss": 1.0196, "step": 13553 }, { "epoch": 0.31, "learning_rate": 8.025587549100153e-06, "loss": 0.9929, "step": 13554 }, { "epoch": 0.31, "learning_rate": 8.025288540500893e-06, "loss": 0.9965, "step": 13555 }, { "epoch": 0.31, "learning_rate": 8.02498951483316e-06, "loss": 1.0779, "step": 13556 }, { "epoch": 0.31, "learning_rate": 8.02469047209864e-06, "loss": 1.0383, "step": 13557 }, { "epoch": 0.31, "learning_rate": 8.024391412299023e-06, "loss": 0.8628, "step": 13558 }, { "epoch": 0.31, "learning_rate": 8.024092335435996e-06, "loss": 1.0729, "step": 13559 }, { "epoch": 0.31, "learning_rate": 8.023793241511245e-06, "loss": 0.8424, "step": 13560 }, { "epoch": 0.31, "learning_rate": 8.02349413052646e-06, "loss": 0.898, "step": 13561 }, { "epoch": 0.31, "learning_rate": 8.023195002483324e-06, "loss": 0.9189, "step": 13562 }, { "epoch": 0.31, "learning_rate": 8.022895857383531e-06, "loss": 1.1156, "step": 13563 }, { "epoch": 0.31, "learning_rate": 8.022596695228762e-06, "loss": 0.9766, "step": 13564 }, { "epoch": 0.31, "learning_rate": 8.02229751602071e-06, "loss": 0.9638, "step": 13565 }, { "epoch": 0.31, "learning_rate": 8.02199831976106e-06, "loss": 0.8795, "step": 13566 }, { "epoch": 0.31, "learning_rate": 8.0216991064515e-06, "loss": 1.038, "step": 13567 }, { "epoch": 0.31, "learning_rate": 8.02139987609372e-06, "loss": 0.9683, "step": 13568 }, { "epoch": 0.31, "learning_rate": 8.021100628689409e-06, "loss": 0.7979, "step": 13569 }, { "epoch": 0.31, "learning_rate": 8.020801364240251e-06, "loss": 1.0243, "step": 13570 }, { "epoch": 0.31, "learning_rate": 8.020502082747939e-06, "loss": 0.9845, "step": 13571 }, { "epoch": 0.31, "learning_rate": 8.02020278421416e-06, "loss": 0.9911, "step": 13572 }, { "epoch": 0.31, "learning_rate": 8.019903468640601e-06, "loss": 0.9743, "step": 13573 }, { "epoch": 0.31, "learning_rate": 8.019604136028954e-06, "loss": 0.7938, "step": 13574 }, { "epoch": 0.31, "learning_rate": 8.019304786380903e-06, "loss": 1.0808, "step": 13575 }, { "epoch": 0.31, "learning_rate": 8.019005419698143e-06, "loss": 0.7763, "step": 13576 }, { "epoch": 0.31, "learning_rate": 8.018706035982357e-06, "loss": 1.093, "step": 13577 }, { "epoch": 0.31, "learning_rate": 8.018406635235238e-06, "loss": 1.036, "step": 13578 }, { "epoch": 0.31, "learning_rate": 8.018107217458475e-06, "loss": 1.0624, "step": 13579 }, { "epoch": 0.31, "learning_rate": 8.017807782653755e-06, "loss": 0.9568, "step": 13580 }, { "epoch": 0.31, "learning_rate": 8.017508330822769e-06, "loss": 0.939, "step": 13581 }, { "epoch": 0.31, "learning_rate": 8.017208861967207e-06, "loss": 0.8502, "step": 13582 }, { "epoch": 0.32, "learning_rate": 8.016909376088757e-06, "loss": 1.2334, "step": 13583 }, { "epoch": 0.32, "learning_rate": 8.01660987318911e-06, "loss": 0.9461, "step": 13584 }, { "epoch": 0.32, "learning_rate": 8.016310353269955e-06, "loss": 1.0303, "step": 13585 }, { "epoch": 0.32, "learning_rate": 8.016010816332982e-06, "loss": 1.0051, "step": 13586 }, { "epoch": 0.32, "learning_rate": 8.015711262379882e-06, "loss": 1.0425, "step": 13587 }, { "epoch": 0.32, "learning_rate": 8.015411691412344e-06, "loss": 1.2414, "step": 13588 }, { "epoch": 0.32, "learning_rate": 8.015112103432057e-06, "loss": 1.1377, "step": 13589 }, { "epoch": 0.32, "learning_rate": 8.014812498440713e-06, "loss": 1.0912, "step": 13590 }, { "epoch": 0.32, "learning_rate": 8.014512876440004e-06, "loss": 0.9796, "step": 13591 }, { "epoch": 0.32, "learning_rate": 8.014213237431617e-06, "loss": 1.0137, "step": 13592 }, { "epoch": 0.32, "learning_rate": 8.013913581417244e-06, "loss": 0.7597, "step": 13593 }, { "epoch": 0.32, "learning_rate": 8.013613908398575e-06, "loss": 1.018, "step": 13594 }, { "epoch": 0.32, "learning_rate": 8.013314218377301e-06, "loss": 0.9905, "step": 13595 }, { "epoch": 0.32, "learning_rate": 8.013014511355114e-06, "loss": 0.8489, "step": 13596 }, { "epoch": 0.32, "learning_rate": 8.012714787333705e-06, "loss": 0.967, "step": 13597 }, { "epoch": 0.32, "learning_rate": 8.012415046314763e-06, "loss": 1.1244, "step": 13598 }, { "epoch": 0.32, "learning_rate": 8.01211528829998e-06, "loss": 0.6132, "step": 13599 }, { "epoch": 0.32, "learning_rate": 8.011815513291047e-06, "loss": 1.0079, "step": 13600 }, { "epoch": 0.32, "learning_rate": 8.011515721289658e-06, "loss": 1.0853, "step": 13601 }, { "epoch": 0.32, "learning_rate": 8.011215912297498e-06, "loss": 0.7186, "step": 13602 }, { "epoch": 0.32, "learning_rate": 8.010916086316268e-06, "loss": 1.0593, "step": 13603 }, { "epoch": 0.32, "learning_rate": 8.01061624334765e-06, "loss": 0.9615, "step": 13604 }, { "epoch": 0.32, "learning_rate": 8.010316383393342e-06, "loss": 1.021, "step": 13605 }, { "epoch": 0.32, "learning_rate": 8.010016506455033e-06, "loss": 0.8454, "step": 13606 }, { "epoch": 0.32, "learning_rate": 8.009716612534415e-06, "loss": 0.8883, "step": 13607 }, { "epoch": 0.32, "learning_rate": 8.009416701633181e-06, "loss": 1.0023, "step": 13608 }, { "epoch": 0.32, "learning_rate": 8.009116773753023e-06, "loss": 1.2362, "step": 13609 }, { "epoch": 0.32, "learning_rate": 8.008816828895633e-06, "loss": 1.0883, "step": 13610 }, { "epoch": 0.32, "learning_rate": 8.008516867062703e-06, "loss": 1.1981, "step": 13611 }, { "epoch": 0.32, "learning_rate": 8.008216888255926e-06, "loss": 1.0637, "step": 13612 }, { "epoch": 0.32, "learning_rate": 8.007916892476994e-06, "loss": 1.0109, "step": 13613 }, { "epoch": 0.32, "learning_rate": 8.007616879727597e-06, "loss": 0.7976, "step": 13614 }, { "epoch": 0.32, "learning_rate": 8.007316850009434e-06, "loss": 1.0044, "step": 13615 }, { "epoch": 0.32, "learning_rate": 8.00701680332419e-06, "loss": 0.9423, "step": 13616 }, { "epoch": 0.32, "learning_rate": 8.006716739673564e-06, "loss": 1.081, "step": 13617 }, { "epoch": 0.32, "learning_rate": 8.006416659059247e-06, "loss": 0.9948, "step": 13618 }, { "epoch": 0.32, "learning_rate": 8.006116561482931e-06, "loss": 1.056, "step": 13619 }, { "epoch": 0.32, "learning_rate": 8.005816446946309e-06, "loss": 0.7156, "step": 13620 }, { "epoch": 0.32, "learning_rate": 8.005516315451075e-06, "loss": 0.738, "step": 13621 }, { "epoch": 0.32, "learning_rate": 8.005216166998923e-06, "loss": 1.1153, "step": 13622 }, { "epoch": 0.32, "learning_rate": 8.004916001591547e-06, "loss": 1.1195, "step": 13623 }, { "epoch": 0.32, "learning_rate": 8.00461581923064e-06, "loss": 0.846, "step": 13624 }, { "epoch": 0.32, "learning_rate": 8.004315619917893e-06, "loss": 1.1224, "step": 13625 }, { "epoch": 0.32, "learning_rate": 8.004015403655e-06, "loss": 0.7651, "step": 13626 }, { "epoch": 0.32, "learning_rate": 8.00371517044366e-06, "loss": 1.0084, "step": 13627 }, { "epoch": 0.32, "learning_rate": 8.003414920285561e-06, "loss": 1.1048, "step": 13628 }, { "epoch": 0.32, "learning_rate": 8.0031146531824e-06, "loss": 0.8672, "step": 13629 }, { "epoch": 0.32, "learning_rate": 8.002814369135871e-06, "loss": 1.0301, "step": 13630 }, { "epoch": 0.32, "learning_rate": 8.002514068147666e-06, "loss": 1.0436, "step": 13631 }, { "epoch": 0.32, "learning_rate": 8.002213750219484e-06, "loss": 1.1313, "step": 13632 }, { "epoch": 0.32, "learning_rate": 8.001913415353013e-06, "loss": 1.0052, "step": 13633 }, { "epoch": 0.32, "learning_rate": 8.001613063549952e-06, "loss": 1.0641, "step": 13634 }, { "epoch": 0.32, "learning_rate": 8.001312694811994e-06, "loss": 1.1488, "step": 13635 }, { "epoch": 0.32, "learning_rate": 8.001012309140835e-06, "loss": 0.7951, "step": 13636 }, { "epoch": 0.32, "learning_rate": 8.000711906538167e-06, "loss": 1.2119, "step": 13637 }, { "epoch": 0.32, "learning_rate": 8.000411487005686e-06, "loss": 1.1309, "step": 13638 }, { "epoch": 0.32, "learning_rate": 8.00011105054509e-06, "loss": 0.7763, "step": 13639 }, { "epoch": 0.32, "learning_rate": 7.99981059715807e-06, "loss": 1.046, "step": 13640 }, { "epoch": 0.32, "learning_rate": 7.999510126846322e-06, "loss": 0.7399, "step": 13641 }, { "epoch": 0.32, "learning_rate": 7.999209639611544e-06, "loss": 1.1798, "step": 13642 }, { "epoch": 0.32, "learning_rate": 7.998909135455427e-06, "loss": 0.8494, "step": 13643 }, { "epoch": 0.32, "learning_rate": 7.99860861437967e-06, "loss": 0.9365, "step": 13644 }, { "epoch": 0.32, "learning_rate": 7.998308076385966e-06, "loss": 0.8821, "step": 13645 }, { "epoch": 0.32, "learning_rate": 7.998007521476013e-06, "loss": 0.8274, "step": 13646 }, { "epoch": 0.32, "learning_rate": 7.997706949651505e-06, "loss": 1.0217, "step": 13647 }, { "epoch": 0.32, "learning_rate": 7.99740636091414e-06, "loss": 0.919, "step": 13648 }, { "epoch": 0.32, "learning_rate": 7.997105755265608e-06, "loss": 0.8219, "step": 13649 }, { "epoch": 0.32, "learning_rate": 7.996805132707613e-06, "loss": 1.1114, "step": 13650 }, { "epoch": 0.32, "learning_rate": 7.996504493241845e-06, "loss": 0.7809, "step": 13651 }, { "epoch": 0.32, "learning_rate": 7.996203836870005e-06, "loss": 0.9585, "step": 13652 }, { "epoch": 0.32, "learning_rate": 7.995903163593784e-06, "loss": 1.0567, "step": 13653 }, { "epoch": 0.32, "learning_rate": 7.995602473414884e-06, "loss": 1.1249, "step": 13654 }, { "epoch": 0.32, "learning_rate": 7.995301766334996e-06, "loss": 1.0415, "step": 13655 }, { "epoch": 0.32, "learning_rate": 7.995001042355818e-06, "loss": 1.0765, "step": 13656 }, { "epoch": 0.32, "learning_rate": 7.994700301479053e-06, "loss": 1.162, "step": 13657 }, { "epoch": 0.32, "learning_rate": 7.994399543706388e-06, "loss": 0.7129, "step": 13658 }, { "epoch": 0.32, "learning_rate": 7.994098769039527e-06, "loss": 1.0096, "step": 13659 }, { "epoch": 0.32, "learning_rate": 7.993797977480163e-06, "loss": 1.0384, "step": 13660 }, { "epoch": 0.32, "learning_rate": 7.993497169029994e-06, "loss": 0.9945, "step": 13661 }, { "epoch": 0.32, "learning_rate": 7.993196343690719e-06, "loss": 1.0497, "step": 13662 }, { "epoch": 0.32, "learning_rate": 7.992895501464032e-06, "loss": 0.7465, "step": 13663 }, { "epoch": 0.32, "learning_rate": 7.992594642351636e-06, "loss": 1.0761, "step": 13664 }, { "epoch": 0.32, "learning_rate": 7.992293766355221e-06, "loss": 1.199, "step": 13665 }, { "epoch": 0.32, "learning_rate": 7.991992873476488e-06, "loss": 1.244, "step": 13666 }, { "epoch": 0.32, "learning_rate": 7.991691963717137e-06, "loss": 0.9136, "step": 13667 }, { "epoch": 0.32, "learning_rate": 7.991391037078862e-06, "loss": 1.021, "step": 13668 }, { "epoch": 0.32, "learning_rate": 7.991090093563362e-06, "loss": 1.0384, "step": 13669 }, { "epoch": 0.32, "learning_rate": 7.990789133172336e-06, "loss": 1.1188, "step": 13670 }, { "epoch": 0.32, "learning_rate": 7.990488155907481e-06, "loss": 0.8233, "step": 13671 }, { "epoch": 0.32, "learning_rate": 7.990187161770496e-06, "loss": 1.2813, "step": 13672 }, { "epoch": 0.32, "learning_rate": 7.989886150763077e-06, "loss": 0.8294, "step": 13673 }, { "epoch": 0.32, "learning_rate": 7.989585122886925e-06, "loss": 0.8586, "step": 13674 }, { "epoch": 0.32, "learning_rate": 7.989284078143736e-06, "loss": 0.9177, "step": 13675 }, { "epoch": 0.32, "learning_rate": 7.98898301653521e-06, "loss": 0.9088, "step": 13676 }, { "epoch": 0.32, "learning_rate": 7.988681938063046e-06, "loss": 1.0363, "step": 13677 }, { "epoch": 0.32, "learning_rate": 7.98838084272894e-06, "loss": 0.8851, "step": 13678 }, { "epoch": 0.32, "learning_rate": 7.988079730534592e-06, "loss": 0.9454, "step": 13679 }, { "epoch": 0.32, "learning_rate": 7.987778601481704e-06, "loss": 1.3164, "step": 13680 }, { "epoch": 0.32, "learning_rate": 7.987477455571971e-06, "loss": 0.8594, "step": 13681 }, { "epoch": 0.32, "learning_rate": 7.987176292807092e-06, "loss": 0.8578, "step": 13682 }, { "epoch": 0.32, "learning_rate": 7.98687511318877e-06, "loss": 0.9076, "step": 13683 }, { "epoch": 0.32, "learning_rate": 7.9865739167187e-06, "loss": 0.7434, "step": 13684 }, { "epoch": 0.32, "learning_rate": 7.986272703398586e-06, "loss": 1.143, "step": 13685 }, { "epoch": 0.32, "learning_rate": 7.985971473230122e-06, "loss": 0.8679, "step": 13686 }, { "epoch": 0.32, "learning_rate": 7.98567022621501e-06, "loss": 0.9763, "step": 13687 }, { "epoch": 0.32, "learning_rate": 7.98536896235495e-06, "loss": 0.9589, "step": 13688 }, { "epoch": 0.32, "learning_rate": 7.985067681651642e-06, "loss": 0.8438, "step": 13689 }, { "epoch": 0.32, "learning_rate": 7.984766384106784e-06, "loss": 0.9009, "step": 13690 }, { "epoch": 0.32, "learning_rate": 7.984465069722078e-06, "loss": 0.8227, "step": 13691 }, { "epoch": 0.32, "learning_rate": 7.984163738499224e-06, "loss": 0.9544, "step": 13692 }, { "epoch": 0.32, "learning_rate": 7.983862390439921e-06, "loss": 0.9761, "step": 13693 }, { "epoch": 0.32, "learning_rate": 7.983561025545867e-06, "loss": 0.8175, "step": 13694 }, { "epoch": 0.32, "learning_rate": 7.983259643818765e-06, "loss": 0.968, "step": 13695 }, { "epoch": 0.32, "learning_rate": 7.982958245260317e-06, "loss": 1.2195, "step": 13696 }, { "epoch": 0.32, "learning_rate": 7.982656829872221e-06, "loss": 0.7476, "step": 13697 }, { "epoch": 0.32, "learning_rate": 7.982355397656177e-06, "loss": 0.9869, "step": 13698 }, { "epoch": 0.32, "learning_rate": 7.982053948613888e-06, "loss": 0.8712, "step": 13699 }, { "epoch": 0.32, "learning_rate": 7.981752482747054e-06, "loss": 1.0487, "step": 13700 }, { "epoch": 0.32, "learning_rate": 7.981451000057374e-06, "loss": 0.754, "step": 13701 }, { "epoch": 0.32, "learning_rate": 7.98114950054655e-06, "loss": 0.9994, "step": 13702 }, { "epoch": 0.32, "learning_rate": 7.980847984216283e-06, "loss": 0.8856, "step": 13703 }, { "epoch": 0.32, "learning_rate": 7.980546451068277e-06, "loss": 0.9515, "step": 13704 }, { "epoch": 0.32, "learning_rate": 7.980244901104228e-06, "loss": 0.8405, "step": 13705 }, { "epoch": 0.32, "learning_rate": 7.979943334325841e-06, "loss": 0.6577, "step": 13706 }, { "epoch": 0.32, "learning_rate": 7.979641750734814e-06, "loss": 0.847, "step": 13707 }, { "epoch": 0.32, "learning_rate": 7.979340150332854e-06, "loss": 0.9894, "step": 13708 }, { "epoch": 0.32, "learning_rate": 7.97903853312166e-06, "loss": 1.0444, "step": 13709 }, { "epoch": 0.32, "learning_rate": 7.97873689910293e-06, "loss": 0.8744, "step": 13710 }, { "epoch": 0.32, "learning_rate": 7.978435248278371e-06, "loss": 0.9373, "step": 13711 }, { "epoch": 0.32, "learning_rate": 7.978133580649684e-06, "loss": 0.8754, "step": 13712 }, { "epoch": 0.32, "learning_rate": 7.977831896218568e-06, "loss": 0.9801, "step": 13713 }, { "epoch": 0.32, "learning_rate": 7.977530194986728e-06, "loss": 1.035, "step": 13714 }, { "epoch": 0.32, "learning_rate": 7.977228476955866e-06, "loss": 1.0234, "step": 13715 }, { "epoch": 0.32, "learning_rate": 7.976926742127682e-06, "loss": 1.1301, "step": 13716 }, { "epoch": 0.32, "learning_rate": 7.976624990503879e-06, "loss": 0.8898, "step": 13717 }, { "epoch": 0.32, "learning_rate": 7.976323222086162e-06, "loss": 0.8912, "step": 13718 }, { "epoch": 0.32, "learning_rate": 7.976021436876232e-06, "loss": 0.9097, "step": 13719 }, { "epoch": 0.32, "learning_rate": 7.97571963487579e-06, "loss": 1.0377, "step": 13720 }, { "epoch": 0.32, "learning_rate": 7.97541781608654e-06, "loss": 0.9782, "step": 13721 }, { "epoch": 0.32, "learning_rate": 7.975115980510187e-06, "loss": 0.928, "step": 13722 }, { "epoch": 0.32, "learning_rate": 7.974814128148431e-06, "loss": 0.9143, "step": 13723 }, { "epoch": 0.32, "learning_rate": 7.974512259002976e-06, "loss": 1.1209, "step": 13724 }, { "epoch": 0.32, "learning_rate": 7.974210373075524e-06, "loss": 0.9301, "step": 13725 }, { "epoch": 0.32, "learning_rate": 7.973908470367782e-06, "loss": 0.7215, "step": 13726 }, { "epoch": 0.32, "learning_rate": 7.97360655088145e-06, "loss": 1.1151, "step": 13727 }, { "epoch": 0.32, "learning_rate": 7.97330461461823e-06, "loss": 0.9049, "step": 13728 }, { "epoch": 0.32, "learning_rate": 7.973002661579829e-06, "loss": 0.8195, "step": 13729 }, { "epoch": 0.32, "learning_rate": 7.97270069176795e-06, "loss": 0.8579, "step": 13730 }, { "epoch": 0.32, "learning_rate": 7.972398705184295e-06, "loss": 0.7153, "step": 13731 }, { "epoch": 0.32, "learning_rate": 7.972096701830568e-06, "loss": 0.9041, "step": 13732 }, { "epoch": 0.32, "learning_rate": 7.971794681708475e-06, "loss": 1.1417, "step": 13733 }, { "epoch": 0.32, "learning_rate": 7.971492644819718e-06, "loss": 1.0285, "step": 13734 }, { "epoch": 0.32, "learning_rate": 7.971190591166e-06, "loss": 1.0726, "step": 13735 }, { "epoch": 0.32, "learning_rate": 7.97088852074903e-06, "loss": 0.904, "step": 13736 }, { "epoch": 0.32, "learning_rate": 7.970586433570507e-06, "loss": 1.081, "step": 13737 }, { "epoch": 0.32, "learning_rate": 7.970284329632138e-06, "loss": 1.0429, "step": 13738 }, { "epoch": 0.32, "learning_rate": 7.969982208935627e-06, "loss": 1.0385, "step": 13739 }, { "epoch": 0.32, "learning_rate": 7.969680071482677e-06, "loss": 1.1289, "step": 13740 }, { "epoch": 0.32, "learning_rate": 7.969377917274997e-06, "loss": 1.0497, "step": 13741 }, { "epoch": 0.32, "learning_rate": 7.969075746314285e-06, "loss": 1.0106, "step": 13742 }, { "epoch": 0.32, "learning_rate": 7.968773558602252e-06, "loss": 0.962, "step": 13743 }, { "epoch": 0.32, "learning_rate": 7.968471354140598e-06, "loss": 0.9901, "step": 13744 }, { "epoch": 0.32, "learning_rate": 7.968169132931035e-06, "loss": 0.989, "step": 13745 }, { "epoch": 0.32, "learning_rate": 7.96786689497526e-06, "loss": 1.0573, "step": 13746 }, { "epoch": 0.32, "learning_rate": 7.967564640274983e-06, "loss": 0.8745, "step": 13747 }, { "epoch": 0.32, "learning_rate": 7.96726236883191e-06, "loss": 0.8676, "step": 13748 }, { "epoch": 0.32, "learning_rate": 7.96696008064774e-06, "loss": 0.7413, "step": 13749 }, { "epoch": 0.32, "learning_rate": 7.966657775724186e-06, "loss": 0.8596, "step": 13750 }, { "epoch": 0.32, "learning_rate": 7.96635545406295e-06, "loss": 0.7777, "step": 13751 }, { "epoch": 0.32, "learning_rate": 7.96605311566574e-06, "loss": 0.975, "step": 13752 }, { "epoch": 0.32, "learning_rate": 7.965750760534259e-06, "loss": 1.1386, "step": 13753 }, { "epoch": 0.32, "learning_rate": 7.965448388670214e-06, "loss": 0.9919, "step": 13754 }, { "epoch": 0.32, "learning_rate": 7.96514600007531e-06, "loss": 1.0586, "step": 13755 }, { "epoch": 0.32, "learning_rate": 7.964843594751255e-06, "loss": 0.6717, "step": 13756 }, { "epoch": 0.32, "learning_rate": 7.964541172699752e-06, "loss": 0.9514, "step": 13757 }, { "epoch": 0.32, "learning_rate": 7.964238733922512e-06, "loss": 0.7914, "step": 13758 }, { "epoch": 0.32, "learning_rate": 7.963936278421238e-06, "loss": 0.8971, "step": 13759 }, { "epoch": 0.32, "learning_rate": 7.963633806197638e-06, "loss": 1.1504, "step": 13760 }, { "epoch": 0.32, "learning_rate": 7.963331317253416e-06, "loss": 1.123, "step": 13761 }, { "epoch": 0.32, "learning_rate": 7.963028811590278e-06, "loss": 1.0095, "step": 13762 }, { "epoch": 0.32, "learning_rate": 7.962726289209937e-06, "loss": 0.8227, "step": 13763 }, { "epoch": 0.32, "learning_rate": 7.962423750114094e-06, "loss": 1.1977, "step": 13764 }, { "epoch": 0.32, "learning_rate": 7.96212119430446e-06, "loss": 0.8212, "step": 13765 }, { "epoch": 0.32, "learning_rate": 7.961818621782737e-06, "loss": 0.896, "step": 13766 }, { "epoch": 0.32, "learning_rate": 7.961516032550636e-06, "loss": 0.8693, "step": 13767 }, { "epoch": 0.32, "learning_rate": 7.961213426609863e-06, "loss": 0.7899, "step": 13768 }, { "epoch": 0.32, "learning_rate": 7.960910803962126e-06, "loss": 1.0989, "step": 13769 }, { "epoch": 0.32, "learning_rate": 7.960608164609129e-06, "loss": 0.4331, "step": 13770 }, { "epoch": 0.32, "learning_rate": 7.960305508552584e-06, "loss": 0.9947, "step": 13771 }, { "epoch": 0.32, "learning_rate": 7.960002835794198e-06, "loss": 0.9358, "step": 13772 }, { "epoch": 0.32, "learning_rate": 7.959700146335675e-06, "loss": 0.747, "step": 13773 }, { "epoch": 0.32, "learning_rate": 7.959397440178725e-06, "loss": 1.1484, "step": 13774 }, { "epoch": 0.32, "learning_rate": 7.959094717325057e-06, "loss": 1.1998, "step": 13775 }, { "epoch": 0.32, "learning_rate": 7.958791977776377e-06, "loss": 0.9473, "step": 13776 }, { "epoch": 0.32, "learning_rate": 7.958489221534396e-06, "loss": 1.068, "step": 13777 }, { "epoch": 0.32, "learning_rate": 7.958186448600817e-06, "loss": 0.9915, "step": 13778 }, { "epoch": 0.32, "learning_rate": 7.957883658977353e-06, "loss": 1.0927, "step": 13779 }, { "epoch": 0.32, "learning_rate": 7.957580852665711e-06, "loss": 0.7824, "step": 13780 }, { "epoch": 0.32, "learning_rate": 7.957278029667599e-06, "loss": 1.0557, "step": 13781 }, { "epoch": 0.32, "learning_rate": 7.956975189984727e-06, "loss": 1.0966, "step": 13782 }, { "epoch": 0.32, "learning_rate": 7.956672333618798e-06, "loss": 0.8572, "step": 13783 }, { "epoch": 0.32, "learning_rate": 7.956369460571527e-06, "loss": 1.0332, "step": 13784 }, { "epoch": 0.32, "learning_rate": 7.956066570844621e-06, "loss": 0.9647, "step": 13785 }, { "epoch": 0.32, "learning_rate": 7.955763664439788e-06, "loss": 1.2353, "step": 13786 }, { "epoch": 0.32, "learning_rate": 7.955460741358737e-06, "loss": 0.735, "step": 13787 }, { "epoch": 0.32, "learning_rate": 7.955157801603177e-06, "loss": 0.9253, "step": 13788 }, { "epoch": 0.32, "learning_rate": 7.95485484517482e-06, "loss": 0.6832, "step": 13789 }, { "epoch": 0.32, "learning_rate": 7.95455187207537e-06, "loss": 0.7691, "step": 13790 }, { "epoch": 0.32, "learning_rate": 7.954248882306542e-06, "loss": 0.9621, "step": 13791 }, { "epoch": 0.32, "learning_rate": 7.953945875870042e-06, "loss": 1.0091, "step": 13792 }, { "epoch": 0.32, "learning_rate": 7.95364285276758e-06, "loss": 0.9236, "step": 13793 }, { "epoch": 0.32, "learning_rate": 7.953339813000867e-06, "loss": 0.8772, "step": 13794 }, { "epoch": 0.32, "learning_rate": 7.95303675657161e-06, "loss": 1.0071, "step": 13795 }, { "epoch": 0.32, "learning_rate": 7.952733683481522e-06, "loss": 1.0005, "step": 13796 }, { "epoch": 0.32, "learning_rate": 7.95243059373231e-06, "loss": 0.8491, "step": 13797 }, { "epoch": 0.32, "learning_rate": 7.952127487325685e-06, "loss": 0.991, "step": 13798 }, { "epoch": 0.32, "learning_rate": 7.95182436426336e-06, "loss": 0.999, "step": 13799 }, { "epoch": 0.32, "learning_rate": 7.951521224547041e-06, "loss": 1.026, "step": 13800 }, { "epoch": 0.32, "learning_rate": 7.95121806817844e-06, "loss": 0.786, "step": 13801 }, { "epoch": 0.32, "learning_rate": 7.950914895159268e-06, "loss": 1.032, "step": 13802 }, { "epoch": 0.32, "learning_rate": 7.950611705491233e-06, "loss": 0.997, "step": 13803 }, { "epoch": 0.32, "learning_rate": 7.95030849917605e-06, "loss": 1.1152, "step": 13804 }, { "epoch": 0.32, "learning_rate": 7.950005276215425e-06, "loss": 0.7631, "step": 13805 }, { "epoch": 0.32, "learning_rate": 7.949702036611071e-06, "loss": 0.995, "step": 13806 }, { "epoch": 0.32, "learning_rate": 7.949398780364702e-06, "loss": 0.8762, "step": 13807 }, { "epoch": 0.32, "learning_rate": 7.949095507478021e-06, "loss": 0.9601, "step": 13808 }, { "epoch": 0.32, "learning_rate": 7.948792217952747e-06, "loss": 0.8629, "step": 13809 }, { "epoch": 0.32, "learning_rate": 7.948488911790587e-06, "loss": 0.9158, "step": 13810 }, { "epoch": 0.32, "learning_rate": 7.948185588993254e-06, "loss": 0.8759, "step": 13811 }, { "epoch": 0.32, "learning_rate": 7.947882249562457e-06, "loss": 0.9263, "step": 13812 }, { "epoch": 0.32, "learning_rate": 7.947578893499909e-06, "loss": 0.7585, "step": 13813 }, { "epoch": 0.32, "learning_rate": 7.947275520807323e-06, "loss": 1.2353, "step": 13814 }, { "epoch": 0.32, "learning_rate": 7.946972131486407e-06, "loss": 0.7428, "step": 13815 }, { "epoch": 0.32, "learning_rate": 7.946668725538875e-06, "loss": 1.0566, "step": 13816 }, { "epoch": 0.32, "learning_rate": 7.94636530296644e-06, "loss": 0.7508, "step": 13817 }, { "epoch": 0.32, "learning_rate": 7.946061863770811e-06, "loss": 1.046, "step": 13818 }, { "epoch": 0.32, "learning_rate": 7.945758407953701e-06, "loss": 1.2735, "step": 13819 }, { "epoch": 0.32, "learning_rate": 7.945454935516822e-06, "loss": 0.8226, "step": 13820 }, { "epoch": 0.32, "learning_rate": 7.945151446461889e-06, "loss": 1.0493, "step": 13821 }, { "epoch": 0.32, "learning_rate": 7.944847940790612e-06, "loss": 1.0742, "step": 13822 }, { "epoch": 0.32, "learning_rate": 7.9445444185047e-06, "loss": 0.837, "step": 13823 }, { "epoch": 0.32, "learning_rate": 7.94424087960587e-06, "loss": 0.9192, "step": 13824 }, { "epoch": 0.32, "learning_rate": 7.943937324095836e-06, "loss": 1.1649, "step": 13825 }, { "epoch": 0.32, "learning_rate": 7.943633751976304e-06, "loss": 0.8639, "step": 13826 }, { "epoch": 0.32, "learning_rate": 7.943330163248993e-06, "loss": 0.8508, "step": 13827 }, { "epoch": 0.32, "learning_rate": 7.943026557915613e-06, "loss": 0.9304, "step": 13828 }, { "epoch": 0.32, "learning_rate": 7.942722935977878e-06, "loss": 0.9673, "step": 13829 }, { "epoch": 0.32, "learning_rate": 7.942419297437499e-06, "loss": 0.7604, "step": 13830 }, { "epoch": 0.32, "learning_rate": 7.942115642296189e-06, "loss": 0.808, "step": 13831 }, { "epoch": 0.32, "learning_rate": 7.941811970555666e-06, "loss": 0.9347, "step": 13832 }, { "epoch": 0.32, "learning_rate": 7.941508282217638e-06, "loss": 0.8839, "step": 13833 }, { "epoch": 0.32, "learning_rate": 7.941204577283822e-06, "loss": 1.0567, "step": 13834 }, { "epoch": 0.32, "learning_rate": 7.940900855755927e-06, "loss": 1.2086, "step": 13835 }, { "epoch": 0.32, "learning_rate": 7.940597117635671e-06, "loss": 0.9401, "step": 13836 }, { "epoch": 0.32, "learning_rate": 7.940293362924766e-06, "loss": 0.8885, "step": 13837 }, { "epoch": 0.32, "learning_rate": 7.939989591624926e-06, "loss": 0.8514, "step": 13838 }, { "epoch": 0.32, "learning_rate": 7.939685803737865e-06, "loss": 1.0898, "step": 13839 }, { "epoch": 0.32, "learning_rate": 7.939381999265297e-06, "loss": 0.899, "step": 13840 }, { "epoch": 0.32, "learning_rate": 7.939078178208934e-06, "loss": 0.8897, "step": 13841 }, { "epoch": 0.32, "learning_rate": 7.938774340570493e-06, "loss": 0.7925, "step": 13842 }, { "epoch": 0.32, "learning_rate": 7.938470486351687e-06, "loss": 0.8166, "step": 13843 }, { "epoch": 0.32, "learning_rate": 7.93816661555423e-06, "loss": 0.8823, "step": 13844 }, { "epoch": 0.32, "learning_rate": 7.937862728179837e-06, "loss": 0.9436, "step": 13845 }, { "epoch": 0.32, "learning_rate": 7.937558824230222e-06, "loss": 0.9987, "step": 13846 }, { "epoch": 0.32, "learning_rate": 7.9372549037071e-06, "loss": 0.9666, "step": 13847 }, { "epoch": 0.32, "learning_rate": 7.936950966612187e-06, "loss": 1.1559, "step": 13848 }, { "epoch": 0.32, "learning_rate": 7.936647012947197e-06, "loss": 1.0021, "step": 13849 }, { "epoch": 0.32, "learning_rate": 7.93634304271384e-06, "loss": 1.0625, "step": 13850 }, { "epoch": 0.32, "learning_rate": 7.93603905591384e-06, "loss": 0.9483, "step": 13851 }, { "epoch": 0.32, "learning_rate": 7.935735052548906e-06, "loss": 0.943, "step": 13852 }, { "epoch": 0.32, "learning_rate": 7.935431032620753e-06, "loss": 0.7548, "step": 13853 }, { "epoch": 0.32, "learning_rate": 7.935126996131098e-06, "loss": 1.1815, "step": 13854 }, { "epoch": 0.32, "learning_rate": 7.934822943081656e-06, "loss": 1.0552, "step": 13855 }, { "epoch": 0.32, "learning_rate": 7.934518873474144e-06, "loss": 0.8496, "step": 13856 }, { "epoch": 0.32, "learning_rate": 7.934214787310276e-06, "loss": 0.7849, "step": 13857 }, { "epoch": 0.32, "learning_rate": 7.933910684591768e-06, "loss": 0.9697, "step": 13858 }, { "epoch": 0.32, "learning_rate": 7.933606565320332e-06, "loss": 1.0598, "step": 13859 }, { "epoch": 0.32, "learning_rate": 7.933302429497691e-06, "loss": 0.9598, "step": 13860 }, { "epoch": 0.32, "learning_rate": 7.932998277125558e-06, "loss": 1.1011, "step": 13861 }, { "epoch": 0.32, "learning_rate": 7.932694108205645e-06, "loss": 1.1381, "step": 13862 }, { "epoch": 0.32, "learning_rate": 7.932389922739673e-06, "loss": 1.0738, "step": 13863 }, { "epoch": 0.32, "learning_rate": 7.932085720729356e-06, "loss": 1.1539, "step": 13864 }, { "epoch": 0.32, "learning_rate": 7.931781502176412e-06, "loss": 1.0946, "step": 13865 }, { "epoch": 0.32, "learning_rate": 7.931477267082555e-06, "loss": 0.952, "step": 13866 }, { "epoch": 0.32, "learning_rate": 7.931173015449504e-06, "loss": 0.9984, "step": 13867 }, { "epoch": 0.32, "learning_rate": 7.930868747278973e-06, "loss": 1.187, "step": 13868 }, { "epoch": 0.32, "learning_rate": 7.93056446257268e-06, "loss": 0.9266, "step": 13869 }, { "epoch": 0.32, "learning_rate": 7.930260161332341e-06, "loss": 1.0246, "step": 13870 }, { "epoch": 0.32, "learning_rate": 7.929955843559676e-06, "loss": 1.0892, "step": 13871 }, { "epoch": 0.32, "learning_rate": 7.929651509256397e-06, "loss": 0.9256, "step": 13872 }, { "epoch": 0.32, "learning_rate": 7.929347158424224e-06, "loss": 0.8361, "step": 13873 }, { "epoch": 0.32, "learning_rate": 7.929042791064874e-06, "loss": 0.7632, "step": 13874 }, { "epoch": 0.32, "learning_rate": 7.928738407180062e-06, "loss": 0.8857, "step": 13875 }, { "epoch": 0.32, "learning_rate": 7.92843400677151e-06, "loss": 0.9395, "step": 13876 }, { "epoch": 0.32, "learning_rate": 7.92812958984093e-06, "loss": 0.8162, "step": 13877 }, { "epoch": 0.32, "learning_rate": 7.927825156390043e-06, "loss": 0.9485, "step": 13878 }, { "epoch": 0.32, "learning_rate": 7.927520706420567e-06, "loss": 1.0187, "step": 13879 }, { "epoch": 0.32, "learning_rate": 7.927216239934217e-06, "loss": 0.912, "step": 13880 }, { "epoch": 0.32, "learning_rate": 7.926911756932711e-06, "loss": 0.9376, "step": 13881 }, { "epoch": 0.32, "learning_rate": 7.926607257417769e-06, "loss": 0.7661, "step": 13882 }, { "epoch": 0.32, "learning_rate": 7.92630274139111e-06, "loss": 0.8699, "step": 13883 }, { "epoch": 0.32, "learning_rate": 7.925998208854446e-06, "loss": 0.6732, "step": 13884 }, { "epoch": 0.32, "learning_rate": 7.925693659809501e-06, "loss": 1.21, "step": 13885 }, { "epoch": 0.32, "learning_rate": 7.925389094257993e-06, "loss": 0.874, "step": 13886 }, { "epoch": 0.32, "learning_rate": 7.925084512201636e-06, "loss": 0.9795, "step": 13887 }, { "epoch": 0.32, "learning_rate": 7.924779913642153e-06, "loss": 0.9192, "step": 13888 }, { "epoch": 0.32, "learning_rate": 7.92447529858126e-06, "loss": 1.0313, "step": 13889 }, { "epoch": 0.32, "learning_rate": 7.924170667020676e-06, "loss": 0.8475, "step": 13890 }, { "epoch": 0.32, "learning_rate": 7.92386601896212e-06, "loss": 0.7685, "step": 13891 }, { "epoch": 0.32, "learning_rate": 7.923561354407313e-06, "loss": 0.7441, "step": 13892 }, { "epoch": 0.32, "learning_rate": 7.923256673357968e-06, "loss": 1.0617, "step": 13893 }, { "epoch": 0.32, "learning_rate": 7.92295197581581e-06, "loss": 0.9433, "step": 13894 }, { "epoch": 0.32, "learning_rate": 7.922647261782557e-06, "loss": 0.9991, "step": 13895 }, { "epoch": 0.32, "learning_rate": 7.922342531259924e-06, "loss": 1.0608, "step": 13896 }, { "epoch": 0.32, "learning_rate": 7.922037784249635e-06, "loss": 0.9071, "step": 13897 }, { "epoch": 0.32, "learning_rate": 7.921733020753408e-06, "loss": 0.9039, "step": 13898 }, { "epoch": 0.32, "learning_rate": 7.921428240772959e-06, "loss": 1.1575, "step": 13899 }, { "epoch": 0.32, "learning_rate": 7.921123444310015e-06, "loss": 0.873, "step": 13900 }, { "epoch": 0.32, "learning_rate": 7.920818631366287e-06, "loss": 0.9099, "step": 13901 }, { "epoch": 0.32, "learning_rate": 7.920513801943502e-06, "loss": 0.9913, "step": 13902 }, { "epoch": 0.32, "learning_rate": 7.920208956043376e-06, "loss": 1.0707, "step": 13903 }, { "epoch": 0.32, "learning_rate": 7.919904093667629e-06, "loss": 1.0166, "step": 13904 }, { "epoch": 0.32, "learning_rate": 7.91959921481798e-06, "loss": 0.9251, "step": 13905 }, { "epoch": 0.32, "learning_rate": 7.919294319496155e-06, "loss": 0.9772, "step": 13906 }, { "epoch": 0.32, "learning_rate": 7.918989407703868e-06, "loss": 0.8367, "step": 13907 }, { "epoch": 0.32, "learning_rate": 7.918684479442841e-06, "loss": 0.9542, "step": 13908 }, { "epoch": 0.32, "learning_rate": 7.918379534714796e-06, "loss": 0.5359, "step": 13909 }, { "epoch": 0.32, "learning_rate": 7.91807457352145e-06, "loss": 0.8124, "step": 13910 }, { "epoch": 0.32, "learning_rate": 7.917769595864526e-06, "loss": 0.9873, "step": 13911 }, { "epoch": 0.32, "learning_rate": 7.917464601745746e-06, "loss": 0.9243, "step": 13912 }, { "epoch": 0.32, "learning_rate": 7.917159591166827e-06, "loss": 0.663, "step": 13913 }, { "epoch": 0.32, "learning_rate": 7.916854564129496e-06, "loss": 0.7677, "step": 13914 }, { "epoch": 0.32, "learning_rate": 7.916549520635466e-06, "loss": 0.9008, "step": 13915 }, { "epoch": 0.32, "learning_rate": 7.916244460686462e-06, "loss": 0.7908, "step": 13916 }, { "epoch": 0.32, "learning_rate": 7.915939384284208e-06, "loss": 0.9254, "step": 13917 }, { "epoch": 0.32, "learning_rate": 7.91563429143042e-06, "loss": 0.862, "step": 13918 }, { "epoch": 0.32, "learning_rate": 7.915329182126823e-06, "loss": 1.1511, "step": 13919 }, { "epoch": 0.32, "learning_rate": 7.915024056375137e-06, "loss": 0.897, "step": 13920 }, { "epoch": 0.32, "learning_rate": 7.914718914177081e-06, "loss": 1.1995, "step": 13921 }, { "epoch": 0.32, "learning_rate": 7.914413755534382e-06, "loss": 0.964, "step": 13922 }, { "epoch": 0.32, "learning_rate": 7.914108580448758e-06, "loss": 0.9287, "step": 13923 }, { "epoch": 0.32, "learning_rate": 7.913803388921932e-06, "loss": 0.8287, "step": 13924 }, { "epoch": 0.32, "learning_rate": 7.913498180955625e-06, "loss": 0.9316, "step": 13925 }, { "epoch": 0.32, "learning_rate": 7.91319295655156e-06, "loss": 0.9495, "step": 13926 }, { "epoch": 0.32, "learning_rate": 7.912887715711459e-06, "loss": 0.8546, "step": 13927 }, { "epoch": 0.32, "learning_rate": 7.912582458437042e-06, "loss": 1.2001, "step": 13928 }, { "epoch": 0.32, "learning_rate": 7.912277184730035e-06, "loss": 0.8415, "step": 13929 }, { "epoch": 0.32, "learning_rate": 7.911971894592157e-06, "loss": 0.9942, "step": 13930 }, { "epoch": 0.32, "learning_rate": 7.91166658802513e-06, "loss": 0.8113, "step": 13931 }, { "epoch": 0.32, "learning_rate": 7.91136126503068e-06, "loss": 1.0129, "step": 13932 }, { "epoch": 0.32, "learning_rate": 7.911055925610527e-06, "loss": 1.0921, "step": 13933 }, { "epoch": 0.32, "learning_rate": 7.910750569766394e-06, "loss": 0.9152, "step": 13934 }, { "epoch": 0.32, "learning_rate": 7.910445197500007e-06, "loss": 0.8714, "step": 13935 }, { "epoch": 0.32, "learning_rate": 7.910139808813083e-06, "loss": 1.0796, "step": 13936 }, { "epoch": 0.32, "learning_rate": 7.909834403707351e-06, "loss": 0.7638, "step": 13937 }, { "epoch": 0.32, "learning_rate": 7.90952898218453e-06, "loss": 1.1068, "step": 13938 }, { "epoch": 0.32, "learning_rate": 7.909223544246343e-06, "loss": 0.7096, "step": 13939 }, { "epoch": 0.32, "learning_rate": 7.908918089894515e-06, "loss": 1.0903, "step": 13940 }, { "epoch": 0.32, "learning_rate": 7.90861261913077e-06, "loss": 1.035, "step": 13941 }, { "epoch": 0.32, "learning_rate": 7.908307131956831e-06, "loss": 0.9362, "step": 13942 }, { "epoch": 0.32, "learning_rate": 7.90800162837442e-06, "loss": 0.9876, "step": 13943 }, { "epoch": 0.32, "learning_rate": 7.907696108385261e-06, "loss": 0.9998, "step": 13944 }, { "epoch": 0.32, "learning_rate": 7.907390571991079e-06, "loss": 0.9796, "step": 13945 }, { "epoch": 0.32, "learning_rate": 7.907085019193597e-06, "loss": 1.1605, "step": 13946 }, { "epoch": 0.32, "learning_rate": 7.90677944999454e-06, "loss": 0.7039, "step": 13947 }, { "epoch": 0.32, "learning_rate": 7.90647386439563e-06, "loss": 1.0205, "step": 13948 }, { "epoch": 0.32, "learning_rate": 7.906168262398594e-06, "loss": 0.7982, "step": 13949 }, { "epoch": 0.32, "learning_rate": 7.905862644005151e-06, "loss": 1.0254, "step": 13950 }, { "epoch": 0.32, "learning_rate": 7.905557009217031e-06, "loss": 0.7584, "step": 13951 }, { "epoch": 0.32, "learning_rate": 7.905251358035958e-06, "loss": 0.9652, "step": 13952 }, { "epoch": 0.32, "learning_rate": 7.90494569046365e-06, "loss": 0.8382, "step": 13953 }, { "epoch": 0.32, "learning_rate": 7.904640006501838e-06, "loss": 0.8678, "step": 13954 }, { "epoch": 0.32, "learning_rate": 7.904334306152244e-06, "loss": 1.0043, "step": 13955 }, { "epoch": 0.32, "learning_rate": 7.904028589416595e-06, "loss": 0.9354, "step": 13956 }, { "epoch": 0.32, "learning_rate": 7.903722856296613e-06, "loss": 1.0099, "step": 13957 }, { "epoch": 0.32, "learning_rate": 7.903417106794025e-06, "loss": 0.8884, "step": 13958 }, { "epoch": 0.32, "learning_rate": 7.903111340910553e-06, "loss": 1.2931, "step": 13959 }, { "epoch": 0.32, "learning_rate": 7.902805558647928e-06, "loss": 1.106, "step": 13960 }, { "epoch": 0.32, "learning_rate": 7.902499760007867e-06, "loss": 0.9407, "step": 13961 }, { "epoch": 0.32, "learning_rate": 7.902193944992104e-06, "loss": 1.0963, "step": 13962 }, { "epoch": 0.32, "learning_rate": 7.901888113602357e-06, "loss": 0.9114, "step": 13963 }, { "epoch": 0.32, "learning_rate": 7.901582265840357e-06, "loss": 0.837, "step": 13964 }, { "epoch": 0.32, "learning_rate": 7.901276401707826e-06, "loss": 1.2056, "step": 13965 }, { "epoch": 0.32, "learning_rate": 7.90097052120649e-06, "loss": 0.7317, "step": 13966 }, { "epoch": 0.32, "learning_rate": 7.900664624338077e-06, "loss": 0.8594, "step": 13967 }, { "epoch": 0.32, "learning_rate": 7.900358711104312e-06, "loss": 0.8456, "step": 13968 }, { "epoch": 0.32, "learning_rate": 7.90005278150692e-06, "loss": 1.062, "step": 13969 }, { "epoch": 0.32, "learning_rate": 7.899746835547625e-06, "loss": 1.1451, "step": 13970 }, { "epoch": 0.32, "learning_rate": 7.89944087322816e-06, "loss": 0.9967, "step": 13971 }, { "epoch": 0.32, "learning_rate": 7.899134894550244e-06, "loss": 1.0548, "step": 13972 }, { "epoch": 0.32, "learning_rate": 7.898828899515606e-06, "loss": 0.9802, "step": 13973 }, { "epoch": 0.32, "learning_rate": 7.898522888125974e-06, "loss": 0.8797, "step": 13974 }, { "epoch": 0.32, "learning_rate": 7.898216860383073e-06, "loss": 1.2709, "step": 13975 }, { "epoch": 0.32, "learning_rate": 7.897910816288628e-06, "loss": 0.9843, "step": 13976 }, { "epoch": 0.32, "learning_rate": 7.897604755844368e-06, "loss": 1.0373, "step": 13977 }, { "epoch": 0.32, "learning_rate": 7.897298679052019e-06, "loss": 0.6946, "step": 13978 }, { "epoch": 0.32, "learning_rate": 7.896992585913309e-06, "loss": 0.9823, "step": 13979 }, { "epoch": 0.32, "learning_rate": 7.896686476429963e-06, "loss": 0.9555, "step": 13980 }, { "epoch": 0.32, "learning_rate": 7.896380350603708e-06, "loss": 0.8824, "step": 13981 }, { "epoch": 0.32, "learning_rate": 7.896074208436273e-06, "loss": 1.0698, "step": 13982 }, { "epoch": 0.32, "learning_rate": 7.895768049929384e-06, "loss": 0.7847, "step": 13983 }, { "epoch": 0.32, "learning_rate": 7.895461875084768e-06, "loss": 0.9217, "step": 13984 }, { "epoch": 0.32, "learning_rate": 7.895155683904155e-06, "loss": 1.0955, "step": 13985 }, { "epoch": 0.32, "learning_rate": 7.89484947638927e-06, "loss": 0.6493, "step": 13986 }, { "epoch": 0.32, "learning_rate": 7.89454325254184e-06, "loss": 1.0705, "step": 13987 }, { "epoch": 0.32, "learning_rate": 7.894237012363595e-06, "loss": 0.961, "step": 13988 }, { "epoch": 0.32, "learning_rate": 7.89393075585626e-06, "loss": 0.9597, "step": 13989 }, { "epoch": 0.32, "learning_rate": 7.893624483021567e-06, "loss": 0.8215, "step": 13990 }, { "epoch": 0.32, "learning_rate": 7.893318193861239e-06, "loss": 0.937, "step": 13991 }, { "epoch": 0.32, "learning_rate": 7.893011888377009e-06, "loss": 0.9647, "step": 13992 }, { "epoch": 0.32, "learning_rate": 7.892705566570601e-06, "loss": 1.2319, "step": 13993 }, { "epoch": 0.32, "learning_rate": 7.892399228443746e-06, "loss": 1.1916, "step": 13994 }, { "epoch": 0.32, "learning_rate": 7.89209287399817e-06, "loss": 0.8692, "step": 13995 }, { "epoch": 0.32, "learning_rate": 7.891786503235604e-06, "loss": 0.8756, "step": 13996 }, { "epoch": 0.32, "learning_rate": 7.891480116157774e-06, "loss": 1.0477, "step": 13997 }, { "epoch": 0.32, "learning_rate": 7.891173712766412e-06, "loss": 0.883, "step": 13998 }, { "epoch": 0.32, "learning_rate": 7.890867293063243e-06, "loss": 1.0109, "step": 13999 }, { "epoch": 0.32, "learning_rate": 7.890560857049995e-06, "loss": 0.8627, "step": 14000 }, { "epoch": 0.32, "learning_rate": 7.890254404728404e-06, "loss": 1.0551, "step": 14001 }, { "epoch": 0.32, "learning_rate": 7.88994793610019e-06, "loss": 1.0295, "step": 14002 }, { "epoch": 0.32, "learning_rate": 7.889641451167089e-06, "loss": 1.096, "step": 14003 }, { "epoch": 0.32, "learning_rate": 7.889334949930827e-06, "loss": 0.9509, "step": 14004 }, { "epoch": 0.32, "learning_rate": 7.889028432393133e-06, "loss": 0.8915, "step": 14005 }, { "epoch": 0.32, "learning_rate": 7.888721898555739e-06, "loss": 0.8409, "step": 14006 }, { "epoch": 0.32, "learning_rate": 7.88841534842037e-06, "loss": 0.957, "step": 14007 }, { "epoch": 0.32, "learning_rate": 7.88810878198876e-06, "loss": 0.9314, "step": 14008 }, { "epoch": 0.32, "learning_rate": 7.887802199262635e-06, "loss": 0.725, "step": 14009 }, { "epoch": 0.32, "learning_rate": 7.887495600243728e-06, "loss": 1.1266, "step": 14010 }, { "epoch": 0.32, "learning_rate": 7.887188984933767e-06, "loss": 1.0522, "step": 14011 }, { "epoch": 0.32, "learning_rate": 7.886882353334481e-06, "loss": 1.1008, "step": 14012 }, { "epoch": 0.32, "learning_rate": 7.886575705447604e-06, "loss": 0.9209, "step": 14013 }, { "epoch": 0.33, "learning_rate": 7.886269041274858e-06, "loss": 1.0257, "step": 14014 }, { "epoch": 0.33, "learning_rate": 7.885962360817983e-06, "loss": 0.773, "step": 14015 }, { "epoch": 0.33, "learning_rate": 7.885655664078704e-06, "loss": 1.0773, "step": 14016 }, { "epoch": 0.33, "learning_rate": 7.88534895105875e-06, "loss": 0.9885, "step": 14017 }, { "epoch": 0.33, "learning_rate": 7.885042221759856e-06, "loss": 1.0121, "step": 14018 }, { "epoch": 0.33, "learning_rate": 7.884735476183747e-06, "loss": 1.1542, "step": 14019 }, { "epoch": 0.33, "learning_rate": 7.88442871433216e-06, "loss": 0.7751, "step": 14020 }, { "epoch": 0.33, "learning_rate": 7.88412193620682e-06, "loss": 0.7459, "step": 14021 }, { "epoch": 0.33, "learning_rate": 7.883815141809462e-06, "loss": 1.0219, "step": 14022 }, { "epoch": 0.33, "learning_rate": 7.883508331141813e-06, "loss": 0.8476, "step": 14023 }, { "epoch": 0.33, "learning_rate": 7.883201504205607e-06, "loss": 1.1483, "step": 14024 }, { "epoch": 0.33, "learning_rate": 7.882894661002575e-06, "loss": 0.7164, "step": 14025 }, { "epoch": 0.33, "learning_rate": 7.882587801534446e-06, "loss": 0.9544, "step": 14026 }, { "epoch": 0.33, "learning_rate": 7.882280925802953e-06, "loss": 0.8986, "step": 14027 }, { "epoch": 0.33, "learning_rate": 7.881974033809829e-06, "loss": 0.7168, "step": 14028 }, { "epoch": 0.33, "learning_rate": 7.881667125556803e-06, "loss": 0.9217, "step": 14029 }, { "epoch": 0.33, "learning_rate": 7.881360201045606e-06, "loss": 0.8824, "step": 14030 }, { "epoch": 0.33, "learning_rate": 7.881053260277971e-06, "loss": 0.9537, "step": 14031 }, { "epoch": 0.33, "learning_rate": 7.880746303255628e-06, "loss": 0.8542, "step": 14032 }, { "epoch": 0.33, "learning_rate": 7.880439329980313e-06, "loss": 0.8427, "step": 14033 }, { "epoch": 0.33, "learning_rate": 7.880132340453753e-06, "loss": 0.8885, "step": 14034 }, { "epoch": 0.33, "learning_rate": 7.879825334677685e-06, "loss": 0.7202, "step": 14035 }, { "epoch": 0.33, "learning_rate": 7.879518312653836e-06, "loss": 0.8454, "step": 14036 }, { "epoch": 0.33, "learning_rate": 7.87921127438394e-06, "loss": 0.9011, "step": 14037 }, { "epoch": 0.33, "learning_rate": 7.878904219869732e-06, "loss": 0.8947, "step": 14038 }, { "epoch": 0.33, "learning_rate": 7.878597149112942e-06, "loss": 0.9324, "step": 14039 }, { "epoch": 0.33, "learning_rate": 7.878290062115301e-06, "loss": 0.9872, "step": 14040 }, { "epoch": 0.33, "learning_rate": 7.877982958878543e-06, "loss": 0.8421, "step": 14041 }, { "epoch": 0.33, "learning_rate": 7.877675839404402e-06, "loss": 0.8133, "step": 14042 }, { "epoch": 0.33, "learning_rate": 7.877368703694611e-06, "loss": 0.8752, "step": 14043 }, { "epoch": 0.33, "learning_rate": 7.8770615517509e-06, "loss": 0.7355, "step": 14044 }, { "epoch": 0.33, "learning_rate": 7.876754383575002e-06, "loss": 0.7852, "step": 14045 }, { "epoch": 0.33, "learning_rate": 7.876447199168654e-06, "loss": 0.9366, "step": 14046 }, { "epoch": 0.33, "learning_rate": 7.876139998533584e-06, "loss": 0.8926, "step": 14047 }, { "epoch": 0.33, "learning_rate": 7.87583278167153e-06, "loss": 0.9465, "step": 14048 }, { "epoch": 0.33, "learning_rate": 7.875525548584223e-06, "loss": 0.7713, "step": 14049 }, { "epoch": 0.33, "learning_rate": 7.875218299273398e-06, "loss": 1.0084, "step": 14050 }, { "epoch": 0.33, "learning_rate": 7.874911033740783e-06, "loss": 0.9949, "step": 14051 }, { "epoch": 0.33, "learning_rate": 7.874603751988116e-06, "loss": 0.7546, "step": 14052 }, { "epoch": 0.33, "learning_rate": 7.874296454017133e-06, "loss": 0.9343, "step": 14053 }, { "epoch": 0.33, "learning_rate": 7.873989139829564e-06, "loss": 0.9543, "step": 14054 }, { "epoch": 0.33, "learning_rate": 7.873681809427143e-06, "loss": 1.1888, "step": 14055 }, { "epoch": 0.33, "learning_rate": 7.873374462811605e-06, "loss": 0.9231, "step": 14056 }, { "epoch": 0.33, "learning_rate": 7.873067099984683e-06, "loss": 0.9889, "step": 14057 }, { "epoch": 0.33, "learning_rate": 7.872759720948112e-06, "loss": 0.9179, "step": 14058 }, { "epoch": 0.33, "learning_rate": 7.872452325703626e-06, "loss": 0.9453, "step": 14059 }, { "epoch": 0.33, "learning_rate": 7.872144914252961e-06, "loss": 0.8936, "step": 14060 }, { "epoch": 0.33, "learning_rate": 7.871837486597849e-06, "loss": 0.9474, "step": 14061 }, { "epoch": 0.33, "learning_rate": 7.871530042740025e-06, "loss": 0.9007, "step": 14062 }, { "epoch": 0.33, "learning_rate": 7.871222582681222e-06, "loss": 1.2141, "step": 14063 }, { "epoch": 0.33, "learning_rate": 7.870915106423178e-06, "loss": 1.0554, "step": 14064 }, { "epoch": 0.33, "learning_rate": 7.870607613967628e-06, "loss": 0.947, "step": 14065 }, { "epoch": 0.33, "learning_rate": 7.870300105316304e-06, "loss": 0.8726, "step": 14066 }, { "epoch": 0.33, "learning_rate": 7.86999258047094e-06, "loss": 1.1558, "step": 14067 }, { "epoch": 0.33, "learning_rate": 7.869685039433274e-06, "loss": 0.7648, "step": 14068 }, { "epoch": 0.33, "learning_rate": 7.869377482205042e-06, "loss": 1.0504, "step": 14069 }, { "epoch": 0.33, "learning_rate": 7.869069908787976e-06, "loss": 0.9333, "step": 14070 }, { "epoch": 0.33, "learning_rate": 7.868762319183813e-06, "loss": 0.9093, "step": 14071 }, { "epoch": 0.33, "learning_rate": 7.86845471339429e-06, "loss": 0.5959, "step": 14072 }, { "epoch": 0.33, "learning_rate": 7.868147091421137e-06, "loss": 0.7905, "step": 14073 }, { "epoch": 0.33, "learning_rate": 7.867839453266095e-06, "loss": 0.8946, "step": 14074 }, { "epoch": 0.33, "learning_rate": 7.867531798930899e-06, "loss": 0.8345, "step": 14075 }, { "epoch": 0.33, "learning_rate": 7.867224128417282e-06, "loss": 0.9463, "step": 14076 }, { "epoch": 0.33, "learning_rate": 7.866916441726982e-06, "loss": 0.7749, "step": 14077 }, { "epoch": 0.33, "learning_rate": 7.866608738861734e-06, "loss": 0.8966, "step": 14078 }, { "epoch": 0.33, "learning_rate": 7.866301019823275e-06, "loss": 0.744, "step": 14079 }, { "epoch": 0.33, "learning_rate": 7.86599328461334e-06, "loss": 0.7643, "step": 14080 }, { "epoch": 0.33, "learning_rate": 7.865685533233665e-06, "loss": 0.6995, "step": 14081 }, { "epoch": 0.33, "learning_rate": 7.86537776568599e-06, "loss": 1.034, "step": 14082 }, { "epoch": 0.33, "learning_rate": 7.865069981972047e-06, "loss": 1.1687, "step": 14083 }, { "epoch": 0.33, "learning_rate": 7.864762182093573e-06, "loss": 0.7444, "step": 14084 }, { "epoch": 0.33, "learning_rate": 7.864454366052308e-06, "loss": 1.0996, "step": 14085 }, { "epoch": 0.33, "learning_rate": 7.864146533849985e-06, "loss": 1.1414, "step": 14086 }, { "epoch": 0.33, "learning_rate": 7.863838685488341e-06, "loss": 0.9926, "step": 14087 }, { "epoch": 0.33, "learning_rate": 7.863530820969116e-06, "loss": 0.9602, "step": 14088 }, { "epoch": 0.33, "learning_rate": 7.863222940294044e-06, "loss": 0.964, "step": 14089 }, { "epoch": 0.33, "learning_rate": 7.862915043464862e-06, "loss": 0.9343, "step": 14090 }, { "epoch": 0.33, "learning_rate": 7.862607130483309e-06, "loss": 1.0552, "step": 14091 }, { "epoch": 0.33, "learning_rate": 7.86229920135112e-06, "loss": 0.9599, "step": 14092 }, { "epoch": 0.33, "learning_rate": 7.861991256070036e-06, "loss": 0.7121, "step": 14093 }, { "epoch": 0.33, "learning_rate": 7.861683294641791e-06, "loss": 0.7701, "step": 14094 }, { "epoch": 0.33, "learning_rate": 7.861375317068123e-06, "loss": 1.4179, "step": 14095 }, { "epoch": 0.33, "learning_rate": 7.86106732335077e-06, "loss": 0.8978, "step": 14096 }, { "epoch": 0.33, "learning_rate": 7.86075931349147e-06, "loss": 0.8266, "step": 14097 }, { "epoch": 0.33, "learning_rate": 7.860451287491962e-06, "loss": 0.9582, "step": 14098 }, { "epoch": 0.33, "learning_rate": 7.860143245353981e-06, "loss": 1.0894, "step": 14099 }, { "epoch": 0.33, "learning_rate": 7.859835187079266e-06, "loss": 0.6447, "step": 14100 }, { "epoch": 0.33, "learning_rate": 7.859527112669557e-06, "loss": 0.7968, "step": 14101 }, { "epoch": 0.33, "learning_rate": 7.859219022126589e-06, "loss": 1.2604, "step": 14102 }, { "epoch": 0.33, "learning_rate": 7.858910915452102e-06, "loss": 0.9953, "step": 14103 }, { "epoch": 0.33, "learning_rate": 7.858602792647833e-06, "loss": 1.1284, "step": 14104 }, { "epoch": 0.33, "learning_rate": 7.858294653715523e-06, "loss": 1.0434, "step": 14105 }, { "epoch": 0.33, "learning_rate": 7.857986498656909e-06, "loss": 0.9624, "step": 14106 }, { "epoch": 0.33, "learning_rate": 7.85767832747373e-06, "loss": 0.8415, "step": 14107 }, { "epoch": 0.33, "learning_rate": 7.857370140167722e-06, "loss": 1.0838, "step": 14108 }, { "epoch": 0.33, "learning_rate": 7.85706193674063e-06, "loss": 1.0259, "step": 14109 }, { "epoch": 0.33, "learning_rate": 7.856753717194186e-06, "loss": 0.7856, "step": 14110 }, { "epoch": 0.33, "learning_rate": 7.85644548153013e-06, "loss": 0.9129, "step": 14111 }, { "epoch": 0.33, "learning_rate": 7.856137229750206e-06, "loss": 0.8199, "step": 14112 }, { "epoch": 0.33, "learning_rate": 7.85582896185615e-06, "loss": 0.9984, "step": 14113 }, { "epoch": 0.33, "learning_rate": 7.8555206778497e-06, "loss": 0.8356, "step": 14114 }, { "epoch": 0.33, "learning_rate": 7.855212377732598e-06, "loss": 0.9608, "step": 14115 }, { "epoch": 0.33, "learning_rate": 7.85490406150658e-06, "loss": 1.1671, "step": 14116 }, { "epoch": 0.33, "learning_rate": 7.854595729173389e-06, "loss": 0.8694, "step": 14117 }, { "epoch": 0.33, "learning_rate": 7.854287380734762e-06, "loss": 0.8361, "step": 14118 }, { "epoch": 0.33, "learning_rate": 7.853979016192441e-06, "loss": 1.0755, "step": 14119 }, { "epoch": 0.33, "learning_rate": 7.853670635548163e-06, "loss": 0.83, "step": 14120 }, { "epoch": 0.33, "learning_rate": 7.85336223880367e-06, "loss": 0.9529, "step": 14121 }, { "epoch": 0.33, "learning_rate": 7.853053825960701e-06, "loss": 0.851, "step": 14122 }, { "epoch": 0.33, "learning_rate": 7.852745397020998e-06, "loss": 0.9572, "step": 14123 }, { "epoch": 0.33, "learning_rate": 7.852436951986297e-06, "loss": 0.8623, "step": 14124 }, { "epoch": 0.33, "learning_rate": 7.852128490858345e-06, "loss": 0.8869, "step": 14125 }, { "epoch": 0.33, "learning_rate": 7.851820013638873e-06, "loss": 0.8846, "step": 14126 }, { "epoch": 0.33, "learning_rate": 7.851511520329628e-06, "loss": 1.0352, "step": 14127 }, { "epoch": 0.33, "learning_rate": 7.851203010932351e-06, "loss": 0.9409, "step": 14128 }, { "epoch": 0.33, "learning_rate": 7.850894485448778e-06, "loss": 1.0472, "step": 14129 }, { "epoch": 0.33, "learning_rate": 7.850585943880656e-06, "loss": 0.9416, "step": 14130 }, { "epoch": 0.33, "learning_rate": 7.85027738622972e-06, "loss": 1.1586, "step": 14131 }, { "epoch": 0.33, "learning_rate": 7.84996881249771e-06, "loss": 0.8437, "step": 14132 }, { "epoch": 0.33, "learning_rate": 7.849660222686372e-06, "loss": 1.1551, "step": 14133 }, { "epoch": 0.33, "learning_rate": 7.849351616797446e-06, "loss": 1.145, "step": 14134 }, { "epoch": 0.33, "learning_rate": 7.84904299483267e-06, "loss": 0.9759, "step": 14135 }, { "epoch": 0.33, "learning_rate": 7.848734356793789e-06, "loss": 0.9557, "step": 14136 }, { "epoch": 0.33, "learning_rate": 7.84842570268254e-06, "loss": 1.3554, "step": 14137 }, { "epoch": 0.33, "learning_rate": 7.84811703250067e-06, "loss": 0.7138, "step": 14138 }, { "epoch": 0.33, "learning_rate": 7.847808346249916e-06, "loss": 1.067, "step": 14139 }, { "epoch": 0.33, "learning_rate": 7.847499643932022e-06, "loss": 0.975, "step": 14140 }, { "epoch": 0.33, "learning_rate": 7.847190925548727e-06, "loss": 1.01, "step": 14141 }, { "epoch": 0.33, "learning_rate": 7.846882191101775e-06, "loss": 1.0946, "step": 14142 }, { "epoch": 0.33, "learning_rate": 7.846573440592907e-06, "loss": 0.9151, "step": 14143 }, { "epoch": 0.33, "learning_rate": 7.846264674023867e-06, "loss": 0.9281, "step": 14144 }, { "epoch": 0.33, "learning_rate": 7.845955891396394e-06, "loss": 1.01, "step": 14145 }, { "epoch": 0.33, "learning_rate": 7.845647092712232e-06, "loss": 0.9376, "step": 14146 }, { "epoch": 0.33, "learning_rate": 7.845338277973121e-06, "loss": 0.7756, "step": 14147 }, { "epoch": 0.33, "learning_rate": 7.845029447180807e-06, "loss": 0.8623, "step": 14148 }, { "epoch": 0.33, "learning_rate": 7.84472060033703e-06, "loss": 0.9326, "step": 14149 }, { "epoch": 0.33, "learning_rate": 7.84441173744353e-06, "loss": 0.9927, "step": 14150 }, { "epoch": 0.33, "learning_rate": 7.844102858502057e-06, "loss": 1.0409, "step": 14151 }, { "epoch": 0.33, "learning_rate": 7.843793963514347e-06, "loss": 0.8808, "step": 14152 }, { "epoch": 0.33, "learning_rate": 7.843485052482145e-06, "loss": 0.8732, "step": 14153 }, { "epoch": 0.33, "learning_rate": 7.843176125407194e-06, "loss": 1.0649, "step": 14154 }, { "epoch": 0.33, "learning_rate": 7.842867182291237e-06, "loss": 1.0555, "step": 14155 }, { "epoch": 0.33, "learning_rate": 7.842558223136016e-06, "loss": 0.7565, "step": 14156 }, { "epoch": 0.33, "learning_rate": 7.842249247943274e-06, "loss": 1.2233, "step": 14157 }, { "epoch": 0.33, "learning_rate": 7.841940256714757e-06, "loss": 1.3012, "step": 14158 }, { "epoch": 0.33, "learning_rate": 7.841631249452205e-06, "loss": 0.928, "step": 14159 }, { "epoch": 0.33, "learning_rate": 7.841322226157362e-06, "loss": 1.1343, "step": 14160 }, { "epoch": 0.33, "learning_rate": 7.841013186831975e-06, "loss": 1.0238, "step": 14161 }, { "epoch": 0.33, "learning_rate": 7.840704131477782e-06, "loss": 0.8559, "step": 14162 }, { "epoch": 0.33, "learning_rate": 7.840395060096534e-06, "loss": 1.0294, "step": 14163 }, { "epoch": 0.33, "learning_rate": 7.840085972689965e-06, "loss": 0.7809, "step": 14164 }, { "epoch": 0.33, "learning_rate": 7.839776869259825e-06, "loss": 0.81, "step": 14165 }, { "epoch": 0.33, "learning_rate": 7.83946774980786e-06, "loss": 0.892, "step": 14166 }, { "epoch": 0.33, "learning_rate": 7.839158614335808e-06, "loss": 0.6877, "step": 14167 }, { "epoch": 0.33, "learning_rate": 7.838849462845419e-06, "loss": 1.556, "step": 14168 }, { "epoch": 0.33, "learning_rate": 7.838540295338433e-06, "loss": 0.9911, "step": 14169 }, { "epoch": 0.33, "learning_rate": 7.838231111816596e-06, "loss": 0.9676, "step": 14170 }, { "epoch": 0.33, "learning_rate": 7.837921912281653e-06, "loss": 0.8775, "step": 14171 }, { "epoch": 0.33, "learning_rate": 7.837612696735345e-06, "loss": 1.1578, "step": 14172 }, { "epoch": 0.33, "learning_rate": 7.83730346517942e-06, "loss": 1.2571, "step": 14173 }, { "epoch": 0.33, "learning_rate": 7.836994217615624e-06, "loss": 0.8663, "step": 14174 }, { "epoch": 0.33, "learning_rate": 7.836684954045698e-06, "loss": 1.0553, "step": 14175 }, { "epoch": 0.33, "learning_rate": 7.836375674471389e-06, "loss": 1.0237, "step": 14176 }, { "epoch": 0.33, "learning_rate": 7.83606637889444e-06, "loss": 1.1061, "step": 14177 }, { "epoch": 0.33, "learning_rate": 7.835757067316598e-06, "loss": 0.9394, "step": 14178 }, { "epoch": 0.33, "learning_rate": 7.835447739739607e-06, "loss": 0.8219, "step": 14179 }, { "epoch": 0.33, "learning_rate": 7.835138396165217e-06, "loss": 0.98, "step": 14180 }, { "epoch": 0.33, "learning_rate": 7.834829036595163e-06, "loss": 0.851, "step": 14181 }, { "epoch": 0.33, "learning_rate": 7.8345196610312e-06, "loss": 0.9198, "step": 14182 }, { "epoch": 0.33, "learning_rate": 7.83421026947507e-06, "loss": 0.9721, "step": 14183 }, { "epoch": 0.33, "learning_rate": 7.833900861928516e-06, "loss": 1.131, "step": 14184 }, { "epoch": 0.33, "learning_rate": 7.833591438393287e-06, "loss": 0.9296, "step": 14185 }, { "epoch": 0.33, "learning_rate": 7.833281998871128e-06, "loss": 0.7949, "step": 14186 }, { "epoch": 0.33, "learning_rate": 7.832972543363787e-06, "loss": 1.1221, "step": 14187 }, { "epoch": 0.33, "learning_rate": 7.832663071873003e-06, "loss": 1.0342, "step": 14188 }, { "epoch": 0.33, "learning_rate": 7.83235358440053e-06, "loss": 0.8962, "step": 14189 }, { "epoch": 0.33, "learning_rate": 7.83204408094811e-06, "loss": 0.9465, "step": 14190 }, { "epoch": 0.33, "learning_rate": 7.83173456151749e-06, "loss": 0.6793, "step": 14191 }, { "epoch": 0.33, "learning_rate": 7.831425026110417e-06, "loss": 1.0334, "step": 14192 }, { "epoch": 0.33, "learning_rate": 7.831115474728636e-06, "loss": 0.639, "step": 14193 }, { "epoch": 0.33, "learning_rate": 7.830805907373892e-06, "loss": 1.0002, "step": 14194 }, { "epoch": 0.33, "learning_rate": 7.830496324047936e-06, "loss": 1.0455, "step": 14195 }, { "epoch": 0.33, "learning_rate": 7.830186724752511e-06, "loss": 0.8744, "step": 14196 }, { "epoch": 0.33, "learning_rate": 7.829877109489366e-06, "loss": 1.0928, "step": 14197 }, { "epoch": 0.33, "learning_rate": 7.829567478260247e-06, "loss": 1.2672, "step": 14198 }, { "epoch": 0.33, "learning_rate": 7.8292578310669e-06, "loss": 1.2071, "step": 14199 }, { "epoch": 0.33, "learning_rate": 7.828948167911073e-06, "loss": 1.1607, "step": 14200 }, { "epoch": 0.33, "learning_rate": 7.828638488794513e-06, "loss": 0.6838, "step": 14201 }, { "epoch": 0.33, "learning_rate": 7.828328793718966e-06, "loss": 0.7956, "step": 14202 }, { "epoch": 0.33, "learning_rate": 7.828019082686183e-06, "loss": 0.7259, "step": 14203 }, { "epoch": 0.33, "learning_rate": 7.827709355697906e-06, "loss": 0.82, "step": 14204 }, { "epoch": 0.33, "learning_rate": 7.827399612755887e-06, "loss": 1.1551, "step": 14205 }, { "epoch": 0.33, "learning_rate": 7.82708985386187e-06, "loss": 1.2388, "step": 14206 }, { "epoch": 0.33, "learning_rate": 7.826780079017604e-06, "loss": 0.7816, "step": 14207 }, { "epoch": 0.33, "learning_rate": 7.826470288224839e-06, "loss": 0.9945, "step": 14208 }, { "epoch": 0.33, "learning_rate": 7.826160481485322e-06, "loss": 0.9441, "step": 14209 }, { "epoch": 0.33, "learning_rate": 7.825850658800797e-06, "loss": 0.7042, "step": 14210 }, { "epoch": 0.33, "learning_rate": 7.825540820173015e-06, "loss": 1.3093, "step": 14211 }, { "epoch": 0.33, "learning_rate": 7.825230965603726e-06, "loss": 1.0189, "step": 14212 }, { "epoch": 0.33, "learning_rate": 7.824921095094672e-06, "loss": 0.7564, "step": 14213 }, { "epoch": 0.33, "learning_rate": 7.82461120864761e-06, "loss": 0.9821, "step": 14214 }, { "epoch": 0.33, "learning_rate": 7.824301306264281e-06, "loss": 0.9138, "step": 14215 }, { "epoch": 0.33, "learning_rate": 7.823991387946437e-06, "loss": 0.847, "step": 14216 }, { "epoch": 0.33, "learning_rate": 7.823681453695826e-06, "loss": 0.7236, "step": 14217 }, { "epoch": 0.33, "learning_rate": 7.823371503514195e-06, "loss": 0.8481, "step": 14218 }, { "epoch": 0.33, "learning_rate": 7.823061537403295e-06, "loss": 1.0922, "step": 14219 }, { "epoch": 0.33, "learning_rate": 7.822751555364873e-06, "loss": 1.0743, "step": 14220 }, { "epoch": 0.33, "learning_rate": 7.82244155740068e-06, "loss": 0.6205, "step": 14221 }, { "epoch": 0.33, "learning_rate": 7.822131543512464e-06, "loss": 0.8221, "step": 14222 }, { "epoch": 0.33, "learning_rate": 7.821821513701973e-06, "loss": 0.7667, "step": 14223 }, { "epoch": 0.33, "learning_rate": 7.821511467970956e-06, "loss": 0.8669, "step": 14224 }, { "epoch": 0.33, "learning_rate": 7.821201406321164e-06, "loss": 0.8235, "step": 14225 }, { "epoch": 0.33, "learning_rate": 7.820891328754345e-06, "loss": 0.912, "step": 14226 }, { "epoch": 0.33, "learning_rate": 7.820581235272252e-06, "loss": 0.8601, "step": 14227 }, { "epoch": 0.33, "learning_rate": 7.820271125876629e-06, "loss": 1.1073, "step": 14228 }, { "epoch": 0.33, "learning_rate": 7.819961000569228e-06, "loss": 0.8934, "step": 14229 }, { "epoch": 0.33, "learning_rate": 7.819650859351799e-06, "loss": 0.7497, "step": 14230 }, { "epoch": 0.33, "learning_rate": 7.819340702226091e-06, "loss": 0.7253, "step": 14231 }, { "epoch": 0.33, "learning_rate": 7.819030529193855e-06, "loss": 0.8685, "step": 14232 }, { "epoch": 0.33, "learning_rate": 7.818720340256843e-06, "loss": 0.8139, "step": 14233 }, { "epoch": 0.33, "learning_rate": 7.818410135416799e-06, "loss": 0.9008, "step": 14234 }, { "epoch": 0.33, "learning_rate": 7.818099914675478e-06, "loss": 0.7193, "step": 14235 }, { "epoch": 0.33, "learning_rate": 7.81778967803463e-06, "loss": 0.9927, "step": 14236 }, { "epoch": 0.33, "learning_rate": 7.817479425496003e-06, "loss": 0.9649, "step": 14237 }, { "epoch": 0.33, "learning_rate": 7.817169157061349e-06, "loss": 0.8665, "step": 14238 }, { "epoch": 0.33, "learning_rate": 7.816858872732418e-06, "loss": 1.0685, "step": 14239 }, { "epoch": 0.33, "learning_rate": 7.816548572510962e-06, "loss": 1.1099, "step": 14240 }, { "epoch": 0.33, "learning_rate": 7.816238256398729e-06, "loss": 1.3486, "step": 14241 }, { "epoch": 0.33, "learning_rate": 7.815927924397474e-06, "loss": 1.2291, "step": 14242 }, { "epoch": 0.33, "learning_rate": 7.815617576508942e-06, "loss": 1.1934, "step": 14243 }, { "epoch": 0.33, "learning_rate": 7.815307212734888e-06, "loss": 0.6856, "step": 14244 }, { "epoch": 0.33, "learning_rate": 7.814996833077063e-06, "loss": 0.8282, "step": 14245 }, { "epoch": 0.33, "learning_rate": 7.814686437537215e-06, "loss": 1.0666, "step": 14246 }, { "epoch": 0.33, "learning_rate": 7.8143760261171e-06, "loss": 1.3692, "step": 14247 }, { "epoch": 0.33, "learning_rate": 7.814065598818468e-06, "loss": 0.8919, "step": 14248 }, { "epoch": 0.33, "learning_rate": 7.813755155643068e-06, "loss": 0.9039, "step": 14249 }, { "epoch": 0.33, "learning_rate": 7.813444696592651e-06, "loss": 1.0996, "step": 14250 }, { "epoch": 0.33, "learning_rate": 7.813134221668972e-06, "loss": 0.9173, "step": 14251 }, { "epoch": 0.33, "learning_rate": 7.812823730873782e-06, "loss": 1.1814, "step": 14252 }, { "epoch": 0.33, "learning_rate": 7.81251322420883e-06, "loss": 0.8166, "step": 14253 }, { "epoch": 0.33, "learning_rate": 7.812202701675871e-06, "loss": 1.2525, "step": 14254 }, { "epoch": 0.33, "learning_rate": 7.811892163276655e-06, "loss": 1.0292, "step": 14255 }, { "epoch": 0.33, "learning_rate": 7.811581609012935e-06, "loss": 1.0117, "step": 14256 }, { "epoch": 0.33, "learning_rate": 7.811271038886463e-06, "loss": 0.9267, "step": 14257 }, { "epoch": 0.33, "learning_rate": 7.81096045289899e-06, "loss": 0.6763, "step": 14258 }, { "epoch": 0.33, "learning_rate": 7.810649851052273e-06, "loss": 1.1498, "step": 14259 }, { "epoch": 0.33, "learning_rate": 7.810339233348055e-06, "loss": 0.8616, "step": 14260 }, { "epoch": 0.33, "learning_rate": 7.810028599788097e-06, "loss": 1.1403, "step": 14261 }, { "epoch": 0.33, "learning_rate": 7.809717950374149e-06, "loss": 0.9441, "step": 14262 }, { "epoch": 0.33, "learning_rate": 7.809407285107964e-06, "loss": 0.8958, "step": 14263 }, { "epoch": 0.33, "learning_rate": 7.809096603991294e-06, "loss": 1.166, "step": 14264 }, { "epoch": 0.33, "learning_rate": 7.808785907025892e-06, "loss": 0.8726, "step": 14265 }, { "epoch": 0.33, "learning_rate": 7.80847519421351e-06, "loss": 1.1175, "step": 14266 }, { "epoch": 0.33, "learning_rate": 7.8081644655559e-06, "loss": 1.4279, "step": 14267 }, { "epoch": 0.33, "learning_rate": 7.80785372105482e-06, "loss": 0.7716, "step": 14268 }, { "epoch": 0.33, "learning_rate": 7.80754296071202e-06, "loss": 0.911, "step": 14269 }, { "epoch": 0.33, "learning_rate": 7.807232184529254e-06, "loss": 0.9263, "step": 14270 }, { "epoch": 0.33, "learning_rate": 7.806921392508275e-06, "loss": 0.8824, "step": 14271 }, { "epoch": 0.33, "learning_rate": 7.806610584650834e-06, "loss": 0.9893, "step": 14272 }, { "epoch": 0.33, "learning_rate": 7.806299760958688e-06, "loss": 0.7607, "step": 14273 }, { "epoch": 0.33, "learning_rate": 7.805988921433592e-06, "loss": 0.9109, "step": 14274 }, { "epoch": 0.33, "learning_rate": 7.805678066077296e-06, "loss": 1.1042, "step": 14275 }, { "epoch": 0.33, "learning_rate": 7.805367194891556e-06, "loss": 0.7192, "step": 14276 }, { "epoch": 0.33, "learning_rate": 7.805056307878123e-06, "loss": 1.2074, "step": 14277 }, { "epoch": 0.33, "learning_rate": 7.804745405038755e-06, "loss": 0.8542, "step": 14278 }, { "epoch": 0.33, "learning_rate": 7.804434486375203e-06, "loss": 0.8081, "step": 14279 }, { "epoch": 0.33, "learning_rate": 7.804123551889221e-06, "loss": 1.2442, "step": 14280 }, { "epoch": 0.33, "learning_rate": 7.803812601582568e-06, "loss": 1.1907, "step": 14281 }, { "epoch": 0.33, "learning_rate": 7.803501635456992e-06, "loss": 1.0899, "step": 14282 }, { "epoch": 0.33, "learning_rate": 7.803190653514251e-06, "loss": 1.0781, "step": 14283 }, { "epoch": 0.33, "learning_rate": 7.802879655756101e-06, "loss": 1.1014, "step": 14284 }, { "epoch": 0.33, "learning_rate": 7.802568642184293e-06, "loss": 0.948, "step": 14285 }, { "epoch": 0.33, "learning_rate": 7.802257612800586e-06, "loss": 0.8997, "step": 14286 }, { "epoch": 0.33, "learning_rate": 7.801946567606729e-06, "loss": 0.9827, "step": 14287 }, { "epoch": 0.33, "learning_rate": 7.80163550660448e-06, "loss": 1.0784, "step": 14288 }, { "epoch": 0.33, "learning_rate": 7.801324429795597e-06, "loss": 1.0229, "step": 14289 }, { "epoch": 0.33, "learning_rate": 7.801013337181828e-06, "loss": 0.8953, "step": 14290 }, { "epoch": 0.33, "learning_rate": 7.800702228764936e-06, "loss": 0.9282, "step": 14291 }, { "epoch": 0.33, "learning_rate": 7.80039110454667e-06, "loss": 1.2213, "step": 14292 }, { "epoch": 0.33, "learning_rate": 7.80007996452879e-06, "loss": 0.8933, "step": 14293 }, { "epoch": 0.33, "learning_rate": 7.799768808713048e-06, "loss": 1.1653, "step": 14294 }, { "epoch": 0.33, "learning_rate": 7.7994576371012e-06, "loss": 0.7704, "step": 14295 }, { "epoch": 0.33, "learning_rate": 7.799146449695005e-06, "loss": 0.8928, "step": 14296 }, { "epoch": 0.33, "learning_rate": 7.798835246496215e-06, "loss": 0.993, "step": 14297 }, { "epoch": 0.33, "learning_rate": 7.798524027506586e-06, "loss": 1.0486, "step": 14298 }, { "epoch": 0.33, "learning_rate": 7.798212792727875e-06, "loss": 0.7474, "step": 14299 }, { "epoch": 0.33, "learning_rate": 7.797901542161837e-06, "loss": 0.9195, "step": 14300 }, { "epoch": 0.33, "learning_rate": 7.797590275810232e-06, "loss": 1.1718, "step": 14301 }, { "epoch": 0.33, "learning_rate": 7.79727899367481e-06, "loss": 0.9541, "step": 14302 }, { "epoch": 0.33, "learning_rate": 7.796967695757332e-06, "loss": 0.9943, "step": 14303 }, { "epoch": 0.33, "learning_rate": 7.796656382059551e-06, "loss": 0.9516, "step": 14304 }, { "epoch": 0.33, "learning_rate": 7.796345052583224e-06, "loss": 0.9801, "step": 14305 }, { "epoch": 0.33, "learning_rate": 7.79603370733011e-06, "loss": 1.0511, "step": 14306 }, { "epoch": 0.33, "learning_rate": 7.795722346301964e-06, "loss": 1.2119, "step": 14307 }, { "epoch": 0.33, "learning_rate": 7.795410969500542e-06, "loss": 0.9327, "step": 14308 }, { "epoch": 0.33, "learning_rate": 7.795099576927603e-06, "loss": 0.7023, "step": 14309 }, { "epoch": 0.33, "learning_rate": 7.7947881685849e-06, "loss": 0.8325, "step": 14310 }, { "epoch": 0.33, "learning_rate": 7.794476744474195e-06, "loss": 0.8795, "step": 14311 }, { "epoch": 0.33, "learning_rate": 7.79416530459724e-06, "loss": 0.8744, "step": 14312 }, { "epoch": 0.33, "learning_rate": 7.793853848955797e-06, "loss": 0.8598, "step": 14313 }, { "epoch": 0.33, "learning_rate": 7.793542377551617e-06, "loss": 0.7518, "step": 14314 }, { "epoch": 0.33, "learning_rate": 7.793230890386464e-06, "loss": 1.1768, "step": 14315 }, { "epoch": 0.33, "learning_rate": 7.792919387462091e-06, "loss": 0.9509, "step": 14316 }, { "epoch": 0.33, "learning_rate": 7.792607868780257e-06, "loss": 0.8566, "step": 14317 }, { "epoch": 0.33, "learning_rate": 7.79229633434272e-06, "loss": 0.834, "step": 14318 }, { "epoch": 0.33, "learning_rate": 7.791984784151236e-06, "loss": 0.8843, "step": 14319 }, { "epoch": 0.33, "learning_rate": 7.791673218207562e-06, "loss": 0.8929, "step": 14320 }, { "epoch": 0.33, "learning_rate": 7.791361636513462e-06, "loss": 0.9966, "step": 14321 }, { "epoch": 0.33, "learning_rate": 7.791050039070686e-06, "loss": 1.0316, "step": 14322 }, { "epoch": 0.33, "learning_rate": 7.790738425880997e-06, "loss": 1.051, "step": 14323 }, { "epoch": 0.33, "learning_rate": 7.790426796946151e-06, "loss": 0.9372, "step": 14324 }, { "epoch": 0.33, "learning_rate": 7.790115152267907e-06, "loss": 0.7921, "step": 14325 }, { "epoch": 0.33, "learning_rate": 7.789803491848025e-06, "loss": 1.1938, "step": 14326 }, { "epoch": 0.33, "learning_rate": 7.789491815688259e-06, "loss": 1.0074, "step": 14327 }, { "epoch": 0.33, "learning_rate": 7.78918012379037e-06, "loss": 0.8876, "step": 14328 }, { "epoch": 0.33, "learning_rate": 7.788868416156117e-06, "loss": 0.7384, "step": 14329 }, { "epoch": 0.33, "learning_rate": 7.78855669278726e-06, "loss": 0.9779, "step": 14330 }, { "epoch": 0.33, "learning_rate": 7.788244953685554e-06, "loss": 1.0861, "step": 14331 }, { "epoch": 0.33, "learning_rate": 7.787933198852757e-06, "loss": 0.9927, "step": 14332 }, { "epoch": 0.33, "learning_rate": 7.787621428290635e-06, "loss": 1.1206, "step": 14333 }, { "epoch": 0.33, "learning_rate": 7.78730964200094e-06, "loss": 0.8244, "step": 14334 }, { "epoch": 0.33, "learning_rate": 7.786997839985435e-06, "loss": 0.8401, "step": 14335 }, { "epoch": 0.33, "learning_rate": 7.786686022245877e-06, "loss": 0.8354, "step": 14336 }, { "epoch": 0.33, "learning_rate": 7.786374188784024e-06, "loss": 1.0442, "step": 14337 }, { "epoch": 0.33, "learning_rate": 7.78606233960164e-06, "loss": 1.0259, "step": 14338 }, { "epoch": 0.33, "learning_rate": 7.785750474700482e-06, "loss": 0.6805, "step": 14339 }, { "epoch": 0.33, "learning_rate": 7.785438594082308e-06, "loss": 1.0511, "step": 14340 }, { "epoch": 0.33, "learning_rate": 7.78512669774888e-06, "loss": 0.878, "step": 14341 }, { "epoch": 0.33, "learning_rate": 7.784814785701955e-06, "loss": 0.9994, "step": 14342 }, { "epoch": 0.33, "learning_rate": 7.784502857943298e-06, "loss": 1.0334, "step": 14343 }, { "epoch": 0.33, "learning_rate": 7.784190914474661e-06, "loss": 0.9572, "step": 14344 }, { "epoch": 0.33, "learning_rate": 7.78387895529781e-06, "loss": 1.0597, "step": 14345 }, { "epoch": 0.33, "learning_rate": 7.783566980414504e-06, "loss": 1.1156, "step": 14346 }, { "epoch": 0.33, "learning_rate": 7.783254989826501e-06, "loss": 0.9456, "step": 14347 }, { "epoch": 0.33, "learning_rate": 7.782942983535564e-06, "loss": 1.1181, "step": 14348 }, { "epoch": 0.33, "learning_rate": 7.782630961543451e-06, "loss": 0.6007, "step": 14349 }, { "epoch": 0.33, "learning_rate": 7.782318923851923e-06, "loss": 1.063, "step": 14350 }, { "epoch": 0.33, "learning_rate": 7.782006870462742e-06, "loss": 0.9802, "step": 14351 }, { "epoch": 0.33, "learning_rate": 7.781694801377665e-06, "loss": 0.7984, "step": 14352 }, { "epoch": 0.33, "learning_rate": 7.78138271659846e-06, "loss": 0.9624, "step": 14353 }, { "epoch": 0.33, "learning_rate": 7.78107061612688e-06, "loss": 1.0805, "step": 14354 }, { "epoch": 0.33, "learning_rate": 7.780758499964689e-06, "loss": 1.0901, "step": 14355 }, { "epoch": 0.33, "learning_rate": 7.780446368113648e-06, "loss": 0.9578, "step": 14356 }, { "epoch": 0.33, "learning_rate": 7.780134220575518e-06, "loss": 0.8419, "step": 14357 }, { "epoch": 0.33, "learning_rate": 7.779822057352059e-06, "loss": 0.7152, "step": 14358 }, { "epoch": 0.33, "learning_rate": 7.77950987844503e-06, "loss": 0.9013, "step": 14359 }, { "epoch": 0.33, "learning_rate": 7.7791976838562e-06, "loss": 1.0893, "step": 14360 }, { "epoch": 0.33, "learning_rate": 7.778885473587324e-06, "loss": 0.9614, "step": 14361 }, { "epoch": 0.33, "learning_rate": 7.778573247640167e-06, "loss": 1.0551, "step": 14362 }, { "epoch": 0.33, "learning_rate": 7.778261006016485e-06, "loss": 0.8462, "step": 14363 }, { "epoch": 0.33, "learning_rate": 7.777948748718045e-06, "loss": 1.2204, "step": 14364 }, { "epoch": 0.33, "learning_rate": 7.777636475746609e-06, "loss": 0.9937, "step": 14365 }, { "epoch": 0.33, "learning_rate": 7.777324187103935e-06, "loss": 0.9195, "step": 14366 }, { "epoch": 0.33, "learning_rate": 7.777011882791787e-06, "loss": 1.0177, "step": 14367 }, { "epoch": 0.33, "learning_rate": 7.776699562811928e-06, "loss": 1.1569, "step": 14368 }, { "epoch": 0.33, "learning_rate": 7.776387227166119e-06, "loss": 1.1447, "step": 14369 }, { "epoch": 0.33, "learning_rate": 7.77607487585612e-06, "loss": 1.1487, "step": 14370 }, { "epoch": 0.33, "learning_rate": 7.775762508883697e-06, "loss": 1.0525, "step": 14371 }, { "epoch": 0.33, "learning_rate": 7.77545012625061e-06, "loss": 0.7793, "step": 14372 }, { "epoch": 0.33, "learning_rate": 7.775137727958623e-06, "loss": 0.8227, "step": 14373 }, { "epoch": 0.33, "learning_rate": 7.774825314009498e-06, "loss": 0.7234, "step": 14374 }, { "epoch": 0.33, "learning_rate": 7.774512884404997e-06, "loss": 0.8239, "step": 14375 }, { "epoch": 0.33, "learning_rate": 7.774200439146882e-06, "loss": 1.0328, "step": 14376 }, { "epoch": 0.33, "learning_rate": 7.773887978236917e-06, "loss": 1.0518, "step": 14377 }, { "epoch": 0.33, "learning_rate": 7.773575501676864e-06, "loss": 0.8296, "step": 14378 }, { "epoch": 0.33, "learning_rate": 7.77326300946849e-06, "loss": 1.1149, "step": 14379 }, { "epoch": 0.33, "learning_rate": 7.772950501613552e-06, "loss": 1.267, "step": 14380 }, { "epoch": 0.33, "learning_rate": 7.772637978113817e-06, "loss": 0.9095, "step": 14381 }, { "epoch": 0.33, "learning_rate": 7.772325438971046e-06, "loss": 0.9715, "step": 14382 }, { "epoch": 0.33, "learning_rate": 7.772012884187003e-06, "loss": 1.1996, "step": 14383 }, { "epoch": 0.33, "learning_rate": 7.771700313763454e-06, "loss": 1.2137, "step": 14384 }, { "epoch": 0.33, "learning_rate": 7.77138772770216e-06, "loss": 0.7479, "step": 14385 }, { "epoch": 0.33, "learning_rate": 7.771075126004883e-06, "loss": 0.8632, "step": 14386 }, { "epoch": 0.33, "learning_rate": 7.770762508673391e-06, "loss": 0.8443, "step": 14387 }, { "epoch": 0.33, "learning_rate": 7.770449875709443e-06, "loss": 0.8205, "step": 14388 }, { "epoch": 0.33, "learning_rate": 7.770137227114807e-06, "loss": 0.7959, "step": 14389 }, { "epoch": 0.33, "learning_rate": 7.769824562891244e-06, "loss": 0.8925, "step": 14390 }, { "epoch": 0.33, "learning_rate": 7.76951188304052e-06, "loss": 0.8734, "step": 14391 }, { "epoch": 0.33, "learning_rate": 7.7691991875644e-06, "loss": 1.016, "step": 14392 }, { "epoch": 0.33, "learning_rate": 7.768886476464643e-06, "loss": 0.9034, "step": 14393 }, { "epoch": 0.33, "learning_rate": 7.768573749743019e-06, "loss": 0.9036, "step": 14394 }, { "epoch": 0.33, "learning_rate": 7.76826100740129e-06, "loss": 1.1441, "step": 14395 }, { "epoch": 0.33, "learning_rate": 7.76794824944122e-06, "loss": 1.0936, "step": 14396 }, { "epoch": 0.33, "learning_rate": 7.767635475864576e-06, "loss": 0.9558, "step": 14397 }, { "epoch": 0.33, "learning_rate": 7.767322686673118e-06, "loss": 1.3143, "step": 14398 }, { "epoch": 0.33, "learning_rate": 7.767009881868617e-06, "loss": 0.9425, "step": 14399 }, { "epoch": 0.33, "learning_rate": 7.766697061452833e-06, "loss": 1.0531, "step": 14400 }, { "epoch": 0.33, "learning_rate": 7.76638422542753e-06, "loss": 0.7478, "step": 14401 }, { "epoch": 0.33, "learning_rate": 7.76607137379448e-06, "loss": 0.8114, "step": 14402 }, { "epoch": 0.33, "learning_rate": 7.765758506555438e-06, "loss": 1.1133, "step": 14403 }, { "epoch": 0.33, "learning_rate": 7.76544562371218e-06, "loss": 1.2061, "step": 14404 }, { "epoch": 0.33, "learning_rate": 7.765132725266463e-06, "loss": 1.079, "step": 14405 }, { "epoch": 0.33, "learning_rate": 7.764819811220055e-06, "loss": 0.9603, "step": 14406 }, { "epoch": 0.33, "learning_rate": 7.764506881574722e-06, "loss": 0.9285, "step": 14407 }, { "epoch": 0.33, "learning_rate": 7.76419393633223e-06, "loss": 0.9293, "step": 14408 }, { "epoch": 0.33, "learning_rate": 7.763880975494344e-06, "loss": 0.7645, "step": 14409 }, { "epoch": 0.33, "learning_rate": 7.763567999062828e-06, "loss": 1.0178, "step": 14410 }, { "epoch": 0.33, "learning_rate": 7.763255007039451e-06, "loss": 0.9709, "step": 14411 }, { "epoch": 0.33, "learning_rate": 7.762941999425977e-06, "loss": 0.8648, "step": 14412 }, { "epoch": 0.33, "learning_rate": 7.762628976224172e-06, "loss": 0.8021, "step": 14413 }, { "epoch": 0.33, "learning_rate": 7.762315937435803e-06, "loss": 0.9531, "step": 14414 }, { "epoch": 0.33, "learning_rate": 7.762002883062634e-06, "loss": 0.8014, "step": 14415 }, { "epoch": 0.33, "learning_rate": 7.761689813106432e-06, "loss": 1.0352, "step": 14416 }, { "epoch": 0.33, "learning_rate": 7.761376727568966e-06, "loss": 1.1576, "step": 14417 }, { "epoch": 0.33, "learning_rate": 7.761063626451998e-06, "loss": 0.916, "step": 14418 }, { "epoch": 0.33, "learning_rate": 7.7607505097573e-06, "loss": 0.9985, "step": 14419 }, { "epoch": 0.33, "learning_rate": 7.760437377486632e-06, "loss": 1.179, "step": 14420 }, { "epoch": 0.33, "learning_rate": 7.760124229641765e-06, "loss": 1.0513, "step": 14421 }, { "epoch": 0.33, "learning_rate": 7.759811066224465e-06, "loss": 1.0619, "step": 14422 }, { "epoch": 0.33, "learning_rate": 7.7594978872365e-06, "loss": 1.0101, "step": 14423 }, { "epoch": 0.33, "learning_rate": 7.759184692679634e-06, "loss": 1.0211, "step": 14424 }, { "epoch": 0.33, "learning_rate": 7.758871482555636e-06, "loss": 0.8981, "step": 14425 }, { "epoch": 0.33, "learning_rate": 7.758558256866274e-06, "loss": 1.0878, "step": 14426 }, { "epoch": 0.33, "learning_rate": 7.758245015613312e-06, "loss": 1.0451, "step": 14427 }, { "epoch": 0.33, "learning_rate": 7.75793175879852e-06, "loss": 0.8736, "step": 14428 }, { "epoch": 0.33, "learning_rate": 7.757618486423665e-06, "loss": 1.0059, "step": 14429 }, { "epoch": 0.33, "learning_rate": 7.757305198490514e-06, "loss": 0.9007, "step": 14430 }, { "epoch": 0.33, "learning_rate": 7.756991895000836e-06, "loss": 0.535, "step": 14431 }, { "epoch": 0.33, "learning_rate": 7.756678575956396e-06, "loss": 0.7954, "step": 14432 }, { "epoch": 0.33, "learning_rate": 7.756365241358962e-06, "loss": 0.744, "step": 14433 }, { "epoch": 0.33, "learning_rate": 7.756051891210304e-06, "loss": 1.1764, "step": 14434 }, { "epoch": 0.33, "learning_rate": 7.755738525512188e-06, "loss": 1.0331, "step": 14435 }, { "epoch": 0.33, "learning_rate": 7.755425144266384e-06, "loss": 1.0037, "step": 14436 }, { "epoch": 0.33, "learning_rate": 7.755111747474658e-06, "loss": 0.7612, "step": 14437 }, { "epoch": 0.33, "learning_rate": 7.754798335138777e-06, "loss": 0.988, "step": 14438 }, { "epoch": 0.33, "learning_rate": 7.754484907260513e-06, "loss": 0.8346, "step": 14439 }, { "epoch": 0.33, "learning_rate": 7.754171463841634e-06, "loss": 1.1024, "step": 14440 }, { "epoch": 0.33, "learning_rate": 7.753858004883904e-06, "loss": 1.1086, "step": 14441 }, { "epoch": 0.33, "learning_rate": 7.753544530389096e-06, "loss": 0.827, "step": 14442 }, { "epoch": 0.33, "learning_rate": 7.753231040358977e-06, "loss": 1.0986, "step": 14443 }, { "epoch": 0.33, "learning_rate": 7.752917534795315e-06, "loss": 0.7508, "step": 14444 }, { "epoch": 0.34, "learning_rate": 7.75260401369988e-06, "loss": 0.6967, "step": 14445 }, { "epoch": 0.34, "learning_rate": 7.752290477074441e-06, "loss": 0.883, "step": 14446 }, { "epoch": 0.34, "learning_rate": 7.751976924920765e-06, "loss": 0.8874, "step": 14447 }, { "epoch": 0.34, "learning_rate": 7.751663357240624e-06, "loss": 0.9501, "step": 14448 }, { "epoch": 0.34, "learning_rate": 7.751349774035784e-06, "loss": 0.7796, "step": 14449 }, { "epoch": 0.34, "learning_rate": 7.751036175308018e-06, "loss": 0.7285, "step": 14450 }, { "epoch": 0.34, "learning_rate": 7.75072256105909e-06, "loss": 0.7466, "step": 14451 }, { "epoch": 0.34, "learning_rate": 7.750408931290774e-06, "loss": 1.0811, "step": 14452 }, { "epoch": 0.34, "learning_rate": 7.750095286004839e-06, "loss": 0.9905, "step": 14453 }, { "epoch": 0.34, "learning_rate": 7.749781625203053e-06, "loss": 0.7973, "step": 14454 }, { "epoch": 0.34, "learning_rate": 7.749467948887184e-06, "loss": 0.8786, "step": 14455 }, { "epoch": 0.34, "learning_rate": 7.749154257059005e-06, "loss": 1.0748, "step": 14456 }, { "epoch": 0.34, "learning_rate": 7.748840549720285e-06, "loss": 1.021, "step": 14457 }, { "epoch": 0.34, "learning_rate": 7.748526826872794e-06, "loss": 0.9792, "step": 14458 }, { "epoch": 0.34, "learning_rate": 7.748213088518301e-06, "loss": 0.694, "step": 14459 }, { "epoch": 0.34, "learning_rate": 7.747899334658575e-06, "loss": 0.9368, "step": 14460 }, { "epoch": 0.34, "learning_rate": 7.74758556529539e-06, "loss": 0.8282, "step": 14461 }, { "epoch": 0.34, "learning_rate": 7.747271780430515e-06, "loss": 1.0254, "step": 14462 }, { "epoch": 0.34, "learning_rate": 7.746957980065717e-06, "loss": 0.9711, "step": 14463 }, { "epoch": 0.34, "learning_rate": 7.74664416420277e-06, "loss": 0.8908, "step": 14464 }, { "epoch": 0.34, "learning_rate": 7.746330332843444e-06, "loss": 0.8538, "step": 14465 }, { "epoch": 0.34, "learning_rate": 7.74601648598951e-06, "loss": 1.0029, "step": 14466 }, { "epoch": 0.34, "learning_rate": 7.745702623642734e-06, "loss": 0.871, "step": 14467 }, { "epoch": 0.34, "learning_rate": 7.745388745804894e-06, "loss": 1.0415, "step": 14468 }, { "epoch": 0.34, "learning_rate": 7.745074852477757e-06, "loss": 0.8491, "step": 14469 }, { "epoch": 0.34, "learning_rate": 7.744760943663094e-06, "loss": 0.777, "step": 14470 }, { "epoch": 0.34, "learning_rate": 7.744447019362675e-06, "loss": 0.783, "step": 14471 }, { "epoch": 0.34, "learning_rate": 7.744133079578276e-06, "loss": 1.0135, "step": 14472 }, { "epoch": 0.34, "learning_rate": 7.743819124311662e-06, "loss": 1.0993, "step": 14473 }, { "epoch": 0.34, "learning_rate": 7.743505153564608e-06, "loss": 1.0367, "step": 14474 }, { "epoch": 0.34, "learning_rate": 7.743191167338883e-06, "loss": 0.9529, "step": 14475 }, { "epoch": 0.34, "learning_rate": 7.742877165636262e-06, "loss": 1.1359, "step": 14476 }, { "epoch": 0.34, "learning_rate": 7.742563148458516e-06, "loss": 0.8526, "step": 14477 }, { "epoch": 0.34, "learning_rate": 7.742249115807413e-06, "loss": 0.8895, "step": 14478 }, { "epoch": 0.34, "learning_rate": 7.741935067684726e-06, "loss": 0.9469, "step": 14479 }, { "epoch": 0.34, "learning_rate": 7.741621004092231e-06, "loss": 0.9383, "step": 14480 }, { "epoch": 0.34, "learning_rate": 7.741306925031693e-06, "loss": 0.918, "step": 14481 }, { "epoch": 0.34, "learning_rate": 7.74099283050489e-06, "loss": 0.9376, "step": 14482 }, { "epoch": 0.34, "learning_rate": 7.740678720513591e-06, "loss": 1.0805, "step": 14483 }, { "epoch": 0.34, "learning_rate": 7.740364595059571e-06, "loss": 0.7673, "step": 14484 }, { "epoch": 0.34, "learning_rate": 7.7400504541446e-06, "loss": 0.6641, "step": 14485 }, { "epoch": 0.34, "learning_rate": 7.739736297770448e-06, "loss": 0.9663, "step": 14486 }, { "epoch": 0.34, "learning_rate": 7.73942212593889e-06, "loss": 0.7422, "step": 14487 }, { "epoch": 0.34, "learning_rate": 7.739107938651703e-06, "loss": 0.7116, "step": 14488 }, { "epoch": 0.34, "learning_rate": 7.738793735910653e-06, "loss": 1.1818, "step": 14489 }, { "epoch": 0.34, "learning_rate": 7.738479517717515e-06, "loss": 0.6531, "step": 14490 }, { "epoch": 0.34, "learning_rate": 7.738165284074062e-06, "loss": 0.798, "step": 14491 }, { "epoch": 0.34, "learning_rate": 7.737851034982066e-06, "loss": 0.9324, "step": 14492 }, { "epoch": 0.34, "learning_rate": 7.737536770443302e-06, "loss": 1.0077, "step": 14493 }, { "epoch": 0.34, "learning_rate": 7.73722249045954e-06, "loss": 1.1902, "step": 14494 }, { "epoch": 0.34, "learning_rate": 7.736908195032557e-06, "loss": 1.1545, "step": 14495 }, { "epoch": 0.34, "learning_rate": 7.736593884164121e-06, "loss": 1.2308, "step": 14496 }, { "epoch": 0.34, "learning_rate": 7.736279557856011e-06, "loss": 0.9849, "step": 14497 }, { "epoch": 0.34, "learning_rate": 7.735965216109997e-06, "loss": 0.9528, "step": 14498 }, { "epoch": 0.34, "learning_rate": 7.735650858927854e-06, "loss": 0.9015, "step": 14499 }, { "epoch": 0.34, "learning_rate": 7.735336486311355e-06, "loss": 0.7546, "step": 14500 }, { "epoch": 0.34, "learning_rate": 7.735022098262273e-06, "loss": 1.193, "step": 14501 }, { "epoch": 0.34, "learning_rate": 7.734707694782385e-06, "loss": 0.846, "step": 14502 }, { "epoch": 0.34, "learning_rate": 7.734393275873458e-06, "loss": 0.9965, "step": 14503 }, { "epoch": 0.34, "learning_rate": 7.734078841537271e-06, "loss": 0.5649, "step": 14504 }, { "epoch": 0.34, "learning_rate": 7.733764391775598e-06, "loss": 1.0498, "step": 14505 }, { "epoch": 0.34, "learning_rate": 7.733449926590214e-06, "loss": 1.0335, "step": 14506 }, { "epoch": 0.34, "learning_rate": 7.733135445982889e-06, "loss": 1.0544, "step": 14507 }, { "epoch": 0.34, "learning_rate": 7.7328209499554e-06, "loss": 0.935, "step": 14508 }, { "epoch": 0.34, "learning_rate": 7.732506438509522e-06, "loss": 0.7629, "step": 14509 }, { "epoch": 0.34, "learning_rate": 7.732191911647028e-06, "loss": 0.8593, "step": 14510 }, { "epoch": 0.34, "learning_rate": 7.731877369369694e-06, "loss": 1.0357, "step": 14511 }, { "epoch": 0.34, "learning_rate": 7.731562811679291e-06, "loss": 1.0643, "step": 14512 }, { "epoch": 0.34, "learning_rate": 7.731248238577598e-06, "loss": 0.9977, "step": 14513 }, { "epoch": 0.34, "learning_rate": 7.73093365006639e-06, "loss": 0.8665, "step": 14514 }, { "epoch": 0.34, "learning_rate": 7.730619046147438e-06, "loss": 0.8801, "step": 14515 }, { "epoch": 0.34, "learning_rate": 7.73030442682252e-06, "loss": 0.7782, "step": 14516 }, { "epoch": 0.34, "learning_rate": 7.729989792093412e-06, "loss": 0.9978, "step": 14517 }, { "epoch": 0.34, "learning_rate": 7.729675141961883e-06, "loss": 0.9211, "step": 14518 }, { "epoch": 0.34, "learning_rate": 7.729360476429715e-06, "loss": 1.0183, "step": 14519 }, { "epoch": 0.34, "learning_rate": 7.72904579549868e-06, "loss": 1.1548, "step": 14520 }, { "epoch": 0.34, "learning_rate": 7.728731099170554e-06, "loss": 0.8127, "step": 14521 }, { "epoch": 0.34, "learning_rate": 7.728416387447115e-06, "loss": 1.1072, "step": 14522 }, { "epoch": 0.34, "learning_rate": 7.728101660330134e-06, "loss": 0.7206, "step": 14523 }, { "epoch": 0.34, "learning_rate": 7.727786917821389e-06, "loss": 1.1421, "step": 14524 }, { "epoch": 0.34, "learning_rate": 7.727472159922658e-06, "loss": 0.9276, "step": 14525 }, { "epoch": 0.34, "learning_rate": 7.727157386635712e-06, "loss": 0.8799, "step": 14526 }, { "epoch": 0.34, "learning_rate": 7.726842597962332e-06, "loss": 1.0122, "step": 14527 }, { "epoch": 0.34, "learning_rate": 7.72652779390429e-06, "loss": 0.8628, "step": 14528 }, { "epoch": 0.34, "learning_rate": 7.726212974463364e-06, "loss": 0.7368, "step": 14529 }, { "epoch": 0.34, "learning_rate": 7.72589813964133e-06, "loss": 0.8933, "step": 14530 }, { "epoch": 0.34, "learning_rate": 7.725583289439963e-06, "loss": 0.9479, "step": 14531 }, { "epoch": 0.34, "learning_rate": 7.725268423861041e-06, "loss": 0.8046, "step": 14532 }, { "epoch": 0.34, "learning_rate": 7.72495354290634e-06, "loss": 1.1035, "step": 14533 }, { "epoch": 0.34, "learning_rate": 7.724638646577638e-06, "loss": 1.0819, "step": 14534 }, { "epoch": 0.34, "learning_rate": 7.72432373487671e-06, "loss": 1.0593, "step": 14535 }, { "epoch": 0.34, "learning_rate": 7.72400880780533e-06, "loss": 1.1638, "step": 14536 }, { "epoch": 0.34, "learning_rate": 7.723693865365279e-06, "loss": 1.1042, "step": 14537 }, { "epoch": 0.34, "learning_rate": 7.723378907558331e-06, "loss": 0.8443, "step": 14538 }, { "epoch": 0.34, "learning_rate": 7.723063934386269e-06, "loss": 1.0746, "step": 14539 }, { "epoch": 0.34, "learning_rate": 7.722748945850861e-06, "loss": 0.8908, "step": 14540 }, { "epoch": 0.34, "learning_rate": 7.722433941953891e-06, "loss": 1.3163, "step": 14541 }, { "epoch": 0.34, "learning_rate": 7.722118922697133e-06, "loss": 1.1576, "step": 14542 }, { "epoch": 0.34, "learning_rate": 7.721803888082366e-06, "loss": 1.1089, "step": 14543 }, { "epoch": 0.34, "learning_rate": 7.721488838111365e-06, "loss": 0.8867, "step": 14544 }, { "epoch": 0.34, "learning_rate": 7.721173772785911e-06, "loss": 1.1039, "step": 14545 }, { "epoch": 0.34, "learning_rate": 7.720858692107778e-06, "loss": 0.9496, "step": 14546 }, { "epoch": 0.34, "learning_rate": 7.720543596078746e-06, "loss": 1.08, "step": 14547 }, { "epoch": 0.34, "learning_rate": 7.720228484700592e-06, "loss": 1.029, "step": 14548 }, { "epoch": 0.34, "learning_rate": 7.719913357975095e-06, "loss": 1.0453, "step": 14549 }, { "epoch": 0.34, "learning_rate": 7.719598215904029e-06, "loss": 1.0481, "step": 14550 }, { "epoch": 0.34, "learning_rate": 7.719283058489178e-06, "loss": 1.1436, "step": 14551 }, { "epoch": 0.34, "learning_rate": 7.718967885732315e-06, "loss": 0.9003, "step": 14552 }, { "epoch": 0.34, "learning_rate": 7.71865269763522e-06, "loss": 1.0379, "step": 14553 }, { "epoch": 0.34, "learning_rate": 7.718337494199674e-06, "loss": 0.7891, "step": 14554 }, { "epoch": 0.34, "learning_rate": 7.71802227542745e-06, "loss": 0.7623, "step": 14555 }, { "epoch": 0.34, "learning_rate": 7.71770704132033e-06, "loss": 0.8423, "step": 14556 }, { "epoch": 0.34, "learning_rate": 7.717391791880093e-06, "loss": 0.9519, "step": 14557 }, { "epoch": 0.34, "learning_rate": 7.717076527108514e-06, "loss": 1.029, "step": 14558 }, { "epoch": 0.34, "learning_rate": 7.716761247007376e-06, "loss": 1.0094, "step": 14559 }, { "epoch": 0.34, "learning_rate": 7.716445951578456e-06, "loss": 1.0009, "step": 14560 }, { "epoch": 0.34, "learning_rate": 7.716130640823531e-06, "loss": 1.1787, "step": 14561 }, { "epoch": 0.34, "learning_rate": 7.715815314744383e-06, "loss": 1.1132, "step": 14562 }, { "epoch": 0.34, "learning_rate": 7.715499973342788e-06, "loss": 0.8789, "step": 14563 }, { "epoch": 0.34, "learning_rate": 7.715184616620529e-06, "loss": 1.0302, "step": 14564 }, { "epoch": 0.34, "learning_rate": 7.714869244579381e-06, "loss": 1.0016, "step": 14565 }, { "epoch": 0.34, "learning_rate": 7.714553857221128e-06, "loss": 0.8278, "step": 14566 }, { "epoch": 0.34, "learning_rate": 7.714238454547545e-06, "loss": 1.1204, "step": 14567 }, { "epoch": 0.34, "learning_rate": 7.713923036560414e-06, "loss": 0.9732, "step": 14568 }, { "epoch": 0.34, "learning_rate": 7.713607603261513e-06, "loss": 1.0398, "step": 14569 }, { "epoch": 0.34, "learning_rate": 7.713292154652623e-06, "loss": 1.064, "step": 14570 }, { "epoch": 0.34, "learning_rate": 7.712976690735522e-06, "loss": 0.6427, "step": 14571 }, { "epoch": 0.34, "learning_rate": 7.712661211511994e-06, "loss": 1.1574, "step": 14572 }, { "epoch": 0.34, "learning_rate": 7.712345716983814e-06, "loss": 0.9173, "step": 14573 }, { "epoch": 0.34, "learning_rate": 7.712030207152763e-06, "loss": 0.9903, "step": 14574 }, { "epoch": 0.34, "learning_rate": 7.711714682020623e-06, "loss": 1.0877, "step": 14575 }, { "epoch": 0.34, "learning_rate": 7.711399141589175e-06, "loss": 1.0673, "step": 14576 }, { "epoch": 0.34, "learning_rate": 7.711083585860196e-06, "loss": 0.6735, "step": 14577 }, { "epoch": 0.34, "learning_rate": 7.710768014835465e-06, "loss": 0.932, "step": 14578 }, { "epoch": 0.34, "learning_rate": 7.71045242851677e-06, "loss": 1.013, "step": 14579 }, { "epoch": 0.34, "learning_rate": 7.710136826905885e-06, "loss": 1.256, "step": 14580 }, { "epoch": 0.34, "learning_rate": 7.709821210004592e-06, "loss": 0.7744, "step": 14581 }, { "epoch": 0.34, "learning_rate": 7.70950557781467e-06, "loss": 1.0076, "step": 14582 }, { "epoch": 0.34, "learning_rate": 7.709189930337906e-06, "loss": 0.9767, "step": 14583 }, { "epoch": 0.34, "learning_rate": 7.708874267576074e-06, "loss": 0.9986, "step": 14584 }, { "epoch": 0.34, "learning_rate": 7.708558589530958e-06, "loss": 0.8292, "step": 14585 }, { "epoch": 0.34, "learning_rate": 7.70824289620434e-06, "loss": 1.0606, "step": 14586 }, { "epoch": 0.34, "learning_rate": 7.707927187598e-06, "loss": 0.9773, "step": 14587 }, { "epoch": 0.34, "learning_rate": 7.707611463713717e-06, "loss": 0.9055, "step": 14588 }, { "epoch": 0.34, "learning_rate": 7.707295724553273e-06, "loss": 1.301, "step": 14589 }, { "epoch": 0.34, "learning_rate": 7.706979970118453e-06, "loss": 0.6507, "step": 14590 }, { "epoch": 0.34, "learning_rate": 7.706664200411036e-06, "loss": 0.9763, "step": 14591 }, { "epoch": 0.34, "learning_rate": 7.706348415432804e-06, "loss": 0.701, "step": 14592 }, { "epoch": 0.34, "learning_rate": 7.70603261518554e-06, "loss": 0.8743, "step": 14593 }, { "epoch": 0.34, "learning_rate": 7.705716799671019e-06, "loss": 1.0731, "step": 14594 }, { "epoch": 0.34, "learning_rate": 7.705400968891031e-06, "loss": 1.2661, "step": 14595 }, { "epoch": 0.34, "learning_rate": 7.705085122847356e-06, "loss": 0.9435, "step": 14596 }, { "epoch": 0.34, "learning_rate": 7.704769261541773e-06, "loss": 0.9616, "step": 14597 }, { "epoch": 0.34, "learning_rate": 7.704453384976067e-06, "loss": 1.2212, "step": 14598 }, { "epoch": 0.34, "learning_rate": 7.704137493152017e-06, "loss": 0.9097, "step": 14599 }, { "epoch": 0.34, "learning_rate": 7.703821586071407e-06, "loss": 1.2451, "step": 14600 }, { "epoch": 0.34, "learning_rate": 7.703505663736022e-06, "loss": 1.1464, "step": 14601 }, { "epoch": 0.34, "learning_rate": 7.70318972614764e-06, "loss": 1.0145, "step": 14602 }, { "epoch": 0.34, "learning_rate": 7.702873773308046e-06, "loss": 0.8126, "step": 14603 }, { "epoch": 0.34, "learning_rate": 7.702557805219022e-06, "loss": 1.045, "step": 14604 }, { "epoch": 0.34, "learning_rate": 7.702241821882351e-06, "loss": 0.961, "step": 14605 }, { "epoch": 0.34, "learning_rate": 7.701925823299816e-06, "loss": 1.2203, "step": 14606 }, { "epoch": 0.34, "learning_rate": 7.701609809473198e-06, "loss": 1.0069, "step": 14607 }, { "epoch": 0.34, "learning_rate": 7.701293780404281e-06, "loss": 0.953, "step": 14608 }, { "epoch": 0.34, "learning_rate": 7.70097773609485e-06, "loss": 0.9333, "step": 14609 }, { "epoch": 0.34, "learning_rate": 7.700661676546685e-06, "loss": 1.1419, "step": 14610 }, { "epoch": 0.34, "learning_rate": 7.700345601761572e-06, "loss": 1.1281, "step": 14611 }, { "epoch": 0.34, "learning_rate": 7.700029511741291e-06, "loss": 0.6733, "step": 14612 }, { "epoch": 0.34, "learning_rate": 7.699713406487627e-06, "loss": 0.975, "step": 14613 }, { "epoch": 0.34, "learning_rate": 7.699397286002367e-06, "loss": 1.0528, "step": 14614 }, { "epoch": 0.34, "learning_rate": 7.699081150287286e-06, "loss": 0.9979, "step": 14615 }, { "epoch": 0.34, "learning_rate": 7.698764999344175e-06, "loss": 1.1799, "step": 14616 }, { "epoch": 0.34, "learning_rate": 7.698448833174816e-06, "loss": 0.935, "step": 14617 }, { "epoch": 0.34, "learning_rate": 7.698132651780993e-06, "loss": 1.022, "step": 14618 }, { "epoch": 0.34, "learning_rate": 7.697816455164489e-06, "loss": 0.7407, "step": 14619 }, { "epoch": 0.34, "learning_rate": 7.697500243327086e-06, "loss": 0.8823, "step": 14620 }, { "epoch": 0.34, "learning_rate": 7.69718401627057e-06, "loss": 0.9743, "step": 14621 }, { "epoch": 0.34, "learning_rate": 7.696867773996727e-06, "loss": 1.0776, "step": 14622 }, { "epoch": 0.34, "learning_rate": 7.69655151650734e-06, "loss": 1.0531, "step": 14623 }, { "epoch": 0.34, "learning_rate": 7.69623524380419e-06, "loss": 0.9804, "step": 14624 }, { "epoch": 0.34, "learning_rate": 7.695918955889068e-06, "loss": 1.0621, "step": 14625 }, { "epoch": 0.34, "learning_rate": 7.695602652763752e-06, "loss": 1.1275, "step": 14626 }, { "epoch": 0.34, "learning_rate": 7.69528633443003e-06, "loss": 0.9033, "step": 14627 }, { "epoch": 0.34, "learning_rate": 7.694970000889686e-06, "loss": 0.7783, "step": 14628 }, { "epoch": 0.34, "learning_rate": 7.694653652144504e-06, "loss": 0.9563, "step": 14629 }, { "epoch": 0.34, "learning_rate": 7.694337288196268e-06, "loss": 1.2137, "step": 14630 }, { "epoch": 0.34, "learning_rate": 7.694020909046766e-06, "loss": 0.883, "step": 14631 }, { "epoch": 0.34, "learning_rate": 7.693704514697781e-06, "loss": 0.9153, "step": 14632 }, { "epoch": 0.34, "learning_rate": 7.693388105151099e-06, "loss": 0.8699, "step": 14633 }, { "epoch": 0.34, "learning_rate": 7.693071680408504e-06, "loss": 0.7675, "step": 14634 }, { "epoch": 0.34, "learning_rate": 7.692755240471782e-06, "loss": 0.927, "step": 14635 }, { "epoch": 0.34, "learning_rate": 7.692438785342718e-06, "loss": 0.9953, "step": 14636 }, { "epoch": 0.34, "learning_rate": 7.692122315023095e-06, "loss": 0.9755, "step": 14637 }, { "epoch": 0.34, "learning_rate": 7.691805829514705e-06, "loss": 0.9738, "step": 14638 }, { "epoch": 0.34, "learning_rate": 7.691489328819328e-06, "loss": 0.5958, "step": 14639 }, { "epoch": 0.34, "learning_rate": 7.691172812938752e-06, "loss": 0.794, "step": 14640 }, { "epoch": 0.34, "learning_rate": 7.69085628187476e-06, "loss": 0.9333, "step": 14641 }, { "epoch": 0.34, "learning_rate": 7.690539735629141e-06, "loss": 0.7051, "step": 14642 }, { "epoch": 0.34, "learning_rate": 7.69022317420368e-06, "loss": 1.1371, "step": 14643 }, { "epoch": 0.34, "learning_rate": 7.689906597600163e-06, "loss": 0.8914, "step": 14644 }, { "epoch": 0.34, "learning_rate": 7.689590005820376e-06, "loss": 1.0636, "step": 14645 }, { "epoch": 0.34, "learning_rate": 7.689273398866104e-06, "loss": 0.7796, "step": 14646 }, { "epoch": 0.34, "learning_rate": 7.688956776739137e-06, "loss": 0.9619, "step": 14647 }, { "epoch": 0.34, "learning_rate": 7.688640139441256e-06, "loss": 0.933, "step": 14648 }, { "epoch": 0.34, "learning_rate": 7.688323486974251e-06, "loss": 0.7122, "step": 14649 }, { "epoch": 0.34, "learning_rate": 7.68800681933991e-06, "loss": 0.7201, "step": 14650 }, { "epoch": 0.34, "learning_rate": 7.687690136540014e-06, "loss": 0.9468, "step": 14651 }, { "epoch": 0.34, "learning_rate": 7.687373438576355e-06, "loss": 0.9989, "step": 14652 }, { "epoch": 0.34, "learning_rate": 7.687056725450716e-06, "loss": 1.0202, "step": 14653 }, { "epoch": 0.34, "learning_rate": 7.686739997164887e-06, "loss": 0.9197, "step": 14654 }, { "epoch": 0.34, "learning_rate": 7.686423253720653e-06, "loss": 0.9331, "step": 14655 }, { "epoch": 0.34, "learning_rate": 7.686106495119805e-06, "loss": 0.6572, "step": 14656 }, { "epoch": 0.34, "learning_rate": 7.685789721364124e-06, "loss": 1.2578, "step": 14657 }, { "epoch": 0.34, "learning_rate": 7.6854729324554e-06, "loss": 1.0313, "step": 14658 }, { "epoch": 0.34, "learning_rate": 7.685156128395421e-06, "loss": 0.8941, "step": 14659 }, { "epoch": 0.34, "learning_rate": 7.684839309185974e-06, "loss": 1.1758, "step": 14660 }, { "epoch": 0.34, "learning_rate": 7.684522474828844e-06, "loss": 0.9574, "step": 14661 }, { "epoch": 0.34, "learning_rate": 7.684205625325824e-06, "loss": 0.8664, "step": 14662 }, { "epoch": 0.34, "learning_rate": 7.683888760678697e-06, "loss": 1.0611, "step": 14663 }, { "epoch": 0.34, "learning_rate": 7.683571880889252e-06, "loss": 0.7886, "step": 14664 }, { "epoch": 0.34, "learning_rate": 7.683254985959277e-06, "loss": 0.7601, "step": 14665 }, { "epoch": 0.34, "learning_rate": 7.68293807589056e-06, "loss": 0.795, "step": 14666 }, { "epoch": 0.34, "learning_rate": 7.68262115068489e-06, "loss": 0.9104, "step": 14667 }, { "epoch": 0.34, "learning_rate": 7.682304210344051e-06, "loss": 0.8517, "step": 14668 }, { "epoch": 0.34, "learning_rate": 7.681987254869837e-06, "loss": 0.7894, "step": 14669 }, { "epoch": 0.34, "learning_rate": 7.681670284264033e-06, "loss": 1.0038, "step": 14670 }, { "epoch": 0.34, "learning_rate": 7.681353298528426e-06, "loss": 1.169, "step": 14671 }, { "epoch": 0.34, "learning_rate": 7.681036297664808e-06, "loss": 0.8728, "step": 14672 }, { "epoch": 0.34, "learning_rate": 7.680719281674965e-06, "loss": 0.9469, "step": 14673 }, { "epoch": 0.34, "learning_rate": 7.680402250560683e-06, "loss": 0.9606, "step": 14674 }, { "epoch": 0.34, "learning_rate": 7.680085204323758e-06, "loss": 1.0538, "step": 14675 }, { "epoch": 0.34, "learning_rate": 7.679768142965973e-06, "loss": 0.8412, "step": 14676 }, { "epoch": 0.34, "learning_rate": 7.67945106648912e-06, "loss": 0.9818, "step": 14677 }, { "epoch": 0.34, "learning_rate": 7.679133974894984e-06, "loss": 0.8183, "step": 14678 }, { "epoch": 0.34, "learning_rate": 7.678816868185358e-06, "loss": 0.7997, "step": 14679 }, { "epoch": 0.34, "learning_rate": 7.678499746362028e-06, "loss": 0.7823, "step": 14680 }, { "epoch": 0.34, "learning_rate": 7.678182609426785e-06, "loss": 0.9464, "step": 14681 }, { "epoch": 0.34, "learning_rate": 7.677865457381417e-06, "loss": 1.1357, "step": 14682 }, { "epoch": 0.34, "learning_rate": 7.677548290227717e-06, "loss": 1.0444, "step": 14683 }, { "epoch": 0.34, "learning_rate": 7.67723110796747e-06, "loss": 1.1271, "step": 14684 }, { "epoch": 0.34, "learning_rate": 7.676913910602468e-06, "loss": 0.9624, "step": 14685 }, { "epoch": 0.34, "learning_rate": 7.676596698134497e-06, "loss": 0.9548, "step": 14686 }, { "epoch": 0.34, "learning_rate": 7.676279470565353e-06, "loss": 1.0545, "step": 14687 }, { "epoch": 0.34, "learning_rate": 7.67596222789682e-06, "loss": 0.9488, "step": 14688 }, { "epoch": 0.34, "learning_rate": 7.675644970130694e-06, "loss": 1.0167, "step": 14689 }, { "epoch": 0.34, "learning_rate": 7.675327697268755e-06, "loss": 1.0099, "step": 14690 }, { "epoch": 0.34, "learning_rate": 7.675010409312803e-06, "loss": 0.9761, "step": 14691 }, { "epoch": 0.34, "learning_rate": 7.674693106264624e-06, "loss": 0.9815, "step": 14692 }, { "epoch": 0.34, "learning_rate": 7.674375788126008e-06, "loss": 1.0176, "step": 14693 }, { "epoch": 0.34, "learning_rate": 7.674058454898745e-06, "loss": 0.9518, "step": 14694 }, { "epoch": 0.34, "learning_rate": 7.673741106584627e-06, "loss": 0.8687, "step": 14695 }, { "epoch": 0.34, "learning_rate": 7.673423743185444e-06, "loss": 1.1215, "step": 14696 }, { "epoch": 0.34, "learning_rate": 7.673106364702984e-06, "loss": 0.8319, "step": 14697 }, { "epoch": 0.34, "learning_rate": 7.672788971139042e-06, "loss": 1.0713, "step": 14698 }, { "epoch": 0.34, "learning_rate": 7.672471562495406e-06, "loss": 0.9588, "step": 14699 }, { "epoch": 0.34, "learning_rate": 7.672154138773867e-06, "loss": 1.1936, "step": 14700 }, { "epoch": 0.34, "learning_rate": 7.671836699976213e-06, "loss": 1.0548, "step": 14701 }, { "epoch": 0.34, "learning_rate": 7.671519246104243e-06, "loss": 0.8967, "step": 14702 }, { "epoch": 0.34, "learning_rate": 7.67120177715974e-06, "loss": 0.8478, "step": 14703 }, { "epoch": 0.34, "learning_rate": 7.6708842931445e-06, "loss": 1.1027, "step": 14704 }, { "epoch": 0.34, "learning_rate": 7.67056679406031e-06, "loss": 1.0862, "step": 14705 }, { "epoch": 0.34, "learning_rate": 7.670249279908968e-06, "loss": 1.0304, "step": 14706 }, { "epoch": 0.34, "learning_rate": 7.669931750692257e-06, "loss": 0.8857, "step": 14707 }, { "epoch": 0.34, "learning_rate": 7.669614206411975e-06, "loss": 1.1401, "step": 14708 }, { "epoch": 0.34, "learning_rate": 7.66929664706991e-06, "loss": 0.8686, "step": 14709 }, { "epoch": 0.34, "learning_rate": 7.668979072667858e-06, "loss": 1.2158, "step": 14710 }, { "epoch": 0.34, "learning_rate": 7.668661483207605e-06, "loss": 0.7941, "step": 14711 }, { "epoch": 0.34, "learning_rate": 7.668343878690944e-06, "loss": 0.9706, "step": 14712 }, { "epoch": 0.34, "learning_rate": 7.66802625911967e-06, "loss": 1.02, "step": 14713 }, { "epoch": 0.34, "learning_rate": 7.667708624495574e-06, "loss": 1.0294, "step": 14714 }, { "epoch": 0.34, "learning_rate": 7.667390974820446e-06, "loss": 1.0392, "step": 14715 }, { "epoch": 0.34, "learning_rate": 7.66707331009608e-06, "loss": 0.9558, "step": 14716 }, { "epoch": 0.34, "learning_rate": 7.666755630324268e-06, "loss": 0.6608, "step": 14717 }, { "epoch": 0.34, "learning_rate": 7.666437935506804e-06, "loss": 0.9306, "step": 14718 }, { "epoch": 0.34, "learning_rate": 7.666120225645475e-06, "loss": 0.9703, "step": 14719 }, { "epoch": 0.34, "learning_rate": 7.66580250074208e-06, "loss": 0.9505, "step": 14720 }, { "epoch": 0.34, "learning_rate": 7.665484760798406e-06, "loss": 0.8376, "step": 14721 }, { "epoch": 0.34, "learning_rate": 7.66516700581625e-06, "loss": 0.9477, "step": 14722 }, { "epoch": 0.34, "learning_rate": 7.664849235797402e-06, "loss": 0.9007, "step": 14723 }, { "epoch": 0.34, "learning_rate": 7.664531450743657e-06, "loss": 0.8243, "step": 14724 }, { "epoch": 0.34, "learning_rate": 7.664213650656806e-06, "loss": 0.8065, "step": 14725 }, { "epoch": 0.34, "learning_rate": 7.663895835538643e-06, "loss": 0.8378, "step": 14726 }, { "epoch": 0.34, "learning_rate": 7.663578005390962e-06, "loss": 0.7961, "step": 14727 }, { "epoch": 0.34, "learning_rate": 7.663260160215552e-06, "loss": 1.0687, "step": 14728 }, { "epoch": 0.34, "learning_rate": 7.662942300014214e-06, "loss": 1.2125, "step": 14729 }, { "epoch": 0.34, "learning_rate": 7.662624424788733e-06, "loss": 1.0074, "step": 14730 }, { "epoch": 0.34, "learning_rate": 7.662306534540908e-06, "loss": 0.8668, "step": 14731 }, { "epoch": 0.34, "learning_rate": 7.66198862927253e-06, "loss": 0.8577, "step": 14732 }, { "epoch": 0.34, "learning_rate": 7.661670708985392e-06, "loss": 1.0092, "step": 14733 }, { "epoch": 0.34, "learning_rate": 7.66135277368129e-06, "loss": 1.0068, "step": 14734 }, { "epoch": 0.34, "learning_rate": 7.661034823362017e-06, "loss": 0.9108, "step": 14735 }, { "epoch": 0.34, "learning_rate": 7.660716858029366e-06, "loss": 0.9887, "step": 14736 }, { "epoch": 0.34, "learning_rate": 7.660398877685132e-06, "loss": 0.8373, "step": 14737 }, { "epoch": 0.34, "learning_rate": 7.660080882331109e-06, "loss": 0.789, "step": 14738 }, { "epoch": 0.34, "learning_rate": 7.659762871969089e-06, "loss": 0.9934, "step": 14739 }, { "epoch": 0.34, "learning_rate": 7.659444846600868e-06, "loss": 0.9642, "step": 14740 }, { "epoch": 0.34, "learning_rate": 7.659126806228242e-06, "loss": 0.8702, "step": 14741 }, { "epoch": 0.34, "learning_rate": 7.658808750853e-06, "loss": 0.7593, "step": 14742 }, { "epoch": 0.34, "learning_rate": 7.658490680476943e-06, "loss": 0.9773, "step": 14743 }, { "epoch": 0.34, "learning_rate": 7.658172595101861e-06, "loss": 0.9392, "step": 14744 }, { "epoch": 0.34, "learning_rate": 7.657854494729551e-06, "loss": 0.9965, "step": 14745 }, { "epoch": 0.34, "learning_rate": 7.657536379361806e-06, "loss": 0.9988, "step": 14746 }, { "epoch": 0.34, "learning_rate": 7.657218249000422e-06, "loss": 0.8714, "step": 14747 }, { "epoch": 0.34, "learning_rate": 7.656900103647193e-06, "loss": 0.8133, "step": 14748 }, { "epoch": 0.34, "learning_rate": 7.656581943303914e-06, "loss": 0.8088, "step": 14749 }, { "epoch": 0.34, "learning_rate": 7.65626376797238e-06, "loss": 0.9796, "step": 14750 }, { "epoch": 0.34, "learning_rate": 7.655945577654388e-06, "loss": 0.8777, "step": 14751 }, { "epoch": 0.34, "learning_rate": 7.65562737235173e-06, "loss": 0.7292, "step": 14752 }, { "epoch": 0.34, "learning_rate": 7.655309152066204e-06, "loss": 0.9038, "step": 14753 }, { "epoch": 0.34, "learning_rate": 7.654990916799603e-06, "loss": 0.9669, "step": 14754 }, { "epoch": 0.34, "learning_rate": 7.654672666553726e-06, "loss": 1.007, "step": 14755 }, { "epoch": 0.34, "learning_rate": 7.654354401330367e-06, "loss": 0.7926, "step": 14756 }, { "epoch": 0.34, "learning_rate": 7.654036121131319e-06, "loss": 0.7778, "step": 14757 }, { "epoch": 0.34, "learning_rate": 7.65371782595838e-06, "loss": 0.6403, "step": 14758 }, { "epoch": 0.34, "learning_rate": 7.653399515813345e-06, "loss": 1.0824, "step": 14759 }, { "epoch": 0.34, "learning_rate": 7.653081190698012e-06, "loss": 0.9212, "step": 14760 }, { "epoch": 0.34, "learning_rate": 7.652762850614175e-06, "loss": 1.1403, "step": 14761 }, { "epoch": 0.34, "learning_rate": 7.652444495563631e-06, "loss": 0.7665, "step": 14762 }, { "epoch": 0.34, "learning_rate": 7.652126125548174e-06, "loss": 1.1946, "step": 14763 }, { "epoch": 0.34, "learning_rate": 7.651807740569602e-06, "loss": 0.7047, "step": 14764 }, { "epoch": 0.34, "learning_rate": 7.651489340629712e-06, "loss": 0.8183, "step": 14765 }, { "epoch": 0.34, "learning_rate": 7.651170925730297e-06, "loss": 0.7607, "step": 14766 }, { "epoch": 0.34, "learning_rate": 7.650852495873159e-06, "loss": 1.1114, "step": 14767 }, { "epoch": 0.34, "learning_rate": 7.650534051060092e-06, "loss": 0.6695, "step": 14768 }, { "epoch": 0.34, "learning_rate": 7.650215591292888e-06, "loss": 0.9371, "step": 14769 }, { "epoch": 0.34, "learning_rate": 7.649897116573353e-06, "loss": 0.9696, "step": 14770 }, { "epoch": 0.34, "learning_rate": 7.649578626903276e-06, "loss": 0.9462, "step": 14771 }, { "epoch": 0.34, "learning_rate": 7.649260122284456e-06, "loss": 0.6525, "step": 14772 }, { "epoch": 0.34, "learning_rate": 7.648941602718692e-06, "loss": 1.2671, "step": 14773 }, { "epoch": 0.34, "learning_rate": 7.648623068207778e-06, "loss": 0.7577, "step": 14774 }, { "epoch": 0.34, "learning_rate": 7.648304518753516e-06, "loss": 1.298, "step": 14775 }, { "epoch": 0.34, "learning_rate": 7.647985954357698e-06, "loss": 1.1065, "step": 14776 }, { "epoch": 0.34, "learning_rate": 7.64766737502212e-06, "loss": 0.7961, "step": 14777 }, { "epoch": 0.34, "learning_rate": 7.647348780748589e-06, "loss": 0.7704, "step": 14778 }, { "epoch": 0.34, "learning_rate": 7.647030171538892e-06, "loss": 0.9268, "step": 14779 }, { "epoch": 0.34, "learning_rate": 7.646711547394835e-06, "loss": 1.0222, "step": 14780 }, { "epoch": 0.34, "learning_rate": 7.646392908318207e-06, "loss": 1.0014, "step": 14781 }, { "epoch": 0.34, "learning_rate": 7.64607425431081e-06, "loss": 1.1069, "step": 14782 }, { "epoch": 0.34, "learning_rate": 7.645755585374445e-06, "loss": 0.9962, "step": 14783 }, { "epoch": 0.34, "learning_rate": 7.645436901510906e-06, "loss": 0.9508, "step": 14784 }, { "epoch": 0.34, "learning_rate": 7.645118202721993e-06, "loss": 1.2843, "step": 14785 }, { "epoch": 0.34, "learning_rate": 7.6447994890095e-06, "loss": 1.2259, "step": 14786 }, { "epoch": 0.34, "learning_rate": 7.644480760375232e-06, "loss": 0.9357, "step": 14787 }, { "epoch": 0.34, "learning_rate": 7.644162016820981e-06, "loss": 0.8262, "step": 14788 }, { "epoch": 0.34, "learning_rate": 7.64384325834855e-06, "loss": 0.9303, "step": 14789 }, { "epoch": 0.34, "learning_rate": 7.643524484959732e-06, "loss": 0.999, "step": 14790 }, { "epoch": 0.34, "learning_rate": 7.64320569665633e-06, "loss": 0.878, "step": 14791 }, { "epoch": 0.34, "learning_rate": 7.64288689344014e-06, "loss": 1.0212, "step": 14792 }, { "epoch": 0.34, "learning_rate": 7.642568075312965e-06, "loss": 0.9685, "step": 14793 }, { "epoch": 0.34, "learning_rate": 7.642249242276599e-06, "loss": 0.9259, "step": 14794 }, { "epoch": 0.34, "learning_rate": 7.641930394332842e-06, "loss": 0.9127, "step": 14795 }, { "epoch": 0.34, "learning_rate": 7.641611531483493e-06, "loss": 0.7093, "step": 14796 }, { "epoch": 0.34, "learning_rate": 7.641292653730355e-06, "loss": 1.0521, "step": 14797 }, { "epoch": 0.34, "learning_rate": 7.640973761075218e-06, "loss": 1.0461, "step": 14798 }, { "epoch": 0.34, "learning_rate": 7.64065485351989e-06, "loss": 0.8946, "step": 14799 }, { "epoch": 0.34, "learning_rate": 7.640335931066167e-06, "loss": 0.7938, "step": 14800 }, { "epoch": 0.34, "learning_rate": 7.640016993715847e-06, "loss": 1.1223, "step": 14801 }, { "epoch": 0.34, "learning_rate": 7.639698041470732e-06, "loss": 0.9892, "step": 14802 }, { "epoch": 0.34, "learning_rate": 7.63937907433262e-06, "loss": 1.2753, "step": 14803 }, { "epoch": 0.34, "learning_rate": 7.639060092303308e-06, "loss": 1.03, "step": 14804 }, { "epoch": 0.34, "learning_rate": 7.638741095384603e-06, "loss": 0.746, "step": 14805 }, { "epoch": 0.34, "learning_rate": 7.638422083578296e-06, "loss": 0.7708, "step": 14806 }, { "epoch": 0.34, "learning_rate": 7.638103056886195e-06, "loss": 1.1392, "step": 14807 }, { "epoch": 0.34, "learning_rate": 7.637784015310093e-06, "loss": 1.1692, "step": 14808 }, { "epoch": 0.34, "learning_rate": 7.637464958851795e-06, "loss": 0.8351, "step": 14809 }, { "epoch": 0.34, "learning_rate": 7.637145887513097e-06, "loss": 1.0979, "step": 14810 }, { "epoch": 0.34, "learning_rate": 7.636826801295803e-06, "loss": 0.8833, "step": 14811 }, { "epoch": 0.34, "learning_rate": 7.636507700201712e-06, "loss": 0.8639, "step": 14812 }, { "epoch": 0.34, "learning_rate": 7.636188584232622e-06, "loss": 0.795, "step": 14813 }, { "epoch": 0.34, "learning_rate": 7.635869453390337e-06, "loss": 0.9447, "step": 14814 }, { "epoch": 0.34, "learning_rate": 7.635550307676656e-06, "loss": 0.8141, "step": 14815 }, { "epoch": 0.34, "learning_rate": 7.635231147093376e-06, "loss": 1.1071, "step": 14816 }, { "epoch": 0.34, "learning_rate": 7.634911971642304e-06, "loss": 0.8379, "step": 14817 }, { "epoch": 0.34, "learning_rate": 7.634592781325238e-06, "loss": 0.8683, "step": 14818 }, { "epoch": 0.34, "learning_rate": 7.634273576143978e-06, "loss": 1.1668, "step": 14819 }, { "epoch": 0.34, "learning_rate": 7.633954356100326e-06, "loss": 0.6703, "step": 14820 }, { "epoch": 0.34, "learning_rate": 7.633635121196083e-06, "loss": 1.0087, "step": 14821 }, { "epoch": 0.34, "learning_rate": 7.633315871433049e-06, "loss": 1.144, "step": 14822 }, { "epoch": 0.34, "learning_rate": 7.632996606813028e-06, "loss": 0.9404, "step": 14823 }, { "epoch": 0.34, "learning_rate": 7.632677327337816e-06, "loss": 0.8085, "step": 14824 }, { "epoch": 0.34, "learning_rate": 7.63235803300922e-06, "loss": 0.7879, "step": 14825 }, { "epoch": 0.34, "learning_rate": 7.632038723829038e-06, "loss": 0.6719, "step": 14826 }, { "epoch": 0.34, "learning_rate": 7.631719399799074e-06, "loss": 0.9898, "step": 14827 }, { "epoch": 0.34, "learning_rate": 7.631400060921126e-06, "loss": 1.064, "step": 14828 }, { "epoch": 0.34, "learning_rate": 7.631080707196999e-06, "loss": 0.8125, "step": 14829 }, { "epoch": 0.34, "learning_rate": 7.630761338628493e-06, "loss": 0.9258, "step": 14830 }, { "epoch": 0.34, "learning_rate": 7.630441955217411e-06, "loss": 0.9634, "step": 14831 }, { "epoch": 0.34, "learning_rate": 7.630122556965556e-06, "loss": 0.9016, "step": 14832 }, { "epoch": 0.34, "learning_rate": 7.629803143874725e-06, "loss": 0.8185, "step": 14833 }, { "epoch": 0.34, "learning_rate": 7.629483715946727e-06, "loss": 0.9312, "step": 14834 }, { "epoch": 0.34, "learning_rate": 7.629164273183358e-06, "loss": 0.9708, "step": 14835 }, { "epoch": 0.34, "learning_rate": 7.628844815586424e-06, "loss": 0.8987, "step": 14836 }, { "epoch": 0.34, "learning_rate": 7.628525343157727e-06, "loss": 0.776, "step": 14837 }, { "epoch": 0.34, "learning_rate": 7.628205855899067e-06, "loss": 1.0951, "step": 14838 }, { "epoch": 0.34, "learning_rate": 7.627886353812251e-06, "loss": 0.8809, "step": 14839 }, { "epoch": 0.34, "learning_rate": 7.627566836899076e-06, "loss": 0.9036, "step": 14840 }, { "epoch": 0.34, "learning_rate": 7.627247305161349e-06, "loss": 0.9398, "step": 14841 }, { "epoch": 0.34, "learning_rate": 7.626927758600872e-06, "loss": 1.2021, "step": 14842 }, { "epoch": 0.34, "learning_rate": 7.626608197219446e-06, "loss": 1.0021, "step": 14843 }, { "epoch": 0.34, "learning_rate": 7.626288621018877e-06, "loss": 0.8463, "step": 14844 }, { "epoch": 0.34, "learning_rate": 7.625969030000965e-06, "loss": 1.0113, "step": 14845 }, { "epoch": 0.34, "learning_rate": 7.6256494241675135e-06, "loss": 1.0183, "step": 14846 }, { "epoch": 0.34, "learning_rate": 7.625329803520328e-06, "loss": 0.8318, "step": 14847 }, { "epoch": 0.34, "learning_rate": 7.625010168061211e-06, "loss": 1.1788, "step": 14848 }, { "epoch": 0.34, "learning_rate": 7.624690517791964e-06, "loss": 1.0406, "step": 14849 }, { "epoch": 0.34, "learning_rate": 7.624370852714391e-06, "loss": 1.0018, "step": 14850 }, { "epoch": 0.34, "learning_rate": 7.624051172830298e-06, "loss": 0.9365, "step": 14851 }, { "epoch": 0.34, "learning_rate": 7.623731478141485e-06, "loss": 0.8584, "step": 14852 }, { "epoch": 0.34, "learning_rate": 7.623411768649759e-06, "loss": 1.1132, "step": 14853 }, { "epoch": 0.34, "learning_rate": 7.623092044356921e-06, "loss": 1.045, "step": 14854 }, { "epoch": 0.34, "learning_rate": 7.6227723052647765e-06, "loss": 1.0034, "step": 14855 }, { "epoch": 0.34, "learning_rate": 7.622452551375129e-06, "loss": 0.7193, "step": 14856 }, { "epoch": 0.34, "learning_rate": 7.622132782689783e-06, "loss": 1.0394, "step": 14857 }, { "epoch": 0.34, "learning_rate": 7.621812999210541e-06, "loss": 1.1445, "step": 14858 }, { "epoch": 0.34, "learning_rate": 7.621493200939211e-06, "loss": 0.9314, "step": 14859 }, { "epoch": 0.34, "learning_rate": 7.6211733878775915e-06, "loss": 0.6217, "step": 14860 }, { "epoch": 0.34, "learning_rate": 7.6208535600274916e-06, "loss": 1.1036, "step": 14861 }, { "epoch": 0.34, "learning_rate": 7.620533717390715e-06, "loss": 0.8379, "step": 14862 }, { "epoch": 0.34, "learning_rate": 7.620213859969063e-06, "loss": 0.9684, "step": 14863 }, { "epoch": 0.34, "learning_rate": 7.619893987764344e-06, "loss": 0.9729, "step": 14864 }, { "epoch": 0.34, "learning_rate": 7.619574100778362e-06, "loss": 1.1219, "step": 14865 }, { "epoch": 0.34, "learning_rate": 7.619254199012921e-06, "loss": 0.8418, "step": 14866 }, { "epoch": 0.34, "learning_rate": 7.618934282469825e-06, "loss": 0.8454, "step": 14867 }, { "epoch": 0.34, "learning_rate": 7.618614351150879e-06, "loss": 0.6997, "step": 14868 }, { "epoch": 0.34, "learning_rate": 7.6182944050578925e-06, "loss": 0.9231, "step": 14869 }, { "epoch": 0.34, "learning_rate": 7.617974444192664e-06, "loss": 1.0325, "step": 14870 }, { "epoch": 0.34, "learning_rate": 7.617654468557003e-06, "loss": 0.8524, "step": 14871 }, { "epoch": 0.34, "learning_rate": 7.617334478152714e-06, "loss": 0.9894, "step": 14872 }, { "epoch": 0.34, "learning_rate": 7.617014472981601e-06, "loss": 0.7925, "step": 14873 }, { "epoch": 0.34, "learning_rate": 7.61669445304547e-06, "loss": 0.8708, "step": 14874 }, { "epoch": 0.34, "learning_rate": 7.616374418346127e-06, "loss": 1.3095, "step": 14875 }, { "epoch": 0.34, "learning_rate": 7.6160543688853784e-06, "loss": 1.0182, "step": 14876 }, { "epoch": 0.35, "learning_rate": 7.615734304665028e-06, "loss": 0.8593, "step": 14877 }, { "epoch": 0.35, "learning_rate": 7.615414225686884e-06, "loss": 0.7992, "step": 14878 }, { "epoch": 0.35, "learning_rate": 7.61509413195275e-06, "loss": 0.9333, "step": 14879 }, { "epoch": 0.35, "learning_rate": 7.6147740234644305e-06, "loss": 0.6936, "step": 14880 }, { "epoch": 0.35, "learning_rate": 7.6144539002237376e-06, "loss": 0.9932, "step": 14881 }, { "epoch": 0.35, "learning_rate": 7.6141337622324715e-06, "loss": 0.79, "step": 14882 }, { "epoch": 0.35, "learning_rate": 7.613813609492442e-06, "loss": 1.0148, "step": 14883 }, { "epoch": 0.35, "learning_rate": 7.613493442005453e-06, "loss": 1.0235, "step": 14884 }, { "epoch": 0.35, "learning_rate": 7.613173259773311e-06, "loss": 1.0054, "step": 14885 }, { "epoch": 0.35, "learning_rate": 7.612853062797825e-06, "loss": 1.119, "step": 14886 }, { "epoch": 0.35, "learning_rate": 7.612532851080799e-06, "loss": 0.9035, "step": 14887 }, { "epoch": 0.35, "learning_rate": 7.6122126246240394e-06, "loss": 1.1884, "step": 14888 }, { "epoch": 0.35, "learning_rate": 7.611892383429353e-06, "loss": 0.8517, "step": 14889 }, { "epoch": 0.35, "learning_rate": 7.6115721274985495e-06, "loss": 0.8099, "step": 14890 }, { "epoch": 0.35, "learning_rate": 7.611251856833434e-06, "loss": 0.8764, "step": 14891 }, { "epoch": 0.35, "learning_rate": 7.6109315714358125e-06, "loss": 1.0561, "step": 14892 }, { "epoch": 0.35, "learning_rate": 7.610611271307492e-06, "loss": 1.0814, "step": 14893 }, { "epoch": 0.35, "learning_rate": 7.6102909564502815e-06, "loss": 1.0985, "step": 14894 }, { "epoch": 0.35, "learning_rate": 7.609970626865985e-06, "loss": 1.1593, "step": 14895 }, { "epoch": 0.35, "learning_rate": 7.6096502825564134e-06, "loss": 1.1573, "step": 14896 }, { "epoch": 0.35, "learning_rate": 7.609329923523372e-06, "loss": 0.7574, "step": 14897 }, { "epoch": 0.35, "learning_rate": 7.609009549768669e-06, "loss": 0.8267, "step": 14898 }, { "epoch": 0.35, "learning_rate": 7.608689161294111e-06, "loss": 1.0066, "step": 14899 }, { "epoch": 0.35, "learning_rate": 7.608368758101505e-06, "loss": 1.0304, "step": 14900 }, { "epoch": 0.35, "learning_rate": 7.608048340192662e-06, "loss": 0.8064, "step": 14901 }, { "epoch": 0.35, "learning_rate": 7.607727907569388e-06, "loss": 0.9915, "step": 14902 }, { "epoch": 0.35, "learning_rate": 7.6074074602334895e-06, "loss": 1.0186, "step": 14903 }, { "epoch": 0.35, "learning_rate": 7.607086998186774e-06, "loss": 1.007, "step": 14904 }, { "epoch": 0.35, "learning_rate": 7.606766521431052e-06, "loss": 0.8307, "step": 14905 }, { "epoch": 0.35, "learning_rate": 7.606446029968133e-06, "loss": 0.8601, "step": 14906 }, { "epoch": 0.35, "learning_rate": 7.60612552379982e-06, "loss": 0.9189, "step": 14907 }, { "epoch": 0.35, "learning_rate": 7.6058050029279265e-06, "loss": 0.9194, "step": 14908 }, { "epoch": 0.35, "learning_rate": 7.6054844673542545e-06, "loss": 0.8062, "step": 14909 }, { "epoch": 0.35, "learning_rate": 7.6051639170806205e-06, "loss": 0.9817, "step": 14910 }, { "epoch": 0.35, "learning_rate": 7.604843352108826e-06, "loss": 0.9859, "step": 14911 }, { "epoch": 0.35, "learning_rate": 7.604522772440683e-06, "loss": 0.8508, "step": 14912 }, { "epoch": 0.35, "learning_rate": 7.604202178078002e-06, "loss": 0.6282, "step": 14913 }, { "epoch": 0.35, "learning_rate": 7.603881569022587e-06, "loss": 0.8855, "step": 14914 }, { "epoch": 0.35, "learning_rate": 7.603560945276249e-06, "loss": 0.8351, "step": 14915 }, { "epoch": 0.35, "learning_rate": 7.6032403068407986e-06, "loss": 0.9362, "step": 14916 }, { "epoch": 0.35, "learning_rate": 7.602919653718044e-06, "loss": 0.9503, "step": 14917 }, { "epoch": 0.35, "learning_rate": 7.602598985909793e-06, "loss": 0.9201, "step": 14918 }, { "epoch": 0.35, "learning_rate": 7.602278303417856e-06, "loss": 0.8753, "step": 14919 }, { "epoch": 0.35, "learning_rate": 7.60195760624404e-06, "loss": 0.9552, "step": 14920 }, { "epoch": 0.35, "learning_rate": 7.601636894390159e-06, "loss": 1.0592, "step": 14921 }, { "epoch": 0.35, "learning_rate": 7.601316167858016e-06, "loss": 0.9856, "step": 14922 }, { "epoch": 0.35, "learning_rate": 7.600995426649427e-06, "loss": 0.9005, "step": 14923 }, { "epoch": 0.35, "learning_rate": 7.600674670766197e-06, "loss": 0.9646, "step": 14924 }, { "epoch": 0.35, "learning_rate": 7.600353900210138e-06, "loss": 1.0102, "step": 14925 }, { "epoch": 0.35, "learning_rate": 7.600033114983061e-06, "loss": 0.8024, "step": 14926 }, { "epoch": 0.35, "learning_rate": 7.599712315086771e-06, "loss": 0.6697, "step": 14927 }, { "epoch": 0.35, "learning_rate": 7.599391500523083e-06, "loss": 0.8752, "step": 14928 }, { "epoch": 0.35, "learning_rate": 7.599070671293804e-06, "loss": 0.8903, "step": 14929 }, { "epoch": 0.35, "learning_rate": 7.598749827400747e-06, "loss": 0.8726, "step": 14930 }, { "epoch": 0.35, "learning_rate": 7.598428968845718e-06, "loss": 0.8998, "step": 14931 }, { "epoch": 0.35, "learning_rate": 7.59810809563053e-06, "loss": 0.6351, "step": 14932 }, { "epoch": 0.35, "learning_rate": 7.597787207756993e-06, "loss": 0.7163, "step": 14933 }, { "epoch": 0.35, "learning_rate": 7.597466305226917e-06, "loss": 0.904, "step": 14934 }, { "epoch": 0.35, "learning_rate": 7.597145388042113e-06, "loss": 0.7703, "step": 14935 }, { "epoch": 0.35, "learning_rate": 7.596824456204391e-06, "loss": 1.2622, "step": 14936 }, { "epoch": 0.35, "learning_rate": 7.596503509715562e-06, "loss": 1.0481, "step": 14937 }, { "epoch": 0.35, "learning_rate": 7.596182548577438e-06, "loss": 0.9204, "step": 14938 }, { "epoch": 0.35, "learning_rate": 7.595861572791828e-06, "loss": 0.8545, "step": 14939 }, { "epoch": 0.35, "learning_rate": 7.595540582360543e-06, "loss": 0.7769, "step": 14940 }, { "epoch": 0.35, "learning_rate": 7.595219577285397e-06, "loss": 0.8719, "step": 14941 }, { "epoch": 0.35, "learning_rate": 7.594898557568195e-06, "loss": 0.9228, "step": 14942 }, { "epoch": 0.35, "learning_rate": 7.594577523210755e-06, "loss": 1.2001, "step": 14943 }, { "epoch": 0.35, "learning_rate": 7.594256474214883e-06, "loss": 0.8266, "step": 14944 }, { "epoch": 0.35, "learning_rate": 7.593935410582393e-06, "loss": 0.8746, "step": 14945 }, { "epoch": 0.35, "learning_rate": 7.593614332315096e-06, "loss": 1.0031, "step": 14946 }, { "epoch": 0.35, "learning_rate": 7.593293239414805e-06, "loss": 0.7064, "step": 14947 }, { "epoch": 0.35, "learning_rate": 7.592972131883327e-06, "loss": 0.7665, "step": 14948 }, { "epoch": 0.35, "learning_rate": 7.592651009722478e-06, "loss": 1.0273, "step": 14949 }, { "epoch": 0.35, "learning_rate": 7.592329872934067e-06, "loss": 1.1027, "step": 14950 }, { "epoch": 0.35, "learning_rate": 7.59200872151991e-06, "loss": 0.7934, "step": 14951 }, { "epoch": 0.35, "learning_rate": 7.591687555481815e-06, "loss": 1.0196, "step": 14952 }, { "epoch": 0.35, "learning_rate": 7.591366374821594e-06, "loss": 0.8898, "step": 14953 }, { "epoch": 0.35, "learning_rate": 7.591045179541061e-06, "loss": 1.1126, "step": 14954 }, { "epoch": 0.35, "learning_rate": 7.590723969642027e-06, "loss": 1.0629, "step": 14955 }, { "epoch": 0.35, "learning_rate": 7.5904027451263065e-06, "loss": 0.7077, "step": 14956 }, { "epoch": 0.35, "learning_rate": 7.590081505995708e-06, "loss": 1.1043, "step": 14957 }, { "epoch": 0.35, "learning_rate": 7.589760252252046e-06, "loss": 0.9052, "step": 14958 }, { "epoch": 0.35, "learning_rate": 7.589438983897132e-06, "loss": 1.0392, "step": 14959 }, { "epoch": 0.35, "learning_rate": 7.589117700932781e-06, "loss": 0.92, "step": 14960 }, { "epoch": 0.35, "learning_rate": 7.588796403360802e-06, "loss": 1.1135, "step": 14961 }, { "epoch": 0.35, "learning_rate": 7.5884750911830114e-06, "loss": 1.1654, "step": 14962 }, { "epoch": 0.35, "learning_rate": 7.58815376440122e-06, "loss": 0.8251, "step": 14963 }, { "epoch": 0.35, "learning_rate": 7.5878324230172405e-06, "loss": 1.0297, "step": 14964 }, { "epoch": 0.35, "learning_rate": 7.587511067032888e-06, "loss": 0.9946, "step": 14965 }, { "epoch": 0.35, "learning_rate": 7.5871896964499726e-06, "loss": 0.7852, "step": 14966 }, { "epoch": 0.35, "learning_rate": 7.58686831127031e-06, "loss": 0.9462, "step": 14967 }, { "epoch": 0.35, "learning_rate": 7.586546911495712e-06, "loss": 1.1651, "step": 14968 }, { "epoch": 0.35, "learning_rate": 7.5862254971279926e-06, "loss": 1.0867, "step": 14969 }, { "epoch": 0.35, "learning_rate": 7.585904068168964e-06, "loss": 0.9689, "step": 14970 }, { "epoch": 0.35, "learning_rate": 7.58558262462044e-06, "loss": 1.0022, "step": 14971 }, { "epoch": 0.35, "learning_rate": 7.585261166484237e-06, "loss": 0.8148, "step": 14972 }, { "epoch": 0.35, "learning_rate": 7.584939693762164e-06, "loss": 1.1972, "step": 14973 }, { "epoch": 0.35, "learning_rate": 7.5846182064560395e-06, "loss": 1.0211, "step": 14974 }, { "epoch": 0.35, "learning_rate": 7.584296704567673e-06, "loss": 0.9333, "step": 14975 }, { "epoch": 0.35, "learning_rate": 7.58397518809888e-06, "loss": 0.7909, "step": 14976 }, { "epoch": 0.35, "learning_rate": 7.583653657051475e-06, "loss": 1.0194, "step": 14977 }, { "epoch": 0.35, "learning_rate": 7.583332111427273e-06, "loss": 0.8052, "step": 14978 }, { "epoch": 0.35, "learning_rate": 7.583010551228087e-06, "loss": 0.863, "step": 14979 }, { "epoch": 0.35, "learning_rate": 7.58268897645573e-06, "loss": 0.8237, "step": 14980 }, { "epoch": 0.35, "learning_rate": 7.5823673871120176e-06, "loss": 0.7648, "step": 14981 }, { "epoch": 0.35, "learning_rate": 7.582045783198765e-06, "loss": 0.9805, "step": 14982 }, { "epoch": 0.35, "learning_rate": 7.581724164717786e-06, "loss": 0.6337, "step": 14983 }, { "epoch": 0.35, "learning_rate": 7.581402531670893e-06, "loss": 1.187, "step": 14984 }, { "epoch": 0.35, "learning_rate": 7.581080884059903e-06, "loss": 0.895, "step": 14985 }, { "epoch": 0.35, "learning_rate": 7.580759221886631e-06, "loss": 1.0297, "step": 14986 }, { "epoch": 0.35, "learning_rate": 7.58043754515289e-06, "loss": 0.926, "step": 14987 }, { "epoch": 0.35, "learning_rate": 7.580115853860497e-06, "loss": 0.8202, "step": 14988 }, { "epoch": 0.35, "learning_rate": 7.579794148011266e-06, "loss": 1.0289, "step": 14989 }, { "epoch": 0.35, "learning_rate": 7.579472427607011e-06, "loss": 0.9742, "step": 14990 }, { "epoch": 0.35, "learning_rate": 7.5791506926495486e-06, "loss": 1.178, "step": 14991 }, { "epoch": 0.35, "learning_rate": 7.578828943140693e-06, "loss": 1.0114, "step": 14992 }, { "epoch": 0.35, "learning_rate": 7.57850717908226e-06, "loss": 0.7925, "step": 14993 }, { "epoch": 0.35, "learning_rate": 7.578185400476065e-06, "loss": 1.1119, "step": 14994 }, { "epoch": 0.35, "learning_rate": 7.577863607323923e-06, "loss": 0.8181, "step": 14995 }, { "epoch": 0.35, "learning_rate": 7.57754179962765e-06, "loss": 1.1002, "step": 14996 }, { "epoch": 0.35, "learning_rate": 7.577219977389062e-06, "loss": 0.9683, "step": 14997 }, { "epoch": 0.35, "learning_rate": 7.576898140609973e-06, "loss": 0.7653, "step": 14998 }, { "epoch": 0.35, "learning_rate": 7.576576289292201e-06, "loss": 1.046, "step": 14999 }, { "epoch": 0.35, "learning_rate": 7.576254423437561e-06, "loss": 1.0748, "step": 15000 } ], "logging_steps": 1.0, "max_steps": 43119, "num_train_epochs": 1, "save_steps": 5000, "total_flos": 4.96809906536448e+18, "trial_name": null, "trial_params": null }