{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "global_step": 7199, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 9.259259259259259e-08, "loss": 1.2556, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.8518518518518518e-07, "loss": 1.6235, "step": 2 }, { "epoch": 0.0, "learning_rate": 2.7777777777777776e-07, "loss": 1.5728, "step": 3 }, { "epoch": 0.0, "learning_rate": 3.7037037037037036e-07, "loss": 1.729, "step": 4 }, { "epoch": 0.0, "learning_rate": 4.6296296296296297e-07, "loss": 1.7358, "step": 5 }, { "epoch": 0.0, "learning_rate": 5.555555555555555e-07, "loss": 0.9945, "step": 6 }, { "epoch": 0.0, "learning_rate": 6.481481481481481e-07, "loss": 1.626, "step": 7 }, { "epoch": 0.0, "learning_rate": 7.407407407407407e-07, "loss": 1.6162, "step": 8 }, { "epoch": 0.0, "learning_rate": 8.333333333333333e-07, "loss": 1.6914, "step": 9 }, { "epoch": 0.0, "learning_rate": 9.259259259259259e-07, "loss": 1.5693, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.0185185185185185e-06, "loss": 1.5894, "step": 11 }, { "epoch": 0.0, "learning_rate": 1.111111111111111e-06, "loss": 1.5581, "step": 12 }, { "epoch": 0.0, "learning_rate": 1.2037037037037037e-06, "loss": 1.5439, "step": 13 }, { "epoch": 0.0, "learning_rate": 1.2962962962962962e-06, "loss": 1.4526, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.3888888888888892e-06, "loss": 1.4907, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.4814814814814815e-06, "loss": 1.4399, "step": 16 }, { "epoch": 0.0, "learning_rate": 1.5740740740740742e-06, "loss": 1.4019, "step": 17 }, { "epoch": 0.0, "learning_rate": 1.6666666666666667e-06, "loss": 1.3154, "step": 18 }, { "epoch": 0.0, "learning_rate": 1.7592592592592594e-06, "loss": 1.4316, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.8518518518518519e-06, "loss": 1.4116, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.944444444444445e-06, "loss": 1.3501, "step": 21 }, { "epoch": 0.0, "learning_rate": 2.037037037037037e-06, "loss": 1.3101, "step": 22 }, { "epoch": 0.0, "learning_rate": 2.1296296296296298e-06, "loss": 1.2856, "step": 23 }, { "epoch": 0.0, "learning_rate": 2.222222222222222e-06, "loss": 1.3047, "step": 24 }, { "epoch": 0.0, "learning_rate": 2.314814814814815e-06, "loss": 0.7908, "step": 25 }, { "epoch": 0.0, "learning_rate": 2.4074074074074075e-06, "loss": 1.239, "step": 26 }, { "epoch": 0.0, "learning_rate": 2.5e-06, "loss": 1.2212, "step": 27 }, { "epoch": 0.0, "learning_rate": 2.5925925925925925e-06, "loss": 1.3018, "step": 28 }, { "epoch": 0.0, "learning_rate": 2.6851851851851856e-06, "loss": 1.2471, "step": 29 }, { "epoch": 0.0, "learning_rate": 2.7777777777777783e-06, "loss": 1.2429, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.8703703703703706e-06, "loss": 1.1785, "step": 31 }, { "epoch": 0.0, "learning_rate": 2.962962962962963e-06, "loss": 1.0918, "step": 32 }, { "epoch": 0.0, "learning_rate": 3.055555555555556e-06, "loss": 1.2007, "step": 33 }, { "epoch": 0.0, "learning_rate": 3.1481481481481483e-06, "loss": 1.1787, "step": 34 }, { "epoch": 0.0, "learning_rate": 3.240740740740741e-06, "loss": 1.2004, "step": 35 }, { "epoch": 0.01, "learning_rate": 3.3333333333333333e-06, "loss": 1.1362, "step": 36 }, { "epoch": 0.01, "learning_rate": 3.4259259259259265e-06, "loss": 1.0535, "step": 37 }, { "epoch": 0.01, "learning_rate": 3.5185185185185187e-06, "loss": 1.217, "step": 38 }, { "epoch": 0.01, "learning_rate": 3.6111111111111115e-06, "loss": 1.1851, "step": 39 }, { "epoch": 0.01, "learning_rate": 3.7037037037037037e-06, "loss": 1.1392, "step": 40 }, { "epoch": 0.01, "learning_rate": 3.796296296296297e-06, "loss": 1.1057, "step": 41 }, { "epoch": 0.01, "learning_rate": 3.88888888888889e-06, "loss": 1.0376, "step": 42 }, { "epoch": 0.01, "learning_rate": 3.9814814814814814e-06, "loss": 1.0496, "step": 43 }, { "epoch": 0.01, "learning_rate": 4.074074074074074e-06, "loss": 1.1035, "step": 44 }, { "epoch": 0.01, "learning_rate": 4.166666666666667e-06, "loss": 1.1025, "step": 45 }, { "epoch": 0.01, "learning_rate": 4.2592592592592596e-06, "loss": 1.1487, "step": 46 }, { "epoch": 0.01, "learning_rate": 4.351851851851852e-06, "loss": 1.1082, "step": 47 }, { "epoch": 0.01, "learning_rate": 4.444444444444444e-06, "loss": 1.0774, "step": 48 }, { "epoch": 0.01, "learning_rate": 4.537037037037038e-06, "loss": 1.0955, "step": 49 }, { "epoch": 0.01, "learning_rate": 4.62962962962963e-06, "loss": 1.0767, "step": 50 }, { "epoch": 0.01, "learning_rate": 4.722222222222222e-06, "loss": 1.1257, "step": 51 }, { "epoch": 0.01, "learning_rate": 4.814814814814815e-06, "loss": 1.0845, "step": 52 }, { "epoch": 0.01, "learning_rate": 4.907407407407408e-06, "loss": 1.0684, "step": 53 }, { "epoch": 0.01, "learning_rate": 5e-06, "loss": 1.0945, "step": 54 }, { "epoch": 0.01, "learning_rate": 5.092592592592593e-06, "loss": 1.0991, "step": 55 }, { "epoch": 0.01, "learning_rate": 5.185185185185185e-06, "loss": 1.0149, "step": 56 }, { "epoch": 0.01, "learning_rate": 5.2777777777777785e-06, "loss": 1.0457, "step": 57 }, { "epoch": 0.01, "learning_rate": 5.370370370370371e-06, "loss": 0.9873, "step": 58 }, { "epoch": 0.01, "learning_rate": 5.462962962962963e-06, "loss": 1.0586, "step": 59 }, { "epoch": 0.01, "learning_rate": 5.555555555555557e-06, "loss": 1.0447, "step": 60 }, { "epoch": 0.01, "learning_rate": 5.6481481481481485e-06, "loss": 1.0076, "step": 61 }, { "epoch": 0.01, "learning_rate": 5.740740740740741e-06, "loss": 1.0652, "step": 62 }, { "epoch": 0.01, "learning_rate": 5.833333333333334e-06, "loss": 1.0171, "step": 63 }, { "epoch": 0.01, "learning_rate": 5.925925925925926e-06, "loss": 1.1018, "step": 64 }, { "epoch": 0.01, "learning_rate": 6.018518518518519e-06, "loss": 1.0356, "step": 65 }, { "epoch": 0.01, "learning_rate": 6.111111111111112e-06, "loss": 1.0315, "step": 66 }, { "epoch": 0.01, "learning_rate": 6.203703703703704e-06, "loss": 1.0608, "step": 67 }, { "epoch": 0.01, "learning_rate": 6.296296296296297e-06, "loss": 1.0288, "step": 68 }, { "epoch": 0.01, "learning_rate": 6.3888888888888885e-06, "loss": 1.0647, "step": 69 }, { "epoch": 0.01, "learning_rate": 6.481481481481482e-06, "loss": 0.9517, "step": 70 }, { "epoch": 0.01, "learning_rate": 6.574074074074075e-06, "loss": 1.0269, "step": 71 }, { "epoch": 0.01, "learning_rate": 6.666666666666667e-06, "loss": 0.7502, "step": 72 }, { "epoch": 0.01, "learning_rate": 6.75925925925926e-06, "loss": 1.0635, "step": 73 }, { "epoch": 0.01, "learning_rate": 6.851851851851853e-06, "loss": 1.0312, "step": 74 }, { "epoch": 0.01, "learning_rate": 6.944444444444445e-06, "loss": 1.0886, "step": 75 }, { "epoch": 0.01, "learning_rate": 7.0370370370370375e-06, "loss": 1.0422, "step": 76 }, { "epoch": 0.01, "learning_rate": 7.129629629629629e-06, "loss": 1.0437, "step": 77 }, { "epoch": 0.01, "learning_rate": 7.222222222222223e-06, "loss": 0.7366, "step": 78 }, { "epoch": 0.01, "learning_rate": 7.314814814814816e-06, "loss": 1.0461, "step": 79 }, { "epoch": 0.01, "learning_rate": 7.4074074074074075e-06, "loss": 1.0801, "step": 80 }, { "epoch": 0.01, "learning_rate": 7.500000000000001e-06, "loss": 0.6398, "step": 81 }, { "epoch": 0.01, "learning_rate": 7.592592592592594e-06, "loss": 1.001, "step": 82 }, { "epoch": 0.01, "learning_rate": 7.685185185185185e-06, "loss": 1.0457, "step": 83 }, { "epoch": 0.01, "learning_rate": 7.77777777777778e-06, "loss": 1.0798, "step": 84 }, { "epoch": 0.01, "learning_rate": 7.870370370370372e-06, "loss": 1.04, "step": 85 }, { "epoch": 0.01, "learning_rate": 7.962962962962963e-06, "loss": 1.0405, "step": 86 }, { "epoch": 0.01, "learning_rate": 8.055555555555557e-06, "loss": 1.0088, "step": 87 }, { "epoch": 0.01, "learning_rate": 8.148148148148148e-06, "loss": 0.6862, "step": 88 }, { "epoch": 0.01, "learning_rate": 8.240740740740741e-06, "loss": 0.6724, "step": 89 }, { "epoch": 0.01, "learning_rate": 8.333333333333334e-06, "loss": 0.9912, "step": 90 }, { "epoch": 0.01, "learning_rate": 8.425925925925926e-06, "loss": 0.9688, "step": 91 }, { "epoch": 0.01, "learning_rate": 8.518518518518519e-06, "loss": 0.9841, "step": 92 }, { "epoch": 0.01, "learning_rate": 8.611111111111112e-06, "loss": 0.6307, "step": 93 }, { "epoch": 0.01, "learning_rate": 8.703703703703705e-06, "loss": 0.991, "step": 94 }, { "epoch": 0.01, "learning_rate": 8.796296296296297e-06, "loss": 0.9741, "step": 95 }, { "epoch": 0.01, "learning_rate": 8.888888888888888e-06, "loss": 0.9829, "step": 96 }, { "epoch": 0.01, "learning_rate": 8.981481481481483e-06, "loss": 0.9756, "step": 97 }, { "epoch": 0.01, "learning_rate": 9.074074074074075e-06, "loss": 1.0005, "step": 98 }, { "epoch": 0.01, "learning_rate": 9.166666666666666e-06, "loss": 0.6918, "step": 99 }, { "epoch": 0.01, "learning_rate": 9.25925925925926e-06, "loss": 0.9692, "step": 100 }, { "epoch": 0.01, "learning_rate": 9.351851851851854e-06, "loss": 0.9951, "step": 101 }, { "epoch": 0.01, "learning_rate": 9.444444444444445e-06, "loss": 0.9995, "step": 102 }, { "epoch": 0.01, "learning_rate": 9.537037037037037e-06, "loss": 1.0381, "step": 103 }, { "epoch": 0.01, "learning_rate": 9.62962962962963e-06, "loss": 1.0452, "step": 104 }, { "epoch": 0.01, "learning_rate": 9.722222222222223e-06, "loss": 1.0095, "step": 105 }, { "epoch": 0.01, "learning_rate": 9.814814814814815e-06, "loss": 0.991, "step": 106 }, { "epoch": 0.01, "learning_rate": 9.907407407407408e-06, "loss": 0.6447, "step": 107 }, { "epoch": 0.02, "learning_rate": 1e-05, "loss": 0.9778, "step": 108 }, { "epoch": 0.02, "learning_rate": 1.0092592592592594e-05, "loss": 0.998, "step": 109 }, { "epoch": 0.02, "learning_rate": 1.0185185185185186e-05, "loss": 1.0188, "step": 110 }, { "epoch": 0.02, "learning_rate": 1.0277777777777777e-05, "loss": 0.9729, "step": 111 }, { "epoch": 0.02, "learning_rate": 1.037037037037037e-05, "loss": 0.6531, "step": 112 }, { "epoch": 0.02, "learning_rate": 1.0462962962962964e-05, "loss": 0.6668, "step": 113 }, { "epoch": 0.02, "learning_rate": 1.0555555555555557e-05, "loss": 1.0403, "step": 114 }, { "epoch": 0.02, "learning_rate": 1.064814814814815e-05, "loss": 1.0598, "step": 115 }, { "epoch": 0.02, "learning_rate": 1.0740740740740742e-05, "loss": 0.9399, "step": 116 }, { "epoch": 0.02, "learning_rate": 1.0833333333333334e-05, "loss": 1.0017, "step": 117 }, { "epoch": 0.02, "learning_rate": 1.0925925925925926e-05, "loss": 1.0034, "step": 118 }, { "epoch": 0.02, "learning_rate": 1.1018518518518519e-05, "loss": 0.9863, "step": 119 }, { "epoch": 0.02, "learning_rate": 1.1111111111111113e-05, "loss": 0.9985, "step": 120 }, { "epoch": 0.02, "learning_rate": 1.1203703703703706e-05, "loss": 1.0347, "step": 121 }, { "epoch": 0.02, "learning_rate": 1.1296296296296297e-05, "loss": 1.0413, "step": 122 }, { "epoch": 0.02, "learning_rate": 1.138888888888889e-05, "loss": 1.0461, "step": 123 }, { "epoch": 0.02, "learning_rate": 1.1481481481481482e-05, "loss": 0.9878, "step": 124 }, { "epoch": 0.02, "learning_rate": 1.1574074074074075e-05, "loss": 0.9836, "step": 125 }, { "epoch": 0.02, "learning_rate": 1.1666666666666668e-05, "loss": 0.9636, "step": 126 }, { "epoch": 0.02, "learning_rate": 1.1759259259259259e-05, "loss": 0.9763, "step": 127 }, { "epoch": 0.02, "learning_rate": 1.1851851851851852e-05, "loss": 1.0042, "step": 128 }, { "epoch": 0.02, "learning_rate": 1.1944444444444444e-05, "loss": 0.9934, "step": 129 }, { "epoch": 0.02, "learning_rate": 1.2037037037037039e-05, "loss": 0.9824, "step": 130 }, { "epoch": 0.02, "learning_rate": 1.2129629629629631e-05, "loss": 0.9846, "step": 131 }, { "epoch": 0.02, "learning_rate": 1.2222222222222224e-05, "loss": 1.0708, "step": 132 }, { "epoch": 0.02, "learning_rate": 1.2314814814814815e-05, "loss": 0.981, "step": 133 }, { "epoch": 0.02, "learning_rate": 1.2407407407407408e-05, "loss": 1.0671, "step": 134 }, { "epoch": 0.02, "learning_rate": 1.25e-05, "loss": 1.0369, "step": 135 }, { "epoch": 0.02, "learning_rate": 1.2592592592592593e-05, "loss": 0.9382, "step": 136 }, { "epoch": 0.02, "learning_rate": 1.2685185185185188e-05, "loss": 0.9146, "step": 137 }, { "epoch": 0.02, "learning_rate": 1.2777777777777777e-05, "loss": 0.9578, "step": 138 }, { "epoch": 0.02, "learning_rate": 1.2870370370370371e-05, "loss": 0.9995, "step": 139 }, { "epoch": 0.02, "learning_rate": 1.2962962962962964e-05, "loss": 1.0576, "step": 140 }, { "epoch": 0.02, "learning_rate": 1.3055555555555557e-05, "loss": 1.0457, "step": 141 }, { "epoch": 0.02, "learning_rate": 1.314814814814815e-05, "loss": 0.9414, "step": 142 }, { "epoch": 0.02, "learning_rate": 1.3240740740740742e-05, "loss": 1.0159, "step": 143 }, { "epoch": 0.02, "learning_rate": 1.3333333333333333e-05, "loss": 0.9668, "step": 144 }, { "epoch": 0.02, "learning_rate": 1.3425925925925926e-05, "loss": 1.0334, "step": 145 }, { "epoch": 0.02, "learning_rate": 1.351851851851852e-05, "loss": 1.0312, "step": 146 }, { "epoch": 0.02, "learning_rate": 1.3611111111111113e-05, "loss": 0.9426, "step": 147 }, { "epoch": 0.02, "learning_rate": 1.3703703703703706e-05, "loss": 1.0029, "step": 148 }, { "epoch": 0.02, "learning_rate": 1.3796296296296297e-05, "loss": 1.0076, "step": 149 }, { "epoch": 0.02, "learning_rate": 1.388888888888889e-05, "loss": 0.9937, "step": 150 }, { "epoch": 0.02, "learning_rate": 1.3981481481481482e-05, "loss": 1.032, "step": 151 }, { "epoch": 0.02, "learning_rate": 1.4074074074074075e-05, "loss": 0.9216, "step": 152 }, { "epoch": 0.02, "learning_rate": 1.416666666666667e-05, "loss": 1.0295, "step": 153 }, { "epoch": 0.02, "learning_rate": 1.4259259259259259e-05, "loss": 1.001, "step": 154 }, { "epoch": 0.02, "learning_rate": 1.4351851851851853e-05, "loss": 0.9761, "step": 155 }, { "epoch": 0.02, "learning_rate": 1.4444444444444446e-05, "loss": 1.0581, "step": 156 }, { "epoch": 0.02, "learning_rate": 1.4537037037037039e-05, "loss": 0.9802, "step": 157 }, { "epoch": 0.02, "learning_rate": 1.4629629629629631e-05, "loss": 1.0486, "step": 158 }, { "epoch": 0.02, "learning_rate": 1.4722222222222224e-05, "loss": 1.0442, "step": 159 }, { "epoch": 0.02, "learning_rate": 1.4814814814814815e-05, "loss": 0.9592, "step": 160 }, { "epoch": 0.02, "learning_rate": 1.4907407407407408e-05, "loss": 0.9634, "step": 161 }, { "epoch": 0.02, "learning_rate": 1.5000000000000002e-05, "loss": 0.6413, "step": 162 }, { "epoch": 0.02, "learning_rate": 1.5092592592592595e-05, "loss": 1.0393, "step": 163 }, { "epoch": 0.02, "learning_rate": 1.5185185185185187e-05, "loss": 0.9976, "step": 164 }, { "epoch": 0.02, "learning_rate": 1.5277777777777777e-05, "loss": 0.9814, "step": 165 }, { "epoch": 0.02, "learning_rate": 1.537037037037037e-05, "loss": 0.9727, "step": 166 }, { "epoch": 0.02, "learning_rate": 1.5462962962962966e-05, "loss": 0.9946, "step": 167 }, { "epoch": 0.02, "learning_rate": 1.555555555555556e-05, "loss": 0.9812, "step": 168 }, { "epoch": 0.02, "learning_rate": 1.564814814814815e-05, "loss": 0.6392, "step": 169 }, { "epoch": 0.02, "learning_rate": 1.5740740740740744e-05, "loss": 1.0095, "step": 170 }, { "epoch": 0.02, "learning_rate": 1.5833333333333333e-05, "loss": 0.9954, "step": 171 }, { "epoch": 0.02, "learning_rate": 1.5925925925925926e-05, "loss": 0.999, "step": 172 }, { "epoch": 0.02, "learning_rate": 1.601851851851852e-05, "loss": 0.9993, "step": 173 }, { "epoch": 0.02, "learning_rate": 1.6111111111111115e-05, "loss": 0.915, "step": 174 }, { "epoch": 0.02, "learning_rate": 1.6203703703703707e-05, "loss": 0.6149, "step": 175 }, { "epoch": 0.02, "learning_rate": 1.6296296296296297e-05, "loss": 1.0339, "step": 176 }, { "epoch": 0.02, "learning_rate": 1.638888888888889e-05, "loss": 0.9932, "step": 177 }, { "epoch": 0.02, "learning_rate": 1.6481481481481482e-05, "loss": 0.9021, "step": 178 }, { "epoch": 0.02, "learning_rate": 1.6574074074074075e-05, "loss": 1.033, "step": 179 }, { "epoch": 0.03, "learning_rate": 1.6666666666666667e-05, "loss": 0.9187, "step": 180 }, { "epoch": 0.03, "learning_rate": 1.675925925925926e-05, "loss": 1.0264, "step": 181 }, { "epoch": 0.03, "learning_rate": 1.6851851851851853e-05, "loss": 0.9255, "step": 182 }, { "epoch": 0.03, "learning_rate": 1.6944444444444446e-05, "loss": 1.0688, "step": 183 }, { "epoch": 0.03, "learning_rate": 1.7037037037037038e-05, "loss": 0.9548, "step": 184 }, { "epoch": 0.03, "learning_rate": 1.712962962962963e-05, "loss": 0.9978, "step": 185 }, { "epoch": 0.03, "learning_rate": 1.7222222222222224e-05, "loss": 0.98, "step": 186 }, { "epoch": 0.03, "learning_rate": 1.7314814814814816e-05, "loss": 0.9878, "step": 187 }, { "epoch": 0.03, "learning_rate": 1.740740740740741e-05, "loss": 0.999, "step": 188 }, { "epoch": 0.03, "learning_rate": 1.7500000000000002e-05, "loss": 1.0122, "step": 189 }, { "epoch": 0.03, "learning_rate": 1.7592592592592595e-05, "loss": 0.9441, "step": 190 }, { "epoch": 0.03, "learning_rate": 1.7685185185185187e-05, "loss": 0.9617, "step": 191 }, { "epoch": 0.03, "learning_rate": 1.7777777777777777e-05, "loss": 1.0168, "step": 192 }, { "epoch": 0.03, "learning_rate": 1.7870370370370373e-05, "loss": 1.0115, "step": 193 }, { "epoch": 0.03, "learning_rate": 1.7962962962962965e-05, "loss": 0.9148, "step": 194 }, { "epoch": 0.03, "learning_rate": 1.8055555555555558e-05, "loss": 1.0098, "step": 195 }, { "epoch": 0.03, "learning_rate": 1.814814814814815e-05, "loss": 1.0439, "step": 196 }, { "epoch": 0.03, "learning_rate": 1.8240740740740744e-05, "loss": 1.0437, "step": 197 }, { "epoch": 0.03, "learning_rate": 1.8333333333333333e-05, "loss": 0.9888, "step": 198 }, { "epoch": 0.03, "learning_rate": 1.8425925925925926e-05, "loss": 1.0012, "step": 199 }, { "epoch": 0.03, "learning_rate": 1.851851851851852e-05, "loss": 0.9478, "step": 200 }, { "epoch": 0.03, "learning_rate": 1.8611111111111114e-05, "loss": 0.9707, "step": 201 }, { "epoch": 0.03, "learning_rate": 1.8703703703703707e-05, "loss": 0.928, "step": 202 }, { "epoch": 0.03, "learning_rate": 1.8796296296296296e-05, "loss": 0.9644, "step": 203 }, { "epoch": 0.03, "learning_rate": 1.888888888888889e-05, "loss": 1.0059, "step": 204 }, { "epoch": 0.03, "learning_rate": 1.8981481481481482e-05, "loss": 0.9678, "step": 205 }, { "epoch": 0.03, "learning_rate": 1.9074074074074075e-05, "loss": 1.0271, "step": 206 }, { "epoch": 0.03, "learning_rate": 1.916666666666667e-05, "loss": 0.9946, "step": 207 }, { "epoch": 0.03, "learning_rate": 1.925925925925926e-05, "loss": 1.0366, "step": 208 }, { "epoch": 0.03, "learning_rate": 1.9351851851851853e-05, "loss": 1.0571, "step": 209 }, { "epoch": 0.03, "learning_rate": 1.9444444444444445e-05, "loss": 1.0198, "step": 210 }, { "epoch": 0.03, "learning_rate": 1.9537037037037038e-05, "loss": 0.999, "step": 211 }, { "epoch": 0.03, "learning_rate": 1.962962962962963e-05, "loss": 0.9922, "step": 212 }, { "epoch": 0.03, "learning_rate": 1.9722222222222224e-05, "loss": 0.9832, "step": 213 }, { "epoch": 0.03, "learning_rate": 1.9814814814814816e-05, "loss": 0.6103, "step": 214 }, { "epoch": 0.03, "learning_rate": 1.990740740740741e-05, "loss": 1.0217, "step": 215 }, { "epoch": 0.03, "learning_rate": 2e-05, "loss": 0.9609, "step": 216 }, { "epoch": 0.03, "learning_rate": 1.999999898798801e-05, "loss": 0.9578, "step": 217 }, { "epoch": 0.03, "learning_rate": 1.9999995951952243e-05, "loss": 0.9233, "step": 218 }, { "epoch": 0.03, "learning_rate": 1.9999990891893314e-05, "loss": 0.9048, "step": 219 }, { "epoch": 0.03, "learning_rate": 1.9999983807812244e-05, "loss": 1.001, "step": 220 }, { "epoch": 0.03, "learning_rate": 1.9999974699710472e-05, "loss": 0.6437, "step": 221 }, { "epoch": 0.03, "learning_rate": 1.9999963567589836e-05, "loss": 0.9202, "step": 222 }, { "epoch": 0.03, "learning_rate": 1.9999950411452595e-05, "loss": 0.9445, "step": 223 }, { "epoch": 0.03, "learning_rate": 1.9999935231301405e-05, "loss": 0.9968, "step": 224 }, { "epoch": 0.03, "learning_rate": 1.9999918027139346e-05, "loss": 0.9292, "step": 225 }, { "epoch": 0.03, "learning_rate": 1.9999898798969898e-05, "loss": 1.0295, "step": 226 }, { "epoch": 0.03, "learning_rate": 1.9999877546796947e-05, "loss": 0.9895, "step": 227 }, { "epoch": 0.03, "learning_rate": 1.9999854270624803e-05, "loss": 0.9556, "step": 228 }, { "epoch": 0.03, "learning_rate": 1.999982897045817e-05, "loss": 1.0449, "step": 229 }, { "epoch": 0.03, "learning_rate": 1.9999801646302175e-05, "loss": 0.9634, "step": 230 }, { "epoch": 0.03, "learning_rate": 1.9999772298162344e-05, "loss": 1.0159, "step": 231 }, { "epoch": 0.03, "learning_rate": 1.9999740926044618e-05, "loss": 0.9624, "step": 232 }, { "epoch": 0.03, "learning_rate": 1.999970752995535e-05, "loss": 0.988, "step": 233 }, { "epoch": 0.03, "learning_rate": 1.9999672109901293e-05, "loss": 1.0029, "step": 234 }, { "epoch": 0.03, "learning_rate": 1.999963466588962e-05, "loss": 1.0005, "step": 235 }, { "epoch": 0.03, "learning_rate": 1.9999595197927914e-05, "loss": 0.9832, "step": 236 }, { "epoch": 0.03, "learning_rate": 1.9999553706024153e-05, "loss": 0.9968, "step": 237 }, { "epoch": 0.03, "learning_rate": 1.9999510190186745e-05, "loss": 0.9937, "step": 238 }, { "epoch": 0.03, "learning_rate": 1.9999464650424493e-05, "loss": 0.9546, "step": 239 }, { "epoch": 0.03, "learning_rate": 1.9999417086746616e-05, "loss": 0.8933, "step": 240 }, { "epoch": 0.03, "learning_rate": 1.9999367499162736e-05, "loss": 1.0039, "step": 241 }, { "epoch": 0.03, "learning_rate": 1.99993158876829e-05, "loss": 0.9988, "step": 242 }, { "epoch": 0.03, "learning_rate": 1.9999262252317545e-05, "loss": 0.9348, "step": 243 }, { "epoch": 0.03, "learning_rate": 1.9999206593077528e-05, "loss": 0.9546, "step": 244 }, { "epoch": 0.03, "learning_rate": 1.999914890997412e-05, "loss": 0.9885, "step": 245 }, { "epoch": 0.03, "learning_rate": 1.9999089203018994e-05, "loss": 0.9697, "step": 246 }, { "epoch": 0.03, "learning_rate": 1.999902747222423e-05, "loss": 1.012, "step": 247 }, { "epoch": 0.03, "learning_rate": 1.9998963717602327e-05, "loss": 0.9922, "step": 248 }, { "epoch": 0.03, "learning_rate": 1.999889793916619e-05, "loss": 1.0073, "step": 249 }, { "epoch": 0.03, "learning_rate": 1.9998830136929128e-05, "loss": 0.9766, "step": 250 }, { "epoch": 0.03, "learning_rate": 1.999876031090487e-05, "loss": 1.0234, "step": 251 }, { "epoch": 0.04, "learning_rate": 1.999868846110754e-05, "loss": 1.0317, "step": 252 }, { "epoch": 0.04, "learning_rate": 1.9998614587551695e-05, "loss": 1.0002, "step": 253 }, { "epoch": 0.04, "learning_rate": 1.9998538690252277e-05, "loss": 1.0203, "step": 254 }, { "epoch": 0.04, "learning_rate": 1.999846076922465e-05, "loss": 1.0071, "step": 255 }, { "epoch": 0.04, "learning_rate": 1.999838082448458e-05, "loss": 0.9548, "step": 256 }, { "epoch": 0.04, "learning_rate": 1.9998298856048257e-05, "loss": 1.0056, "step": 257 }, { "epoch": 0.04, "learning_rate": 1.999821486393227e-05, "loss": 0.9766, "step": 258 }, { "epoch": 0.04, "learning_rate": 1.9998128848153613e-05, "loss": 0.9924, "step": 259 }, { "epoch": 0.04, "learning_rate": 1.99980408087297e-05, "loss": 0.9968, "step": 260 }, { "epoch": 0.04, "learning_rate": 1.9997950745678354e-05, "loss": 0.9375, "step": 261 }, { "epoch": 0.04, "learning_rate": 1.9997858659017795e-05, "loss": 1.0149, "step": 262 }, { "epoch": 0.04, "learning_rate": 1.9997764548766668e-05, "loss": 0.9341, "step": 263 }, { "epoch": 0.04, "learning_rate": 1.9997668414944025e-05, "loss": 0.312, "step": 264 }, { "epoch": 0.04, "learning_rate": 1.9997570257569313e-05, "loss": 1.02, "step": 265 }, { "epoch": 0.04, "learning_rate": 1.9997470076662405e-05, "loss": 0.9814, "step": 266 }, { "epoch": 0.04, "learning_rate": 1.999736787224358e-05, "loss": 0.9719, "step": 267 }, { "epoch": 0.04, "learning_rate": 1.9997263644333522e-05, "loss": 1.031, "step": 268 }, { "epoch": 0.04, "learning_rate": 1.9997157392953327e-05, "loss": 0.9651, "step": 269 }, { "epoch": 0.04, "learning_rate": 1.99970491181245e-05, "loss": 0.9312, "step": 270 }, { "epoch": 0.04, "learning_rate": 1.9996938819868955e-05, "loss": 1.0076, "step": 271 }, { "epoch": 0.04, "learning_rate": 1.999682649820902e-05, "loss": 1.0137, "step": 272 }, { "epoch": 0.04, "learning_rate": 1.999671215316743e-05, "loss": 0.6426, "step": 273 }, { "epoch": 0.04, "learning_rate": 1.9996595784767322e-05, "loss": 1.0073, "step": 274 }, { "epoch": 0.04, "learning_rate": 1.9996477393032254e-05, "loss": 0.9561, "step": 275 }, { "epoch": 0.04, "learning_rate": 1.9996356977986193e-05, "loss": 0.9155, "step": 276 }, { "epoch": 0.04, "learning_rate": 1.99962345396535e-05, "loss": 0.9343, "step": 277 }, { "epoch": 0.04, "learning_rate": 1.999611007805897e-05, "loss": 0.969, "step": 278 }, { "epoch": 0.04, "learning_rate": 1.999598359322778e-05, "loss": 0.6214, "step": 279 }, { "epoch": 0.04, "learning_rate": 1.9995855085185544e-05, "loss": 0.9775, "step": 280 }, { "epoch": 0.04, "learning_rate": 1.9995724553958268e-05, "loss": 0.9895, "step": 281 }, { "epoch": 0.04, "learning_rate": 1.9995591999572367e-05, "loss": 0.8748, "step": 282 }, { "epoch": 0.04, "learning_rate": 1.9995457422054675e-05, "loss": 1.0227, "step": 283 }, { "epoch": 0.04, "learning_rate": 1.999532082143243e-05, "loss": 0.9829, "step": 284 }, { "epoch": 0.04, "learning_rate": 1.9995182197733277e-05, "loss": 0.9873, "step": 285 }, { "epoch": 0.04, "learning_rate": 1.9995041550985282e-05, "loss": 0.9973, "step": 286 }, { "epoch": 0.04, "learning_rate": 1.9994898881216905e-05, "loss": 1.0293, "step": 287 }, { "epoch": 0.04, "learning_rate": 1.9994754188457022e-05, "loss": 0.9612, "step": 288 }, { "epoch": 0.04, "learning_rate": 1.9994607472734925e-05, "loss": 0.9556, "step": 289 }, { "epoch": 0.04, "learning_rate": 1.999445873408031e-05, "loss": 0.917, "step": 290 }, { "epoch": 0.04, "learning_rate": 1.9994307972523272e-05, "loss": 1.0569, "step": 291 }, { "epoch": 0.04, "learning_rate": 1.9994155188094338e-05, "loss": 0.9946, "step": 292 }, { "epoch": 0.04, "learning_rate": 1.9994000380824423e-05, "loss": 0.9507, "step": 293 }, { "epoch": 0.04, "learning_rate": 1.9993843550744864e-05, "loss": 0.9431, "step": 294 }, { "epoch": 0.04, "learning_rate": 1.99936846978874e-05, "loss": 1.0049, "step": 295 }, { "epoch": 0.04, "learning_rate": 1.999352382228419e-05, "loss": 0.9387, "step": 296 }, { "epoch": 0.04, "learning_rate": 1.9993360923967792e-05, "loss": 0.9827, "step": 297 }, { "epoch": 0.04, "learning_rate": 1.9993196002971177e-05, "loss": 0.9343, "step": 298 }, { "epoch": 0.04, "learning_rate": 1.9993029059327725e-05, "loss": 1.0059, "step": 299 }, { "epoch": 0.04, "learning_rate": 1.9992860093071225e-05, "loss": 0.9536, "step": 300 }, { "epoch": 0.04, "learning_rate": 1.999268910423588e-05, "loss": 1.0002, "step": 301 }, { "epoch": 0.04, "learning_rate": 1.9992516092856294e-05, "loss": 0.9414, "step": 302 }, { "epoch": 0.04, "learning_rate": 1.9992341058967487e-05, "loss": 1.0308, "step": 303 }, { "epoch": 0.04, "learning_rate": 1.9992164002604887e-05, "loss": 1.0293, "step": 304 }, { "epoch": 0.04, "learning_rate": 1.999198492380433e-05, "loss": 1.0317, "step": 305 }, { "epoch": 0.04, "learning_rate": 1.9991803822602063e-05, "loss": 1.0024, "step": 306 }, { "epoch": 0.04, "learning_rate": 1.9991620699034738e-05, "loss": 0.915, "step": 307 }, { "epoch": 0.04, "learning_rate": 1.9991435553139422e-05, "loss": 0.8931, "step": 308 }, { "epoch": 0.04, "learning_rate": 1.9991248384953588e-05, "loss": 0.9495, "step": 309 }, { "epoch": 0.04, "learning_rate": 1.999105919451512e-05, "loss": 0.9546, "step": 310 }, { "epoch": 0.04, "learning_rate": 1.9990867981862312e-05, "loss": 0.9614, "step": 311 }, { "epoch": 0.04, "learning_rate": 1.9990674747033864e-05, "loss": 0.9688, "step": 312 }, { "epoch": 0.04, "learning_rate": 1.999047949006889e-05, "loss": 0.9783, "step": 313 }, { "epoch": 0.04, "learning_rate": 1.9990282211006903e-05, "loss": 0.9419, "step": 314 }, { "epoch": 0.04, "learning_rate": 1.999008290988784e-05, "loss": 1.0786, "step": 315 }, { "epoch": 0.04, "learning_rate": 1.998988158675204e-05, "loss": 0.9827, "step": 316 }, { "epoch": 0.04, "learning_rate": 1.998967824164025e-05, "loss": 0.9348, "step": 317 }, { "epoch": 0.04, "learning_rate": 1.9989472874593626e-05, "loss": 0.8892, "step": 318 }, { "epoch": 0.04, "learning_rate": 1.9989265485653733e-05, "loss": 0.9458, "step": 319 }, { "epoch": 0.04, "learning_rate": 1.998905607486255e-05, "loss": 0.9019, "step": 320 }, { "epoch": 0.04, "learning_rate": 1.9988844642262462e-05, "loss": 0.9302, "step": 321 }, { "epoch": 0.04, "learning_rate": 1.9988631187896267e-05, "loss": 0.9929, "step": 322 }, { "epoch": 0.04, "learning_rate": 1.998841571180716e-05, "loss": 0.6653, "step": 323 }, { "epoch": 0.05, "learning_rate": 1.9988198214038762e-05, "loss": 0.9668, "step": 324 }, { "epoch": 0.05, "learning_rate": 1.998797869463509e-05, "loss": 0.937, "step": 325 }, { "epoch": 0.05, "learning_rate": 1.998775715364058e-05, "loss": 0.9912, "step": 326 }, { "epoch": 0.05, "learning_rate": 1.9987533591100067e-05, "loss": 0.9875, "step": 327 }, { "epoch": 0.05, "learning_rate": 1.9987308007058803e-05, "loss": 1.0093, "step": 328 }, { "epoch": 0.05, "learning_rate": 1.998708040156245e-05, "loss": 0.5928, "step": 329 }, { "epoch": 0.05, "learning_rate": 1.998685077465707e-05, "loss": 0.9392, "step": 330 }, { "epoch": 0.05, "learning_rate": 1.998661912638914e-05, "loss": 0.9753, "step": 331 }, { "epoch": 0.05, "learning_rate": 1.9986385456805554e-05, "loss": 0.9656, "step": 332 }, { "epoch": 0.05, "learning_rate": 1.99861497659536e-05, "loss": 0.9951, "step": 333 }, { "epoch": 0.05, "learning_rate": 1.998591205388099e-05, "loss": 0.9822, "step": 334 }, { "epoch": 0.05, "learning_rate": 1.9985672320635826e-05, "loss": 0.9363, "step": 335 }, { "epoch": 0.05, "learning_rate": 1.9985430566266637e-05, "loss": 0.9609, "step": 336 }, { "epoch": 0.05, "learning_rate": 1.9985186790822358e-05, "loss": 0.665, "step": 337 }, { "epoch": 0.05, "learning_rate": 1.9984940994352324e-05, "loss": 0.9902, "step": 338 }, { "epoch": 0.05, "learning_rate": 1.9984693176906286e-05, "loss": 1.03, "step": 339 }, { "epoch": 0.05, "learning_rate": 1.9984443338534406e-05, "loss": 0.9773, "step": 340 }, { "epoch": 0.05, "learning_rate": 1.998419147928725e-05, "loss": 1.0293, "step": 341 }, { "epoch": 0.05, "learning_rate": 1.998393759921579e-05, "loss": 0.9802, "step": 342 }, { "epoch": 0.05, "learning_rate": 1.9983681698371426e-05, "loss": 0.9097, "step": 343 }, { "epoch": 0.05, "learning_rate": 1.9983423776805936e-05, "loss": 0.9832, "step": 344 }, { "epoch": 0.05, "learning_rate": 1.998316383457153e-05, "loss": 0.9097, "step": 345 }, { "epoch": 0.05, "learning_rate": 1.9982901871720828e-05, "loss": 0.8677, "step": 346 }, { "epoch": 0.05, "learning_rate": 1.9982637888306845e-05, "loss": 0.9934, "step": 347 }, { "epoch": 0.05, "learning_rate": 1.9982371884383012e-05, "loss": 0.9329, "step": 348 }, { "epoch": 0.05, "learning_rate": 1.998210386000317e-05, "loss": 1.0371, "step": 349 }, { "epoch": 0.05, "learning_rate": 1.9981833815221567e-05, "loss": 0.9856, "step": 350 }, { "epoch": 0.05, "learning_rate": 1.9981561750092864e-05, "loss": 0.9509, "step": 351 }, { "epoch": 0.05, "learning_rate": 1.9981287664672123e-05, "loss": 0.967, "step": 352 }, { "epoch": 0.05, "learning_rate": 1.9981011559014824e-05, "loss": 0.895, "step": 353 }, { "epoch": 0.05, "learning_rate": 1.9980733433176844e-05, "loss": 0.9548, "step": 354 }, { "epoch": 0.05, "learning_rate": 1.9980453287214487e-05, "loss": 0.6477, "step": 355 }, { "epoch": 0.05, "learning_rate": 1.9980171121184448e-05, "loss": 0.9573, "step": 356 }, { "epoch": 0.05, "learning_rate": 1.997988693514384e-05, "loss": 0.9294, "step": 357 }, { "epoch": 0.05, "learning_rate": 1.997960072915018e-05, "loss": 0.9519, "step": 358 }, { "epoch": 0.05, "learning_rate": 1.9979312503261403e-05, "loss": 0.9861, "step": 359 }, { "epoch": 0.05, "learning_rate": 1.997902225753584e-05, "loss": 0.628, "step": 360 }, { "epoch": 0.05, "learning_rate": 1.9978729992032243e-05, "loss": 0.9797, "step": 361 }, { "epoch": 0.05, "learning_rate": 1.9978435706809764e-05, "loss": 0.9688, "step": 362 }, { "epoch": 0.05, "learning_rate": 1.997813940192797e-05, "loss": 0.9683, "step": 363 }, { "epoch": 0.05, "learning_rate": 1.997784107744683e-05, "loss": 0.9473, "step": 364 }, { "epoch": 0.05, "learning_rate": 1.9977540733426722e-05, "loss": 0.9319, "step": 365 }, { "epoch": 0.05, "learning_rate": 1.9977238369928446e-05, "loss": 0.938, "step": 366 }, { "epoch": 0.05, "learning_rate": 1.9976933987013197e-05, "loss": 1.0061, "step": 367 }, { "epoch": 0.05, "learning_rate": 1.9976627584742583e-05, "loss": 1.0098, "step": 368 }, { "epoch": 0.05, "learning_rate": 1.997631916317862e-05, "loss": 0.9512, "step": 369 }, { "epoch": 0.05, "learning_rate": 1.9976008722383733e-05, "loss": 0.9207, "step": 370 }, { "epoch": 0.05, "learning_rate": 1.9975696262420756e-05, "loss": 0.6272, "step": 371 }, { "epoch": 0.05, "learning_rate": 1.9975381783352932e-05, "loss": 0.9585, "step": 372 }, { "epoch": 0.05, "learning_rate": 1.997506528524391e-05, "loss": 1.0078, "step": 373 }, { "epoch": 0.05, "learning_rate": 1.9974746768157757e-05, "loss": 0.9844, "step": 374 }, { "epoch": 0.05, "learning_rate": 1.997442623215893e-05, "loss": 0.9951, "step": 375 }, { "epoch": 0.05, "learning_rate": 1.9974103677312323e-05, "loss": 0.9336, "step": 376 }, { "epoch": 0.05, "learning_rate": 1.9973779103683203e-05, "loss": 0.9785, "step": 377 }, { "epoch": 0.05, "learning_rate": 1.997345251133728e-05, "loss": 0.9763, "step": 378 }, { "epoch": 0.05, "learning_rate": 1.9973123900340644e-05, "loss": 0.9006, "step": 379 }, { "epoch": 0.05, "learning_rate": 1.9972793270759818e-05, "loss": 0.9382, "step": 380 }, { "epoch": 0.05, "learning_rate": 1.9972460622661715e-05, "loss": 0.9731, "step": 381 }, { "epoch": 0.05, "learning_rate": 1.9972125956113667e-05, "loss": 0.9761, "step": 382 }, { "epoch": 0.05, "learning_rate": 1.997178927118341e-05, "loss": 0.9324, "step": 383 }, { "epoch": 0.05, "learning_rate": 1.997145056793909e-05, "loss": 0.9905, "step": 384 }, { "epoch": 0.05, "learning_rate": 1.9971109846449264e-05, "loss": 0.9155, "step": 385 }, { "epoch": 0.05, "learning_rate": 1.9970767106782887e-05, "loss": 1.0613, "step": 386 }, { "epoch": 0.05, "learning_rate": 1.9970422349009343e-05, "loss": 0.5364, "step": 387 }, { "epoch": 0.05, "learning_rate": 1.99700755731984e-05, "loss": 0.9749, "step": 388 }, { "epoch": 0.05, "learning_rate": 1.9969726779420254e-05, "loss": 0.6832, "step": 389 }, { "epoch": 0.05, "learning_rate": 1.9969375967745494e-05, "loss": 0.9785, "step": 390 }, { "epoch": 0.05, "learning_rate": 1.9969023138245133e-05, "loss": 0.9182, "step": 391 }, { "epoch": 0.05, "learning_rate": 1.9968668290990583e-05, "loss": 0.884, "step": 392 }, { "epoch": 0.05, "learning_rate": 1.9968311426053663e-05, "loss": 0.9233, "step": 393 }, { "epoch": 0.05, "learning_rate": 1.99679525435066e-05, "loss": 0.9971, "step": 394 }, { "epoch": 0.05, "learning_rate": 1.996759164342204e-05, "loss": 0.9929, "step": 395 }, { "epoch": 0.06, "learning_rate": 1.996722872587303e-05, "loss": 0.9124, "step": 396 }, { "epoch": 0.06, "learning_rate": 1.996686379093302e-05, "loss": 0.9419, "step": 397 }, { "epoch": 0.06, "learning_rate": 1.9966496838675878e-05, "loss": 0.9807, "step": 398 }, { "epoch": 0.06, "learning_rate": 1.996612786917587e-05, "loss": 0.9543, "step": 399 }, { "epoch": 0.06, "learning_rate": 1.9965756882507684e-05, "loss": 0.9636, "step": 400 }, { "epoch": 0.06, "learning_rate": 1.9965383878746407e-05, "loss": 0.97, "step": 401 }, { "epoch": 0.06, "learning_rate": 1.996500885796753e-05, "loss": 1.0029, "step": 402 }, { "epoch": 0.06, "learning_rate": 1.9964631820246967e-05, "loss": 0.9404, "step": 403 }, { "epoch": 0.06, "learning_rate": 1.996425276566102e-05, "loss": 0.9204, "step": 404 }, { "epoch": 0.06, "learning_rate": 1.9963871694286423e-05, "loss": 0.8713, "step": 405 }, { "epoch": 0.06, "learning_rate": 1.9963488606200298e-05, "loss": 0.9143, "step": 406 }, { "epoch": 0.06, "learning_rate": 1.9963103501480185e-05, "loss": 0.9678, "step": 407 }, { "epoch": 0.06, "learning_rate": 1.996271638020403e-05, "loss": 1.0137, "step": 408 }, { "epoch": 0.06, "learning_rate": 1.9962327242450185e-05, "loss": 0.9897, "step": 409 }, { "epoch": 0.06, "learning_rate": 1.996193608829742e-05, "loss": 0.9338, "step": 410 }, { "epoch": 0.06, "learning_rate": 1.9961542917824895e-05, "loss": 0.9026, "step": 411 }, { "epoch": 0.06, "learning_rate": 1.9961147731112195e-05, "loss": 0.9055, "step": 412 }, { "epoch": 0.06, "learning_rate": 1.9960750528239304e-05, "loss": 0.9207, "step": 413 }, { "epoch": 0.06, "learning_rate": 1.9960351309286622e-05, "loss": 0.9373, "step": 414 }, { "epoch": 0.06, "learning_rate": 1.9959950074334946e-05, "loss": 0.968, "step": 415 }, { "epoch": 0.06, "learning_rate": 1.995954682346549e-05, "loss": 0.9971, "step": 416 }, { "epoch": 0.06, "learning_rate": 1.995914155675987e-05, "loss": 0.9856, "step": 417 }, { "epoch": 0.06, "learning_rate": 1.9958734274300116e-05, "loss": 0.9829, "step": 418 }, { "epoch": 0.06, "learning_rate": 1.9958324976168667e-05, "loss": 1.0205, "step": 419 }, { "epoch": 0.06, "learning_rate": 1.9957913662448357e-05, "loss": 1.0291, "step": 420 }, { "epoch": 0.06, "learning_rate": 1.995750033322244e-05, "loss": 0.9509, "step": 421 }, { "epoch": 0.06, "learning_rate": 1.9957084988574574e-05, "loss": 0.99, "step": 422 }, { "epoch": 0.06, "learning_rate": 1.995666762858883e-05, "loss": 0.9751, "step": 423 }, { "epoch": 0.06, "learning_rate": 1.995624825334968e-05, "loss": 0.9604, "step": 424 }, { "epoch": 0.06, "learning_rate": 1.9955826862942006e-05, "loss": 1.0044, "step": 425 }, { "epoch": 0.06, "learning_rate": 1.9955403457451097e-05, "loss": 0.555, "step": 426 }, { "epoch": 0.06, "learning_rate": 1.9954978036962655e-05, "loss": 0.6744, "step": 427 }, { "epoch": 0.06, "learning_rate": 1.9954550601562786e-05, "loss": 0.6783, "step": 428 }, { "epoch": 0.06, "learning_rate": 1.9954121151338e-05, "loss": 0.9888, "step": 429 }, { "epoch": 0.06, "learning_rate": 1.9953689686375224e-05, "loss": 1.01, "step": 430 }, { "epoch": 0.06, "learning_rate": 1.9953256206761783e-05, "loss": 0.9292, "step": 431 }, { "epoch": 0.06, "learning_rate": 1.9952820712585414e-05, "loss": 1.0208, "step": 432 }, { "epoch": 0.06, "learning_rate": 1.9952383203934267e-05, "loss": 0.989, "step": 433 }, { "epoch": 0.06, "learning_rate": 1.9951943680896893e-05, "loss": 0.9841, "step": 434 }, { "epoch": 0.06, "learning_rate": 1.9951502143562248e-05, "loss": 0.6747, "step": 435 }, { "epoch": 0.06, "learning_rate": 1.9951058592019704e-05, "loss": 0.6736, "step": 436 }, { "epoch": 0.06, "learning_rate": 1.995061302635904e-05, "loss": 0.968, "step": 437 }, { "epoch": 0.06, "learning_rate": 1.9950165446670433e-05, "loss": 0.8733, "step": 438 }, { "epoch": 0.06, "learning_rate": 1.9949715853044476e-05, "loss": 0.9487, "step": 439 }, { "epoch": 0.06, "learning_rate": 1.9949264245572172e-05, "loss": 0.9971, "step": 440 }, { "epoch": 0.06, "learning_rate": 1.9948810624344924e-05, "loss": 1.0068, "step": 441 }, { "epoch": 0.06, "learning_rate": 1.9948354989454545e-05, "loss": 1.0161, "step": 442 }, { "epoch": 0.06, "learning_rate": 1.994789734099326e-05, "loss": 0.6247, "step": 443 }, { "epoch": 0.06, "learning_rate": 1.9947437679053692e-05, "loss": 1.0073, "step": 444 }, { "epoch": 0.06, "learning_rate": 1.9946976003728888e-05, "loss": 0.9707, "step": 445 }, { "epoch": 0.06, "learning_rate": 1.9946512315112285e-05, "loss": 0.6451, "step": 446 }, { "epoch": 0.06, "learning_rate": 1.994604661329773e-05, "loss": 0.9749, "step": 447 }, { "epoch": 0.06, "learning_rate": 1.9945578898379492e-05, "loss": 0.9133, "step": 448 }, { "epoch": 0.06, "learning_rate": 1.9945109170452236e-05, "loss": 0.9219, "step": 449 }, { "epoch": 0.06, "learning_rate": 1.994463742961103e-05, "loss": 0.6088, "step": 450 }, { "epoch": 0.06, "learning_rate": 1.9944163675951364e-05, "loss": 0.6104, "step": 451 }, { "epoch": 0.06, "learning_rate": 1.9943687909569117e-05, "loss": 0.937, "step": 452 }, { "epoch": 0.06, "learning_rate": 1.9943210130560594e-05, "loss": 0.9709, "step": 453 }, { "epoch": 0.06, "learning_rate": 1.9942730339022488e-05, "loss": 0.9658, "step": 454 }, { "epoch": 0.06, "learning_rate": 1.9942248535051924e-05, "loss": 0.9326, "step": 455 }, { "epoch": 0.06, "learning_rate": 1.9941764718746413e-05, "loss": 0.9941, "step": 456 }, { "epoch": 0.06, "learning_rate": 1.9941278890203877e-05, "loss": 0.9731, "step": 457 }, { "epoch": 0.06, "learning_rate": 1.9940791049522655e-05, "loss": 0.8562, "step": 458 }, { "epoch": 0.06, "learning_rate": 1.9940301196801484e-05, "loss": 1.0295, "step": 459 }, { "epoch": 0.06, "learning_rate": 1.993980933213951e-05, "loss": 0.9353, "step": 460 }, { "epoch": 0.06, "learning_rate": 1.9939315455636293e-05, "loss": 0.8955, "step": 461 }, { "epoch": 0.06, "learning_rate": 1.993881956739179e-05, "loss": 0.9849, "step": 462 }, { "epoch": 0.06, "learning_rate": 1.9938321667506373e-05, "loss": 0.9551, "step": 463 }, { "epoch": 0.06, "learning_rate": 1.9937821756080814e-05, "loss": 0.9226, "step": 464 }, { "epoch": 0.06, "learning_rate": 1.99373198332163e-05, "loss": 0.9578, "step": 465 }, { "epoch": 0.06, "learning_rate": 1.993681589901442e-05, "loss": 0.9709, "step": 466 }, { "epoch": 0.06, "learning_rate": 1.993630995357717e-05, "loss": 0.8838, "step": 467 }, { "epoch": 0.07, "learning_rate": 1.993580199700696e-05, "loss": 0.9087, "step": 468 }, { "epoch": 0.07, "learning_rate": 1.9935292029406595e-05, "loss": 0.9761, "step": 469 }, { "epoch": 0.07, "learning_rate": 1.99347800508793e-05, "loss": 1.0298, "step": 470 }, { "epoch": 0.07, "learning_rate": 1.9934266061528694e-05, "loss": 0.9155, "step": 471 }, { "epoch": 0.07, "learning_rate": 1.9933750061458815e-05, "loss": 0.9692, "step": 472 }, { "epoch": 0.07, "learning_rate": 1.9933232050774097e-05, "loss": 0.9888, "step": 473 }, { "epoch": 0.07, "learning_rate": 1.9932712029579396e-05, "loss": 0.9507, "step": 474 }, { "epoch": 0.07, "learning_rate": 1.9932189997979953e-05, "loss": 1.0022, "step": 475 }, { "epoch": 0.07, "learning_rate": 1.9931665956081438e-05, "loss": 0.9939, "step": 476 }, { "epoch": 0.07, "learning_rate": 1.993113990398992e-05, "loss": 0.9329, "step": 477 }, { "epoch": 0.07, "learning_rate": 1.9930611841811862e-05, "loss": 0.9836, "step": 478 }, { "epoch": 0.07, "learning_rate": 1.9930081769654155e-05, "loss": 0.9976, "step": 479 }, { "epoch": 0.07, "learning_rate": 1.9929549687624084e-05, "loss": 0.9736, "step": 480 }, { "epoch": 0.07, "learning_rate": 1.992901559582934e-05, "loss": 0.9399, "step": 481 }, { "epoch": 0.07, "learning_rate": 1.9928479494378034e-05, "loss": 0.9521, "step": 482 }, { "epoch": 0.07, "learning_rate": 1.992794138337866e-05, "loss": 0.9265, "step": 483 }, { "epoch": 0.07, "learning_rate": 1.9927401262940146e-05, "loss": 0.9421, "step": 484 }, { "epoch": 0.07, "learning_rate": 1.992685913317181e-05, "loss": 0.9573, "step": 485 }, { "epoch": 0.07, "learning_rate": 1.9926314994183378e-05, "loss": 0.9434, "step": 486 }, { "epoch": 0.07, "learning_rate": 1.9925768846084983e-05, "loss": 0.8804, "step": 487 }, { "epoch": 0.07, "learning_rate": 1.9925220688987172e-05, "loss": 1.0073, "step": 488 }, { "epoch": 0.07, "learning_rate": 1.992467052300089e-05, "loss": 0.938, "step": 489 }, { "epoch": 0.07, "learning_rate": 1.9924118348237495e-05, "loss": 0.9756, "step": 490 }, { "epoch": 0.07, "learning_rate": 1.9923564164808744e-05, "loss": 0.9626, "step": 491 }, { "epoch": 0.07, "learning_rate": 1.9923007972826808e-05, "loss": 0.9595, "step": 492 }, { "epoch": 0.07, "learning_rate": 1.992244977240426e-05, "loss": 0.9148, "step": 493 }, { "epoch": 0.07, "learning_rate": 1.9921889563654083e-05, "loss": 0.6132, "step": 494 }, { "epoch": 0.07, "learning_rate": 1.9921327346689666e-05, "loss": 0.9065, "step": 495 }, { "epoch": 0.07, "learning_rate": 1.99207631216248e-05, "loss": 0.9377, "step": 496 }, { "epoch": 0.07, "learning_rate": 1.9920196888573688e-05, "loss": 0.9316, "step": 497 }, { "epoch": 0.07, "learning_rate": 1.991962864765093e-05, "loss": 0.9172, "step": 498 }, { "epoch": 0.07, "learning_rate": 1.9919058398971548e-05, "loss": 0.9229, "step": 499 }, { "epoch": 0.07, "learning_rate": 1.9918486142650957e-05, "loss": 0.9617, "step": 500 }, { "epoch": 0.07, "learning_rate": 1.991791187880499e-05, "loss": 0.908, "step": 501 }, { "epoch": 0.07, "learning_rate": 1.9917335607549867e-05, "loss": 0.9004, "step": 502 }, { "epoch": 0.07, "learning_rate": 1.9916757329002238e-05, "loss": 0.9626, "step": 503 }, { "epoch": 0.07, "learning_rate": 1.9916177043279136e-05, "loss": 0.9529, "step": 504 }, { "epoch": 0.07, "learning_rate": 1.9915594750498025e-05, "loss": 0.5842, "step": 505 }, { "epoch": 0.07, "learning_rate": 1.991501045077676e-05, "loss": 0.97, "step": 506 }, { "epoch": 0.07, "learning_rate": 1.9914424144233596e-05, "loss": 0.9873, "step": 507 }, { "epoch": 0.07, "learning_rate": 1.991383583098721e-05, "loss": 0.906, "step": 508 }, { "epoch": 0.07, "learning_rate": 1.991324551115668e-05, "loss": 0.9158, "step": 509 }, { "epoch": 0.07, "learning_rate": 1.9912653184861483e-05, "loss": 0.8477, "step": 510 }, { "epoch": 0.07, "learning_rate": 1.9912058852221506e-05, "loss": 1.0061, "step": 511 }, { "epoch": 0.07, "learning_rate": 1.991146251335705e-05, "loss": 0.6531, "step": 512 }, { "epoch": 0.07, "learning_rate": 1.991086416838881e-05, "loss": 0.9246, "step": 513 }, { "epoch": 0.07, "learning_rate": 1.9910263817437894e-05, "loss": 1.0422, "step": 514 }, { "epoch": 0.07, "learning_rate": 1.9909661460625814e-05, "loss": 0.8926, "step": 515 }, { "epoch": 0.07, "learning_rate": 1.990905709807449e-05, "loss": 0.9412, "step": 516 }, { "epoch": 0.07, "learning_rate": 1.9908450729906245e-05, "loss": 0.97, "step": 517 }, { "epoch": 0.07, "learning_rate": 1.990784235624381e-05, "loss": 0.9094, "step": 518 }, { "epoch": 0.07, "learning_rate": 1.9907231977210323e-05, "loss": 0.9438, "step": 519 }, { "epoch": 0.07, "learning_rate": 1.9906619592929326e-05, "loss": 0.9167, "step": 520 }, { "epoch": 0.07, "learning_rate": 1.990600520352476e-05, "loss": 0.9119, "step": 521 }, { "epoch": 0.07, "learning_rate": 1.990538880912099e-05, "loss": 1.0195, "step": 522 }, { "epoch": 0.07, "learning_rate": 1.9904770409842767e-05, "loss": 0.9529, "step": 523 }, { "epoch": 0.07, "learning_rate": 1.9904150005815262e-05, "loss": 0.6244, "step": 524 }, { "epoch": 0.07, "learning_rate": 1.990352759716404e-05, "loss": 0.8948, "step": 525 }, { "epoch": 0.07, "learning_rate": 1.9902903184015082e-05, "loss": 0.9512, "step": 526 }, { "epoch": 0.07, "learning_rate": 1.9902276766494776e-05, "loss": 0.9397, "step": 527 }, { "epoch": 0.07, "learning_rate": 1.99016483447299e-05, "loss": 0.6127, "step": 528 }, { "epoch": 0.07, "learning_rate": 1.9901017918847654e-05, "loss": 0.9617, "step": 529 }, { "epoch": 0.07, "learning_rate": 1.9900385488975636e-05, "loss": 0.9504, "step": 530 }, { "epoch": 0.07, "learning_rate": 1.9899751055241854e-05, "loss": 0.9084, "step": 531 }, { "epoch": 0.07, "learning_rate": 1.9899114617774717e-05, "loss": 0.9495, "step": 532 }, { "epoch": 0.07, "learning_rate": 1.989847617670304e-05, "loss": 0.9319, "step": 533 }, { "epoch": 0.07, "learning_rate": 1.9897835732156045e-05, "loss": 0.9929, "step": 534 }, { "epoch": 0.07, "learning_rate": 1.9897193284263367e-05, "loss": 0.9302, "step": 535 }, { "epoch": 0.07, "learning_rate": 1.9896548833155024e-05, "loss": 0.9893, "step": 536 }, { "epoch": 0.07, "learning_rate": 1.9895902378961473e-05, "loss": 0.6317, "step": 537 }, { "epoch": 0.07, "learning_rate": 1.9895253921813543e-05, "loss": 0.9084, "step": 538 }, { "epoch": 0.07, "learning_rate": 1.9894603461842488e-05, "loss": 0.9705, "step": 539 }, { "epoch": 0.08, "learning_rate": 1.9893950999179963e-05, "loss": 0.9143, "step": 540 }, { "epoch": 0.08, "learning_rate": 1.989329653395803e-05, "loss": 0.8982, "step": 541 }, { "epoch": 0.08, "learning_rate": 1.9892640066309154e-05, "loss": 0.9155, "step": 542 }, { "epoch": 0.08, "learning_rate": 1.98919815963662e-05, "loss": 0.9714, "step": 543 }, { "epoch": 0.08, "learning_rate": 1.9891321124262452e-05, "loss": 0.9185, "step": 544 }, { "epoch": 0.08, "learning_rate": 1.9890658650131588e-05, "loss": 1.0154, "step": 545 }, { "epoch": 0.08, "learning_rate": 1.9889994174107688e-05, "loss": 0.9292, "step": 546 }, { "epoch": 0.08, "learning_rate": 1.9889327696325254e-05, "loss": 0.9565, "step": 547 }, { "epoch": 0.08, "learning_rate": 1.9888659216919177e-05, "loss": 0.9478, "step": 548 }, { "epoch": 0.08, "learning_rate": 1.988798873602476e-05, "loss": 0.9124, "step": 549 }, { "epoch": 0.08, "learning_rate": 1.9887316253777707e-05, "loss": 1.0371, "step": 550 }, { "epoch": 0.08, "learning_rate": 1.9886641770314133e-05, "loss": 0.9238, "step": 551 }, { "epoch": 0.08, "learning_rate": 1.9885965285770556e-05, "loss": 0.9421, "step": 552 }, { "epoch": 0.08, "learning_rate": 1.9885286800283897e-05, "loss": 0.6481, "step": 553 }, { "epoch": 0.08, "learning_rate": 1.988460631399148e-05, "loss": 0.9614, "step": 554 }, { "epoch": 0.08, "learning_rate": 1.9883923827031044e-05, "loss": 0.9204, "step": 555 }, { "epoch": 0.08, "learning_rate": 1.9883239339540722e-05, "loss": 0.6005, "step": 556 }, { "epoch": 0.08, "learning_rate": 1.9882552851659055e-05, "loss": 0.9363, "step": 557 }, { "epoch": 0.08, "learning_rate": 1.9881864363524987e-05, "loss": 0.9409, "step": 558 }, { "epoch": 0.08, "learning_rate": 1.9881173875277876e-05, "loss": 0.9714, "step": 559 }, { "epoch": 0.08, "learning_rate": 1.9880481387057474e-05, "loss": 0.9807, "step": 560 }, { "epoch": 0.08, "learning_rate": 1.987978689900395e-05, "loss": 0.9614, "step": 561 }, { "epoch": 0.08, "learning_rate": 1.9879090411257857e-05, "loss": 0.9795, "step": 562 }, { "epoch": 0.08, "learning_rate": 1.9878391923960176e-05, "loss": 0.9358, "step": 563 }, { "epoch": 0.08, "learning_rate": 1.987769143725228e-05, "loss": 1.0088, "step": 564 }, { "epoch": 0.08, "learning_rate": 1.9876988951275947e-05, "loss": 0.9629, "step": 565 }, { "epoch": 0.08, "learning_rate": 1.9876284466173366e-05, "loss": 0.9956, "step": 566 }, { "epoch": 0.08, "learning_rate": 1.987557798208712e-05, "loss": 0.9663, "step": 567 }, { "epoch": 0.08, "learning_rate": 1.987486949916021e-05, "loss": 1.0022, "step": 568 }, { "epoch": 0.08, "learning_rate": 1.987415901753603e-05, "loss": 0.999, "step": 569 }, { "epoch": 0.08, "learning_rate": 1.9873446537358387e-05, "loss": 0.95, "step": 570 }, { "epoch": 0.08, "learning_rate": 1.9872732058771484e-05, "loss": 0.9316, "step": 571 }, { "epoch": 0.08, "learning_rate": 1.9872015581919936e-05, "loss": 1.0088, "step": 572 }, { "epoch": 0.08, "learning_rate": 1.987129710694876e-05, "loss": 0.9502, "step": 573 }, { "epoch": 0.08, "learning_rate": 1.9870576634003375e-05, "loss": 0.8933, "step": 574 }, { "epoch": 0.08, "learning_rate": 1.986985416322961e-05, "loss": 0.9631, "step": 575 }, { "epoch": 0.08, "learning_rate": 1.986912969477369e-05, "loss": 1.0068, "step": 576 }, { "epoch": 0.08, "learning_rate": 1.9868403228782257e-05, "loss": 0.8948, "step": 577 }, { "epoch": 0.08, "learning_rate": 1.9867674765402337e-05, "loss": 0.6697, "step": 578 }, { "epoch": 0.08, "learning_rate": 1.9866944304781385e-05, "loss": 1.0044, "step": 579 }, { "epoch": 0.08, "learning_rate": 1.986621184706724e-05, "loss": 0.9773, "step": 580 }, { "epoch": 0.08, "learning_rate": 1.986547739240816e-05, "loss": 0.9287, "step": 581 }, { "epoch": 0.08, "learning_rate": 1.9864740940952793e-05, "loss": 0.6442, "step": 582 }, { "epoch": 0.08, "learning_rate": 1.9864002492850203e-05, "loss": 0.9365, "step": 583 }, { "epoch": 0.08, "learning_rate": 1.9863262048249852e-05, "loss": 0.9329, "step": 584 }, { "epoch": 0.08, "learning_rate": 1.986251960730161e-05, "loss": 0.9473, "step": 585 }, { "epoch": 0.08, "learning_rate": 1.9861775170155748e-05, "loss": 0.6248, "step": 586 }, { "epoch": 0.08, "learning_rate": 1.986102873696294e-05, "loss": 0.905, "step": 587 }, { "epoch": 0.08, "learning_rate": 1.9860280307874266e-05, "loss": 0.6538, "step": 588 }, { "epoch": 0.08, "learning_rate": 1.9859529883041214e-05, "loss": 0.9387, "step": 589 }, { "epoch": 0.08, "learning_rate": 1.9858777462615664e-05, "loss": 0.6409, "step": 590 }, { "epoch": 0.08, "learning_rate": 1.985802304674992e-05, "loss": 0.9253, "step": 591 }, { "epoch": 0.08, "learning_rate": 1.985726663559666e-05, "loss": 0.9932, "step": 592 }, { "epoch": 0.08, "learning_rate": 1.9856508229309e-05, "loss": 0.885, "step": 593 }, { "epoch": 0.08, "learning_rate": 1.9855747828040435e-05, "loss": 0.9668, "step": 594 }, { "epoch": 0.08, "learning_rate": 1.9854985431944873e-05, "loss": 0.9709, "step": 595 }, { "epoch": 0.08, "learning_rate": 1.9854221041176628e-05, "loss": 0.9722, "step": 596 }, { "epoch": 0.08, "learning_rate": 1.9853454655890408e-05, "loss": 0.9458, "step": 597 }, { "epoch": 0.08, "learning_rate": 1.9852686276241336e-05, "loss": 0.9822, "step": 598 }, { "epoch": 0.08, "learning_rate": 1.9851915902384937e-05, "loss": 0.9243, "step": 599 }, { "epoch": 0.08, "learning_rate": 1.9851143534477127e-05, "loss": 0.5939, "step": 600 }, { "epoch": 0.08, "learning_rate": 1.985036917267425e-05, "loss": 0.9636, "step": 601 }, { "epoch": 0.08, "learning_rate": 1.984959281713302e-05, "loss": 0.9768, "step": 602 }, { "epoch": 0.08, "learning_rate": 1.9848814468010586e-05, "loss": 0.9097, "step": 603 }, { "epoch": 0.08, "learning_rate": 1.9848034125464485e-05, "loss": 0.9539, "step": 604 }, { "epoch": 0.08, "learning_rate": 1.984725178965266e-05, "loss": 0.9646, "step": 605 }, { "epoch": 0.08, "learning_rate": 1.9846467460733455e-05, "loss": 0.9534, "step": 606 }, { "epoch": 0.08, "learning_rate": 1.9845681138865624e-05, "loss": 0.9307, "step": 607 }, { "epoch": 0.08, "learning_rate": 1.9844892824208318e-05, "loss": 0.9221, "step": 608 }, { "epoch": 0.08, "learning_rate": 1.9844102516921095e-05, "loss": 0.9524, "step": 609 }, { "epoch": 0.08, "learning_rate": 1.9843310217163917e-05, "loss": 0.9285, "step": 610 }, { "epoch": 0.08, "learning_rate": 1.984251592509714e-05, "loss": 0.9392, "step": 611 }, { "epoch": 0.09, "learning_rate": 1.984171964088154e-05, "loss": 0.9128, "step": 612 }, { "epoch": 0.09, "learning_rate": 1.9840921364678278e-05, "loss": 0.9006, "step": 613 }, { "epoch": 0.09, "learning_rate": 1.9840121096648933e-05, "loss": 0.8909, "step": 614 }, { "epoch": 0.09, "learning_rate": 1.9839318836955482e-05, "loss": 0.9236, "step": 615 }, { "epoch": 0.09, "learning_rate": 1.98385145857603e-05, "loss": 0.9563, "step": 616 }, { "epoch": 0.09, "learning_rate": 1.9837708343226173e-05, "loss": 0.9109, "step": 617 }, { "epoch": 0.09, "learning_rate": 1.983690010951628e-05, "loss": 0.9424, "step": 618 }, { "epoch": 0.09, "learning_rate": 1.983608988479422e-05, "loss": 0.853, "step": 619 }, { "epoch": 0.09, "learning_rate": 1.9835277669223974e-05, "loss": 0.8711, "step": 620 }, { "epoch": 0.09, "learning_rate": 1.9834463462969944e-05, "loss": 0.9519, "step": 621 }, { "epoch": 0.09, "learning_rate": 1.9833647266196924e-05, "loss": 1.0225, "step": 622 }, { "epoch": 0.09, "learning_rate": 1.983282907907011e-05, "loss": 0.9263, "step": 623 }, { "epoch": 0.09, "learning_rate": 1.9832008901755115e-05, "loss": 0.666, "step": 624 }, { "epoch": 0.09, "learning_rate": 1.9831186734417937e-05, "loss": 0.9534, "step": 625 }, { "epoch": 0.09, "learning_rate": 1.983036257722499e-05, "loss": 0.9941, "step": 626 }, { "epoch": 0.09, "learning_rate": 1.9829536430343077e-05, "loss": 0.958, "step": 627 }, { "epoch": 0.09, "learning_rate": 1.9828708293939417e-05, "loss": 0.9324, "step": 628 }, { "epoch": 0.09, "learning_rate": 1.9827878168181634e-05, "loss": 0.9841, "step": 629 }, { "epoch": 0.09, "learning_rate": 1.9827046053237736e-05, "loss": 0.9475, "step": 630 }, { "epoch": 0.09, "learning_rate": 1.982621194927615e-05, "loss": 0.9211, "step": 631 }, { "epoch": 0.09, "learning_rate": 1.9825375856465703e-05, "loss": 0.9758, "step": 632 }, { "epoch": 0.09, "learning_rate": 1.9824537774975615e-05, "loss": 0.9351, "step": 633 }, { "epoch": 0.09, "learning_rate": 1.9823697704975523e-05, "loss": 0.9741, "step": 634 }, { "epoch": 0.09, "learning_rate": 1.982285564663546e-05, "loss": 0.9497, "step": 635 }, { "epoch": 0.09, "learning_rate": 1.982201160012585e-05, "loss": 0.6489, "step": 636 }, { "epoch": 0.09, "learning_rate": 1.9821165565617543e-05, "loss": 0.9507, "step": 637 }, { "epoch": 0.09, "learning_rate": 1.982031754328177e-05, "loss": 0.9775, "step": 638 }, { "epoch": 0.09, "learning_rate": 1.9819467533290174e-05, "loss": 0.8989, "step": 639 }, { "epoch": 0.09, "learning_rate": 1.9818615535814802e-05, "loss": 0.9004, "step": 640 }, { "epoch": 0.09, "learning_rate": 1.9817761551028097e-05, "loss": 0.9006, "step": 641 }, { "epoch": 0.09, "learning_rate": 1.981690557910291e-05, "loss": 0.9324, "step": 642 }, { "epoch": 0.09, "learning_rate": 1.9816047620212493e-05, "loss": 0.9514, "step": 643 }, { "epoch": 0.09, "learning_rate": 1.9815187674530497e-05, "loss": 0.9048, "step": 644 }, { "epoch": 0.09, "learning_rate": 1.9814325742230976e-05, "loss": 0.9185, "step": 645 }, { "epoch": 0.09, "learning_rate": 1.981346182348839e-05, "loss": 0.9788, "step": 646 }, { "epoch": 0.09, "learning_rate": 1.981259591847759e-05, "loss": 0.9487, "step": 647 }, { "epoch": 0.09, "learning_rate": 1.981172802737385e-05, "loss": 0.9712, "step": 648 }, { "epoch": 0.09, "learning_rate": 1.9810858150352823e-05, "loss": 0.9358, "step": 649 }, { "epoch": 0.09, "learning_rate": 1.980998628759058e-05, "loss": 0.9563, "step": 650 }, { "epoch": 0.09, "learning_rate": 1.9809112439263588e-05, "loss": 0.9561, "step": 651 }, { "epoch": 0.09, "learning_rate": 1.980823660554871e-05, "loss": 0.6631, "step": 652 }, { "epoch": 0.09, "learning_rate": 1.9807358786623223e-05, "loss": 0.9226, "step": 653 }, { "epoch": 0.09, "learning_rate": 1.98064789826648e-05, "loss": 0.9573, "step": 654 }, { "epoch": 0.09, "learning_rate": 1.980559719385151e-05, "loss": 0.9224, "step": 655 }, { "epoch": 0.09, "learning_rate": 1.9804713420361838e-05, "loss": 0.8662, "step": 656 }, { "epoch": 0.09, "learning_rate": 1.9803827662374648e-05, "loss": 0.9176, "step": 657 }, { "epoch": 0.09, "learning_rate": 1.980293992006923e-05, "loss": 0.9966, "step": 658 }, { "epoch": 0.09, "learning_rate": 1.9802050193625265e-05, "loss": 0.9031, "step": 659 }, { "epoch": 0.09, "learning_rate": 1.9801158483222835e-05, "loss": 0.8875, "step": 660 }, { "epoch": 0.09, "learning_rate": 1.980026478904242e-05, "loss": 0.9609, "step": 661 }, { "epoch": 0.09, "learning_rate": 1.9799369111264914e-05, "loss": 0.9893, "step": 662 }, { "epoch": 0.09, "learning_rate": 1.979847145007159e-05, "loss": 0.8701, "step": 663 }, { "epoch": 0.09, "learning_rate": 1.9797571805644155e-05, "loss": 0.9607, "step": 664 }, { "epoch": 0.09, "learning_rate": 1.9796670178164684e-05, "loss": 0.8877, "step": 665 }, { "epoch": 0.09, "learning_rate": 1.9795766567815676e-05, "loss": 0.8833, "step": 666 }, { "epoch": 0.09, "learning_rate": 1.9794860974780027e-05, "loss": 0.9377, "step": 667 }, { "epoch": 0.09, "learning_rate": 1.9793953399241023e-05, "loss": 0.8862, "step": 668 }, { "epoch": 0.09, "learning_rate": 1.9793043841382366e-05, "loss": 0.9417, "step": 669 }, { "epoch": 0.09, "learning_rate": 1.9792132301388143e-05, "loss": 0.9563, "step": 670 }, { "epoch": 0.09, "learning_rate": 1.9791218779442866e-05, "loss": 0.8977, "step": 671 }, { "epoch": 0.09, "learning_rate": 1.9790303275731424e-05, "loss": 0.9312, "step": 672 }, { "epoch": 0.09, "learning_rate": 1.9789385790439118e-05, "loss": 0.9441, "step": 673 }, { "epoch": 0.09, "learning_rate": 1.9788466323751655e-05, "loss": 0.9775, "step": 674 }, { "epoch": 0.09, "learning_rate": 1.9787544875855134e-05, "loss": 0.9302, "step": 675 }, { "epoch": 0.09, "learning_rate": 1.9786621446936056e-05, "loss": 0.9983, "step": 676 }, { "epoch": 0.09, "learning_rate": 1.9785696037181326e-05, "loss": 0.9268, "step": 677 }, { "epoch": 0.09, "learning_rate": 1.978476864677825e-05, "loss": 0.928, "step": 678 }, { "epoch": 0.09, "learning_rate": 1.9783839275914537e-05, "loss": 0.9465, "step": 679 }, { "epoch": 0.09, "learning_rate": 1.978290792477829e-05, "loss": 0.9368, "step": 680 }, { "epoch": 0.09, "learning_rate": 1.9781974593558016e-05, "loss": 0.9512, "step": 681 }, { "epoch": 0.09, "learning_rate": 1.9781039282442627e-05, "loss": 0.9043, "step": 682 }, { "epoch": 0.09, "learning_rate": 1.978010199162143e-05, "loss": 0.9143, "step": 683 }, { "epoch": 0.1, "learning_rate": 1.9779162721284135e-05, "loss": 0.8967, "step": 684 }, { "epoch": 0.1, "learning_rate": 1.9778221471620854e-05, "loss": 0.9749, "step": 685 }, { "epoch": 0.1, "learning_rate": 1.9777278242822097e-05, "loss": 0.9221, "step": 686 }, { "epoch": 0.1, "learning_rate": 1.9776333035078774e-05, "loss": 0.8926, "step": 687 }, { "epoch": 0.1, "learning_rate": 1.9775385848582204e-05, "loss": 0.8618, "step": 688 }, { "epoch": 0.1, "learning_rate": 1.977443668352409e-05, "loss": 0.5945, "step": 689 }, { "epoch": 0.1, "learning_rate": 1.977348554009655e-05, "loss": 0.9656, "step": 690 }, { "epoch": 0.1, "learning_rate": 1.97725324184921e-05, "loss": 0.8833, "step": 691 }, { "epoch": 0.1, "learning_rate": 1.9771577318903655e-05, "loss": 0.9875, "step": 692 }, { "epoch": 0.1, "learning_rate": 1.9770620241524524e-05, "loss": 0.6475, "step": 693 }, { "epoch": 0.1, "learning_rate": 1.976966118654842e-05, "loss": 0.9243, "step": 694 }, { "epoch": 0.1, "learning_rate": 1.976870015416947e-05, "loss": 0.9333, "step": 695 }, { "epoch": 0.1, "learning_rate": 1.9767737144582176e-05, "loss": 0.6398, "step": 696 }, { "epoch": 0.1, "learning_rate": 1.9766772157981462e-05, "loss": 0.9417, "step": 697 }, { "epoch": 0.1, "learning_rate": 1.976580519456264e-05, "loss": 0.6115, "step": 698 }, { "epoch": 0.1, "learning_rate": 1.9764836254521426e-05, "loss": 0.9531, "step": 699 }, { "epoch": 0.1, "learning_rate": 1.976386533805394e-05, "loss": 0.936, "step": 700 }, { "epoch": 0.1, "learning_rate": 1.9762892445356688e-05, "loss": 0.9924, "step": 701 }, { "epoch": 0.1, "learning_rate": 1.9761917576626594e-05, "loss": 0.9978, "step": 702 }, { "epoch": 0.1, "learning_rate": 1.9760940732060973e-05, "loss": 0.9536, "step": 703 }, { "epoch": 0.1, "learning_rate": 1.9759961911857538e-05, "loss": 0.647, "step": 704 }, { "epoch": 0.1, "learning_rate": 1.9758981116214407e-05, "loss": 0.9277, "step": 705 }, { "epoch": 0.1, "learning_rate": 1.9757998345330095e-05, "loss": 0.9668, "step": 706 }, { "epoch": 0.1, "learning_rate": 1.9757013599403515e-05, "loss": 0.9653, "step": 707 }, { "epoch": 0.1, "learning_rate": 1.975602687863398e-05, "loss": 0.9224, "step": 708 }, { "epoch": 0.1, "learning_rate": 1.9755038183221213e-05, "loss": 0.9116, "step": 709 }, { "epoch": 0.1, "learning_rate": 1.975404751336532e-05, "loss": 0.9253, "step": 710 }, { "epoch": 0.1, "learning_rate": 1.975305486926682e-05, "loss": 0.613, "step": 711 }, { "epoch": 0.1, "learning_rate": 1.9752060251126625e-05, "loss": 0.9587, "step": 712 }, { "epoch": 0.1, "learning_rate": 1.9751063659146047e-05, "loss": 0.8684, "step": 713 }, { "epoch": 0.1, "learning_rate": 1.9750065093526803e-05, "loss": 0.9819, "step": 714 }, { "epoch": 0.1, "learning_rate": 1.9749064554470995e-05, "loss": 0.6713, "step": 715 }, { "epoch": 0.1, "learning_rate": 1.9748062042181147e-05, "loss": 0.9758, "step": 716 }, { "epoch": 0.1, "learning_rate": 1.9747057556860163e-05, "loss": 0.9697, "step": 717 }, { "epoch": 0.1, "learning_rate": 1.9746051098711353e-05, "loss": 0.9854, "step": 718 }, { "epoch": 0.1, "learning_rate": 1.974504266793843e-05, "loss": 0.9424, "step": 719 }, { "epoch": 0.1, "learning_rate": 1.9744032264745494e-05, "loss": 0.9338, "step": 720 }, { "epoch": 0.1, "learning_rate": 1.9743019889337065e-05, "loss": 0.9668, "step": 721 }, { "epoch": 0.1, "learning_rate": 1.9742005541918045e-05, "loss": 0.9211, "step": 722 }, { "epoch": 0.1, "learning_rate": 1.9740989222693737e-05, "loss": 0.9729, "step": 723 }, { "epoch": 0.1, "learning_rate": 1.973997093186985e-05, "loss": 0.9182, "step": 724 }, { "epoch": 0.1, "learning_rate": 1.9738950669652493e-05, "loss": 0.9575, "step": 725 }, { "epoch": 0.1, "learning_rate": 1.973792843624816e-05, "loss": 0.9529, "step": 726 }, { "epoch": 0.1, "learning_rate": 1.973690423186376e-05, "loss": 0.9583, "step": 727 }, { "epoch": 0.1, "learning_rate": 1.973587805670659e-05, "loss": 0.8445, "step": 728 }, { "epoch": 0.1, "learning_rate": 1.973484991098436e-05, "loss": 0.8892, "step": 729 }, { "epoch": 0.1, "learning_rate": 1.9733819794905153e-05, "loss": 0.9531, "step": 730 }, { "epoch": 0.1, "learning_rate": 1.973278770867748e-05, "loss": 0.8303, "step": 731 }, { "epoch": 0.1, "learning_rate": 1.9731753652510236e-05, "loss": 0.9736, "step": 732 }, { "epoch": 0.1, "learning_rate": 1.973071762661271e-05, "loss": 0.9963, "step": 733 }, { "epoch": 0.1, "learning_rate": 1.9729679631194605e-05, "loss": 0.907, "step": 734 }, { "epoch": 0.1, "learning_rate": 1.9728639666466004e-05, "loss": 0.9639, "step": 735 }, { "epoch": 0.1, "learning_rate": 1.9727597732637406e-05, "loss": 0.947, "step": 736 }, { "epoch": 0.1, "learning_rate": 1.97265538299197e-05, "loss": 0.9238, "step": 737 }, { "epoch": 0.1, "learning_rate": 1.972550795852417e-05, "loss": 0.9675, "step": 738 }, { "epoch": 0.1, "learning_rate": 1.9724460118662504e-05, "loss": 0.9373, "step": 739 }, { "epoch": 0.1, "learning_rate": 1.9723410310546794e-05, "loss": 0.6313, "step": 740 }, { "epoch": 0.1, "learning_rate": 1.9722358534389517e-05, "loss": 0.9229, "step": 741 }, { "epoch": 0.1, "learning_rate": 1.9721304790403555e-05, "loss": 0.981, "step": 742 }, { "epoch": 0.1, "learning_rate": 1.972024907880219e-05, "loss": 0.9209, "step": 743 }, { "epoch": 0.1, "learning_rate": 1.9719191399799102e-05, "loss": 0.9392, "step": 744 }, { "epoch": 0.1, "learning_rate": 1.9718131753608362e-05, "loss": 0.8762, "step": 745 }, { "epoch": 0.1, "learning_rate": 1.9717070140444455e-05, "loss": 0.95, "step": 746 }, { "epoch": 0.1, "learning_rate": 1.9716006560522246e-05, "loss": 0.9275, "step": 747 }, { "epoch": 0.1, "learning_rate": 1.971494101405701e-05, "loss": 0.9453, "step": 748 }, { "epoch": 0.1, "learning_rate": 1.971387350126441e-05, "loss": 0.907, "step": 749 }, { "epoch": 0.1, "learning_rate": 1.9712804022360517e-05, "loss": 0.9348, "step": 750 }, { "epoch": 0.1, "learning_rate": 1.9711732577561803e-05, "loss": 0.9312, "step": 751 }, { "epoch": 0.1, "learning_rate": 1.971065916708512e-05, "loss": 0.6656, "step": 752 }, { "epoch": 0.1, "learning_rate": 1.9709583791147738e-05, "loss": 0.9243, "step": 753 }, { "epoch": 0.1, "learning_rate": 1.970850644996731e-05, "loss": 0.634, "step": 754 }, { "epoch": 0.1, "learning_rate": 1.970742714376189e-05, "loss": 0.9114, "step": 755 }, { "epoch": 0.11, "learning_rate": 1.970634587274994e-05, "loss": 0.6027, "step": 756 }, { "epoch": 0.11, "learning_rate": 1.9705262637150304e-05, "loss": 0.9565, "step": 757 }, { "epoch": 0.11, "learning_rate": 1.970417743718224e-05, "loss": 0.9187, "step": 758 }, { "epoch": 0.11, "learning_rate": 1.9703090273065388e-05, "loss": 0.9495, "step": 759 }, { "epoch": 0.11, "learning_rate": 1.9702001145019794e-05, "loss": 0.9102, "step": 760 }, { "epoch": 0.11, "learning_rate": 1.97009100532659e-05, "loss": 0.9707, "step": 761 }, { "epoch": 0.11, "learning_rate": 1.9699816998024547e-05, "loss": 0.9287, "step": 762 }, { "epoch": 0.11, "learning_rate": 1.9698721979516973e-05, "loss": 0.6978, "step": 763 }, { "epoch": 0.11, "learning_rate": 1.969762499796481e-05, "loss": 0.8865, "step": 764 }, { "epoch": 0.11, "learning_rate": 1.9696526053590092e-05, "loss": 0.6203, "step": 765 }, { "epoch": 0.11, "learning_rate": 1.9695425146615246e-05, "loss": 0.9656, "step": 766 }, { "epoch": 0.11, "learning_rate": 1.9694322277263102e-05, "loss": 0.8994, "step": 767 }, { "epoch": 0.11, "learning_rate": 1.9693217445756875e-05, "loss": 0.9072, "step": 768 }, { "epoch": 0.11, "learning_rate": 1.9692110652320196e-05, "loss": 0.9424, "step": 769 }, { "epoch": 0.11, "learning_rate": 1.9691001897177072e-05, "loss": 0.9612, "step": 770 }, { "epoch": 0.11, "learning_rate": 1.9689891180551925e-05, "loss": 0.9326, "step": 771 }, { "epoch": 0.11, "learning_rate": 1.9688778502669568e-05, "loss": 0.9688, "step": 772 }, { "epoch": 0.11, "learning_rate": 1.9687663863755204e-05, "loss": 0.9219, "step": 773 }, { "epoch": 0.11, "learning_rate": 1.968654726403444e-05, "loss": 0.9492, "step": 774 }, { "epoch": 0.11, "learning_rate": 1.9685428703733285e-05, "loss": 0.9072, "step": 775 }, { "epoch": 0.11, "learning_rate": 1.9684308183078127e-05, "loss": 0.9226, "step": 776 }, { "epoch": 0.11, "learning_rate": 1.968318570229577e-05, "loss": 0.9604, "step": 777 }, { "epoch": 0.11, "learning_rate": 1.9682061261613406e-05, "loss": 0.9297, "step": 778 }, { "epoch": 0.11, "learning_rate": 1.968093486125862e-05, "loss": 0.9709, "step": 779 }, { "epoch": 0.11, "learning_rate": 1.9679806501459406e-05, "loss": 0.9502, "step": 780 }, { "epoch": 0.11, "learning_rate": 1.9678676182444137e-05, "loss": 0.9844, "step": 781 }, { "epoch": 0.11, "learning_rate": 1.96775439044416e-05, "loss": 0.6061, "step": 782 }, { "epoch": 0.11, "learning_rate": 1.9676409667680973e-05, "loss": 0.9746, "step": 783 }, { "epoch": 0.11, "learning_rate": 1.9675273472391817e-05, "loss": 0.8916, "step": 784 }, { "epoch": 0.11, "learning_rate": 1.9674135318804107e-05, "loss": 0.9209, "step": 785 }, { "epoch": 0.11, "learning_rate": 1.967299520714821e-05, "loss": 0.9512, "step": 786 }, { "epoch": 0.11, "learning_rate": 1.9671853137654887e-05, "loss": 0.6273, "step": 787 }, { "epoch": 0.11, "learning_rate": 1.9670709110555292e-05, "loss": 0.8706, "step": 788 }, { "epoch": 0.11, "learning_rate": 1.966956312608098e-05, "loss": 0.8826, "step": 789 }, { "epoch": 0.11, "learning_rate": 1.9668415184463905e-05, "loss": 0.6449, "step": 790 }, { "epoch": 0.11, "learning_rate": 1.9667265285936407e-05, "loss": 0.9375, "step": 791 }, { "epoch": 0.11, "learning_rate": 1.9666113430731233e-05, "loss": 0.9331, "step": 792 }, { "epoch": 0.11, "learning_rate": 1.9664959619081518e-05, "loss": 0.877, "step": 793 }, { "epoch": 0.11, "learning_rate": 1.9663803851220798e-05, "loss": 0.9351, "step": 794 }, { "epoch": 0.11, "learning_rate": 1.9662646127383004e-05, "loss": 0.5934, "step": 795 }, { "epoch": 0.11, "learning_rate": 1.966148644780246e-05, "loss": 0.9617, "step": 796 }, { "epoch": 0.11, "learning_rate": 1.966032481271389e-05, "loss": 0.9282, "step": 797 }, { "epoch": 0.11, "learning_rate": 1.965916122235241e-05, "loss": 0.9851, "step": 798 }, { "epoch": 0.11, "learning_rate": 1.9657995676953533e-05, "loss": 0.9443, "step": 799 }, { "epoch": 0.11, "learning_rate": 1.965682817675317e-05, "loss": 0.9873, "step": 800 }, { "epoch": 0.11, "learning_rate": 1.965565872198763e-05, "loss": 0.959, "step": 801 }, { "epoch": 0.11, "learning_rate": 1.9654487312893602e-05, "loss": 0.9531, "step": 802 }, { "epoch": 0.11, "learning_rate": 1.965331394970819e-05, "loss": 1.0085, "step": 803 }, { "epoch": 0.11, "learning_rate": 1.9652138632668886e-05, "loss": 0.9885, "step": 804 }, { "epoch": 0.11, "learning_rate": 1.9650961362013573e-05, "loss": 0.9138, "step": 805 }, { "epoch": 0.11, "learning_rate": 1.964978213798054e-05, "loss": 0.957, "step": 806 }, { "epoch": 0.11, "learning_rate": 1.9648600960808456e-05, "loss": 0.9343, "step": 807 }, { "epoch": 0.11, "learning_rate": 1.9647417830736397e-05, "loss": 0.9583, "step": 808 }, { "epoch": 0.11, "learning_rate": 1.9646232748003834e-05, "loss": 0.8794, "step": 809 }, { "epoch": 0.11, "learning_rate": 1.9645045712850632e-05, "loss": 0.9016, "step": 810 }, { "epoch": 0.11, "learning_rate": 1.9643856725517045e-05, "loss": 0.936, "step": 811 }, { "epoch": 0.11, "learning_rate": 1.9642665786243732e-05, "loss": 0.9197, "step": 812 }, { "epoch": 0.11, "learning_rate": 1.9641472895271736e-05, "loss": 0.9124, "step": 813 }, { "epoch": 0.11, "learning_rate": 1.96402780528425e-05, "loss": 0.9397, "step": 814 }, { "epoch": 0.11, "learning_rate": 1.9639081259197877e-05, "loss": 0.9333, "step": 815 }, { "epoch": 0.11, "learning_rate": 1.9637882514580086e-05, "loss": 0.9856, "step": 816 }, { "epoch": 0.11, "learning_rate": 1.9636681819231756e-05, "loss": 0.9382, "step": 817 }, { "epoch": 0.11, "learning_rate": 1.9635479173395923e-05, "loss": 0.9763, "step": 818 }, { "epoch": 0.11, "learning_rate": 1.963427457731599e-05, "loss": 0.9221, "step": 819 }, { "epoch": 0.11, "learning_rate": 1.9633068031235783e-05, "loss": 0.9294, "step": 820 }, { "epoch": 0.11, "learning_rate": 1.9631859535399506e-05, "loss": 0.9812, "step": 821 }, { "epoch": 0.11, "learning_rate": 1.9630649090051754e-05, "loss": 0.9446, "step": 822 }, { "epoch": 0.11, "learning_rate": 1.9629436695437533e-05, "loss": 0.9199, "step": 823 }, { "epoch": 0.11, "learning_rate": 1.9628222351802232e-05, "loss": 0.9382, "step": 824 }, { "epoch": 0.11, "learning_rate": 1.9627006059391636e-05, "loss": 0.9097, "step": 825 }, { "epoch": 0.11, "learning_rate": 1.962578781845193e-05, "loss": 0.9407, "step": 826 }, { "epoch": 0.11, "learning_rate": 1.9624567629229682e-05, "loss": 0.8828, "step": 827 }, { "epoch": 0.12, "learning_rate": 1.9623345491971862e-05, "loss": 0.9232, "step": 828 }, { "epoch": 0.12, "learning_rate": 1.962212140692584e-05, "loss": 0.9158, "step": 829 }, { "epoch": 0.12, "learning_rate": 1.9620895374339367e-05, "loss": 0.9531, "step": 830 }, { "epoch": 0.12, "learning_rate": 1.96196673944606e-05, "loss": 0.814, "step": 831 }, { "epoch": 0.12, "learning_rate": 1.961843746753808e-05, "loss": 0.9075, "step": 832 }, { "epoch": 0.12, "learning_rate": 1.9617205593820748e-05, "loss": 0.9421, "step": 833 }, { "epoch": 0.12, "learning_rate": 1.9615971773557946e-05, "loss": 0.937, "step": 834 }, { "epoch": 0.12, "learning_rate": 1.961473600699939e-05, "loss": 0.9121, "step": 835 }, { "epoch": 0.12, "learning_rate": 1.9613498294395214e-05, "loss": 0.9058, "step": 836 }, { "epoch": 0.12, "learning_rate": 1.9612258635995922e-05, "loss": 0.9504, "step": 837 }, { "epoch": 0.12, "learning_rate": 1.9611017032052434e-05, "loss": 0.978, "step": 838 }, { "epoch": 0.12, "learning_rate": 1.960977348281605e-05, "loss": 0.9304, "step": 839 }, { "epoch": 0.12, "learning_rate": 1.960852798853847e-05, "loss": 0.9224, "step": 840 }, { "epoch": 0.12, "learning_rate": 1.9607280549471777e-05, "loss": 0.9695, "step": 841 }, { "epoch": 0.12, "learning_rate": 1.960603116586846e-05, "loss": 0.8831, "step": 842 }, { "epoch": 0.12, "learning_rate": 1.96047798379814e-05, "loss": 0.9858, "step": 843 }, { "epoch": 0.12, "learning_rate": 1.9603526566063866e-05, "loss": 0.9414, "step": 844 }, { "epoch": 0.12, "learning_rate": 1.9602271350369525e-05, "loss": 0.9106, "step": 845 }, { "epoch": 0.12, "learning_rate": 1.9601014191152435e-05, "loss": 0.9392, "step": 846 }, { "epoch": 0.12, "learning_rate": 1.9599755088667048e-05, "loss": 0.8948, "step": 847 }, { "epoch": 0.12, "learning_rate": 1.9598494043168206e-05, "loss": 0.9412, "step": 848 }, { "epoch": 0.12, "learning_rate": 1.9597231054911155e-05, "loss": 0.9985, "step": 849 }, { "epoch": 0.12, "learning_rate": 1.959596612415152e-05, "loss": 0.8638, "step": 850 }, { "epoch": 0.12, "learning_rate": 1.959469925114533e-05, "loss": 0.8511, "step": 851 }, { "epoch": 0.12, "learning_rate": 1.9593430436148998e-05, "loss": 0.9685, "step": 852 }, { "epoch": 0.12, "learning_rate": 1.9592159679419343e-05, "loss": 0.9062, "step": 853 }, { "epoch": 0.12, "learning_rate": 1.9590886981213565e-05, "loss": 0.9722, "step": 854 }, { "epoch": 0.12, "learning_rate": 1.958961234178926e-05, "loss": 0.9832, "step": 855 }, { "epoch": 0.12, "learning_rate": 1.958833576140442e-05, "loss": 0.9351, "step": 856 }, { "epoch": 0.12, "learning_rate": 1.9587057240317423e-05, "loss": 0.939, "step": 857 }, { "epoch": 0.12, "learning_rate": 1.9585776778787055e-05, "loss": 0.9736, "step": 858 }, { "epoch": 0.12, "learning_rate": 1.9584494377072477e-05, "loss": 0.9419, "step": 859 }, { "epoch": 0.12, "learning_rate": 1.958321003543325e-05, "loss": 0.9109, "step": 860 }, { "epoch": 0.12, "learning_rate": 1.958192375412933e-05, "loss": 0.8989, "step": 861 }, { "epoch": 0.12, "learning_rate": 1.9580635533421065e-05, "loss": 0.9263, "step": 862 }, { "epoch": 0.12, "learning_rate": 1.957934537356919e-05, "loss": 0.6035, "step": 863 }, { "epoch": 0.12, "learning_rate": 1.9578053274834835e-05, "loss": 0.9683, "step": 864 }, { "epoch": 0.12, "learning_rate": 1.9576759237479534e-05, "loss": 0.9075, "step": 865 }, { "epoch": 0.12, "learning_rate": 1.957546326176519e-05, "loss": 0.8776, "step": 866 }, { "epoch": 0.12, "learning_rate": 1.9574165347954125e-05, "loss": 0.9602, "step": 867 }, { "epoch": 0.12, "learning_rate": 1.957286549630903e-05, "loss": 0.8425, "step": 868 }, { "epoch": 0.12, "learning_rate": 1.9571563707092997e-05, "loss": 0.9353, "step": 869 }, { "epoch": 0.12, "learning_rate": 1.957025998056952e-05, "loss": 0.959, "step": 870 }, { "epoch": 0.12, "learning_rate": 1.956895431700247e-05, "loss": 0.9604, "step": 871 }, { "epoch": 0.12, "learning_rate": 1.956764671665612e-05, "loss": 0.9678, "step": 872 }, { "epoch": 0.12, "learning_rate": 1.9566337179795124e-05, "loss": 0.928, "step": 873 }, { "epoch": 0.12, "learning_rate": 1.956502570668455e-05, "loss": 0.9187, "step": 874 }, { "epoch": 0.12, "learning_rate": 1.9563712297589827e-05, "loss": 0.8738, "step": 875 }, { "epoch": 0.12, "learning_rate": 1.95623969527768e-05, "loss": 0.9773, "step": 876 }, { "epoch": 0.12, "learning_rate": 1.95610796725117e-05, "loss": 0.9387, "step": 877 }, { "epoch": 0.12, "learning_rate": 1.9559760457061143e-05, "loss": 0.9565, "step": 878 }, { "epoch": 0.12, "learning_rate": 1.9558439306692144e-05, "loss": 0.9463, "step": 879 }, { "epoch": 0.12, "learning_rate": 1.9557116221672107e-05, "loss": 0.5966, "step": 880 }, { "epoch": 0.12, "learning_rate": 1.9555791202268827e-05, "loss": 0.8831, "step": 881 }, { "epoch": 0.12, "learning_rate": 1.9554464248750492e-05, "loss": 0.9536, "step": 882 }, { "epoch": 0.12, "learning_rate": 1.955313536138568e-05, "loss": 0.9932, "step": 883 }, { "epoch": 0.12, "learning_rate": 1.9551804540443357e-05, "loss": 0.95, "step": 884 }, { "epoch": 0.12, "learning_rate": 1.955047178619289e-05, "loss": 0.9111, "step": 885 }, { "epoch": 0.12, "learning_rate": 1.954913709890403e-05, "loss": 0.8813, "step": 886 }, { "epoch": 0.12, "learning_rate": 1.954780047884692e-05, "loss": 0.9556, "step": 887 }, { "epoch": 0.12, "learning_rate": 1.9546461926292097e-05, "loss": 0.9133, "step": 888 }, { "epoch": 0.12, "learning_rate": 1.9545121441510483e-05, "loss": 0.9082, "step": 889 }, { "epoch": 0.12, "learning_rate": 1.9543779024773403e-05, "loss": 0.9006, "step": 890 }, { "epoch": 0.12, "learning_rate": 1.9542434676352557e-05, "loss": 0.8857, "step": 891 }, { "epoch": 0.12, "learning_rate": 1.954108839652005e-05, "loss": 0.9902, "step": 892 }, { "epoch": 0.12, "learning_rate": 1.953974018554837e-05, "loss": 0.9285, "step": 893 }, { "epoch": 0.12, "learning_rate": 1.9538390043710395e-05, "loss": 0.5588, "step": 894 }, { "epoch": 0.12, "learning_rate": 1.9537037971279403e-05, "loss": 0.9126, "step": 895 }, { "epoch": 0.12, "learning_rate": 1.9535683968529056e-05, "loss": 0.9238, "step": 896 }, { "epoch": 0.12, "learning_rate": 1.9534328035733403e-05, "loss": 0.8503, "step": 897 }, { "epoch": 0.12, "learning_rate": 1.9532970173166893e-05, "loss": 0.908, "step": 898 }, { "epoch": 0.12, "learning_rate": 1.9531610381104353e-05, "loss": 0.9563, "step": 899 }, { "epoch": 0.13, "learning_rate": 1.953024865982102e-05, "loss": 0.8958, "step": 900 }, { "epoch": 0.13, "learning_rate": 1.9528885009592497e-05, "loss": 0.9277, "step": 901 }, { "epoch": 0.13, "learning_rate": 1.9527519430694798e-05, "loss": 0.925, "step": 902 }, { "epoch": 0.13, "learning_rate": 1.9526151923404316e-05, "loss": 0.8997, "step": 903 }, { "epoch": 0.13, "learning_rate": 1.9524782487997843e-05, "loss": 0.9578, "step": 904 }, { "epoch": 0.13, "learning_rate": 1.952341112475255e-05, "loss": 0.9111, "step": 905 }, { "epoch": 0.13, "learning_rate": 1.9522037833946005e-05, "loss": 0.9329, "step": 906 }, { "epoch": 0.13, "learning_rate": 1.952066261585617e-05, "loss": 0.8923, "step": 907 }, { "epoch": 0.13, "learning_rate": 1.9519285470761387e-05, "loss": 0.9014, "step": 908 }, { "epoch": 0.13, "learning_rate": 1.9517906398940397e-05, "loss": 0.915, "step": 909 }, { "epoch": 0.13, "learning_rate": 1.9516525400672327e-05, "loss": 0.9622, "step": 910 }, { "epoch": 0.13, "learning_rate": 1.951514247623669e-05, "loss": 0.9211, "step": 911 }, { "epoch": 0.13, "learning_rate": 1.9513757625913396e-05, "loss": 0.9775, "step": 912 }, { "epoch": 0.13, "learning_rate": 1.9512370849982747e-05, "loss": 0.9343, "step": 913 }, { "epoch": 0.13, "learning_rate": 1.9510982148725427e-05, "loss": 0.8901, "step": 914 }, { "epoch": 0.13, "learning_rate": 1.9509591522422508e-05, "loss": 0.9209, "step": 915 }, { "epoch": 0.13, "learning_rate": 1.9508198971355458e-05, "loss": 0.8921, "step": 916 }, { "epoch": 0.13, "learning_rate": 1.9506804495806133e-05, "loss": 0.8611, "step": 917 }, { "epoch": 0.13, "learning_rate": 1.9505408096056782e-05, "loss": 0.8945, "step": 918 }, { "epoch": 0.13, "learning_rate": 1.9504009772390032e-05, "loss": 0.9268, "step": 919 }, { "epoch": 0.13, "learning_rate": 1.9502609525088917e-05, "loss": 0.9219, "step": 920 }, { "epoch": 0.13, "learning_rate": 1.9501207354436845e-05, "loss": 0.99, "step": 921 }, { "epoch": 0.13, "learning_rate": 1.949980326071762e-05, "loss": 0.9346, "step": 922 }, { "epoch": 0.13, "learning_rate": 1.9498397244215426e-05, "loss": 0.9143, "step": 923 }, { "epoch": 0.13, "learning_rate": 1.9496989305214854e-05, "loss": 0.8992, "step": 924 }, { "epoch": 0.13, "learning_rate": 1.949557944400087e-05, "loss": 0.9827, "step": 925 }, { "epoch": 0.13, "learning_rate": 1.949416766085884e-05, "loss": 0.9048, "step": 926 }, { "epoch": 0.13, "learning_rate": 1.9492753956074503e-05, "loss": 0.8958, "step": 927 }, { "epoch": 0.13, "learning_rate": 1.9491338329934e-05, "loss": 0.9194, "step": 928 }, { "epoch": 0.13, "learning_rate": 1.9489920782723854e-05, "loss": 0.8962, "step": 929 }, { "epoch": 0.13, "learning_rate": 1.9488501314730986e-05, "loss": 0.905, "step": 930 }, { "epoch": 0.13, "learning_rate": 1.94870799262427e-05, "loss": 0.927, "step": 931 }, { "epoch": 0.13, "learning_rate": 1.948565661754668e-05, "loss": 0.9089, "step": 932 }, { "epoch": 0.13, "learning_rate": 1.948423138893101e-05, "loss": 0.9609, "step": 933 }, { "epoch": 0.13, "learning_rate": 1.9482804240684168e-05, "loss": 0.9453, "step": 934 }, { "epoch": 0.13, "learning_rate": 1.9481375173095002e-05, "loss": 0.9189, "step": 935 }, { "epoch": 0.13, "learning_rate": 1.9479944186452765e-05, "loss": 0.8657, "step": 936 }, { "epoch": 0.13, "learning_rate": 1.9478511281047094e-05, "loss": 0.8596, "step": 937 }, { "epoch": 0.13, "learning_rate": 1.9477076457168e-05, "loss": 0.9355, "step": 938 }, { "epoch": 0.13, "learning_rate": 1.947563971510591e-05, "loss": 1.0066, "step": 939 }, { "epoch": 0.13, "learning_rate": 1.9474201055151613e-05, "loss": 0.936, "step": 940 }, { "epoch": 0.13, "learning_rate": 1.9472760477596303e-05, "loss": 0.9106, "step": 941 }, { "epoch": 0.13, "learning_rate": 1.9471317982731557e-05, "loss": 0.9431, "step": 942 }, { "epoch": 0.13, "learning_rate": 1.9469873570849335e-05, "loss": 0.9504, "step": 943 }, { "epoch": 0.13, "learning_rate": 1.9468427242241992e-05, "loss": 0.6659, "step": 944 }, { "epoch": 0.13, "learning_rate": 1.9466978997202268e-05, "loss": 0.8873, "step": 945 }, { "epoch": 0.13, "learning_rate": 1.9465528836023293e-05, "loss": 0.989, "step": 946 }, { "epoch": 0.13, "learning_rate": 1.946407675899858e-05, "loss": 0.9192, "step": 947 }, { "epoch": 0.13, "learning_rate": 1.9462622766422034e-05, "loss": 0.6592, "step": 948 }, { "epoch": 0.13, "learning_rate": 1.9461166858587947e-05, "loss": 0.936, "step": 949 }, { "epoch": 0.13, "learning_rate": 1.9459709035791002e-05, "loss": 0.866, "step": 950 }, { "epoch": 0.13, "learning_rate": 1.9458249298326258e-05, "loss": 0.8887, "step": 951 }, { "epoch": 0.13, "learning_rate": 1.9456787646489173e-05, "loss": 0.9031, "step": 952 }, { "epoch": 0.13, "learning_rate": 1.945532408057559e-05, "loss": 0.9282, "step": 953 }, { "epoch": 0.13, "learning_rate": 1.945385860088174e-05, "loss": 0.9001, "step": 954 }, { "epoch": 0.13, "learning_rate": 1.9452391207704234e-05, "loss": 0.9448, "step": 955 }, { "epoch": 0.13, "learning_rate": 1.945092190134008e-05, "loss": 0.9424, "step": 956 }, { "epoch": 0.13, "learning_rate": 1.9449450682086668e-05, "loss": 0.8557, "step": 957 }, { "epoch": 0.13, "learning_rate": 1.9447977550241775e-05, "loss": 0.8828, "step": 958 }, { "epoch": 0.13, "learning_rate": 1.944650250610357e-05, "loss": 0.9146, "step": 959 }, { "epoch": 0.13, "learning_rate": 1.9445025549970604e-05, "loss": 0.8752, "step": 960 }, { "epoch": 0.13, "learning_rate": 1.9443546682141813e-05, "loss": 0.9597, "step": 961 }, { "epoch": 0.13, "learning_rate": 1.9442065902916528e-05, "loss": 0.927, "step": 962 }, { "epoch": 0.13, "learning_rate": 1.944058321259446e-05, "loss": 0.9158, "step": 963 }, { "epoch": 0.13, "learning_rate": 1.943909861147571e-05, "loss": 0.9495, "step": 964 }, { "epoch": 0.13, "learning_rate": 1.9437612099860764e-05, "loss": 0.9529, "step": 965 }, { "epoch": 0.13, "learning_rate": 1.9436123678050496e-05, "loss": 0.9539, "step": 966 }, { "epoch": 0.13, "learning_rate": 1.9434633346346167e-05, "loss": 0.8848, "step": 967 }, { "epoch": 0.13, "learning_rate": 1.9433141105049417e-05, "loss": 0.9502, "step": 968 }, { "epoch": 0.13, "learning_rate": 1.943164695446229e-05, "loss": 0.9468, "step": 969 }, { "epoch": 0.13, "learning_rate": 1.94301508948872e-05, "loss": 0.6364, "step": 970 }, { "epoch": 0.13, "learning_rate": 1.9428652926626954e-05, "loss": 0.9551, "step": 971 }, { "epoch": 0.14, "learning_rate": 1.9427153049984743e-05, "loss": 0.5981, "step": 972 }, { "epoch": 0.14, "learning_rate": 1.9425651265264148e-05, "loss": 0.9509, "step": 973 }, { "epoch": 0.14, "learning_rate": 1.942414757276913e-05, "loss": 0.9565, "step": 974 }, { "epoch": 0.14, "learning_rate": 1.9422641972804046e-05, "loss": 0.8748, "step": 975 }, { "epoch": 0.14, "learning_rate": 1.9421134465673628e-05, "loss": 1.0015, "step": 976 }, { "epoch": 0.14, "learning_rate": 1.9419625051683e-05, "loss": 0.9409, "step": 977 }, { "epoch": 0.14, "learning_rate": 1.941811373113767e-05, "loss": 0.5695, "step": 978 }, { "epoch": 0.14, "learning_rate": 1.9416600504343535e-05, "loss": 0.9451, "step": 979 }, { "epoch": 0.14, "learning_rate": 1.9415085371606878e-05, "loss": 0.9033, "step": 980 }, { "epoch": 0.14, "learning_rate": 1.941356833323436e-05, "loss": 0.9397, "step": 981 }, { "epoch": 0.14, "learning_rate": 1.9412049389533038e-05, "loss": 0.9485, "step": 982 }, { "epoch": 0.14, "learning_rate": 1.9410528540810343e-05, "loss": 0.9497, "step": 983 }, { "epoch": 0.14, "learning_rate": 1.940900578737411e-05, "loss": 0.9321, "step": 984 }, { "epoch": 0.14, "learning_rate": 1.940748112953254e-05, "loss": 0.9353, "step": 985 }, { "epoch": 0.14, "learning_rate": 1.940595456759422e-05, "loss": 0.8799, "step": 986 }, { "epoch": 0.14, "learning_rate": 1.9404426101868144e-05, "loss": 0.9653, "step": 987 }, { "epoch": 0.14, "learning_rate": 1.9402895732663672e-05, "loss": 0.9404, "step": 988 }, { "epoch": 0.14, "learning_rate": 1.9401363460290557e-05, "loss": 0.9368, "step": 989 }, { "epoch": 0.14, "learning_rate": 1.9399829285058926e-05, "loss": 0.6115, "step": 990 }, { "epoch": 0.14, "learning_rate": 1.9398293207279307e-05, "loss": 0.9397, "step": 991 }, { "epoch": 0.14, "learning_rate": 1.9396755227262606e-05, "loss": 0.9678, "step": 992 }, { "epoch": 0.14, "learning_rate": 1.9395215345320108e-05, "loss": 0.9431, "step": 993 }, { "epoch": 0.14, "learning_rate": 1.9393673561763496e-05, "loss": 0.9551, "step": 994 }, { "epoch": 0.14, "learning_rate": 1.9392129876904824e-05, "loss": 0.925, "step": 995 }, { "epoch": 0.14, "learning_rate": 1.9390584291056543e-05, "loss": 0.9414, "step": 996 }, { "epoch": 0.14, "learning_rate": 1.938903680453148e-05, "loss": 0.9397, "step": 997 }, { "epoch": 0.14, "learning_rate": 1.9387487417642854e-05, "loss": 0.9863, "step": 998 }, { "epoch": 0.14, "learning_rate": 1.938593613070426e-05, "loss": 0.9219, "step": 999 }, { "epoch": 0.14, "learning_rate": 1.9384382944029686e-05, "loss": 0.8669, "step": 1000 }, { "epoch": 0.14, "learning_rate": 1.9382827857933493e-05, "loss": 0.9812, "step": 1001 }, { "epoch": 0.14, "learning_rate": 1.9381270872730444e-05, "loss": 0.8706, "step": 1002 }, { "epoch": 0.14, "learning_rate": 1.937971198873567e-05, "loss": 0.9419, "step": 1003 }, { "epoch": 0.14, "learning_rate": 1.93781512062647e-05, "loss": 0.9719, "step": 1004 }, { "epoch": 0.14, "learning_rate": 1.937658852563343e-05, "loss": 0.9233, "step": 1005 }, { "epoch": 0.14, "learning_rate": 1.9375023947158157e-05, "loss": 0.9583, "step": 1006 }, { "epoch": 0.14, "learning_rate": 1.9373457471155554e-05, "loss": 0.9573, "step": 1007 }, { "epoch": 0.14, "learning_rate": 1.937188909794268e-05, "loss": 0.9343, "step": 1008 }, { "epoch": 0.14, "learning_rate": 1.9370318827836977e-05, "loss": 0.8406, "step": 1009 }, { "epoch": 0.14, "learning_rate": 1.9368746661156272e-05, "loss": 0.9453, "step": 1010 }, { "epoch": 0.14, "learning_rate": 1.9367172598218774e-05, "loss": 0.8138, "step": 1011 }, { "epoch": 0.14, "learning_rate": 1.936559663934308e-05, "loss": 0.9319, "step": 1012 }, { "epoch": 0.14, "learning_rate": 1.9364018784848165e-05, "loss": 0.9033, "step": 1013 }, { "epoch": 0.14, "learning_rate": 1.9362439035053387e-05, "loss": 0.9161, "step": 1014 }, { "epoch": 0.14, "learning_rate": 1.93608573902785e-05, "loss": 0.8833, "step": 1015 }, { "epoch": 0.14, "learning_rate": 1.935927385084363e-05, "loss": 0.926, "step": 1016 }, { "epoch": 0.14, "learning_rate": 1.9357688417069282e-05, "loss": 0.8669, "step": 1017 }, { "epoch": 0.14, "learning_rate": 1.935610108927636e-05, "loss": 0.9695, "step": 1018 }, { "epoch": 0.14, "learning_rate": 1.9354511867786138e-05, "loss": 0.9458, "step": 1019 }, { "epoch": 0.14, "learning_rate": 1.9352920752920282e-05, "loss": 0.9187, "step": 1020 }, { "epoch": 0.14, "learning_rate": 1.9351327745000835e-05, "loss": 0.8855, "step": 1021 }, { "epoch": 0.14, "learning_rate": 1.9349732844350228e-05, "loss": 0.834, "step": 1022 }, { "epoch": 0.14, "learning_rate": 1.9348136051291267e-05, "loss": 0.9141, "step": 1023 }, { "epoch": 0.14, "learning_rate": 1.9346537366147152e-05, "loss": 0.9233, "step": 1024 }, { "epoch": 0.14, "learning_rate": 1.9344936789241458e-05, "loss": 0.8967, "step": 1025 }, { "epoch": 0.14, "learning_rate": 1.9343334320898152e-05, "loss": 0.8794, "step": 1026 }, { "epoch": 0.14, "learning_rate": 1.934172996144157e-05, "loss": 0.8994, "step": 1027 }, { "epoch": 0.14, "learning_rate": 1.9340123711196436e-05, "loss": 0.9219, "step": 1028 }, { "epoch": 0.14, "learning_rate": 1.933851557048787e-05, "loss": 0.9543, "step": 1029 }, { "epoch": 0.14, "learning_rate": 1.933690553964135e-05, "loss": 0.6364, "step": 1030 }, { "epoch": 0.14, "learning_rate": 1.9335293618982765e-05, "loss": 0.9919, "step": 1031 }, { "epoch": 0.14, "learning_rate": 1.933367980883836e-05, "loss": 0.9285, "step": 1032 }, { "epoch": 0.14, "learning_rate": 1.933206410953478e-05, "loss": 0.8997, "step": 1033 }, { "epoch": 0.14, "learning_rate": 1.933044652139904e-05, "loss": 0.9646, "step": 1034 }, { "epoch": 0.14, "learning_rate": 1.932882704475855e-05, "loss": 0.5934, "step": 1035 }, { "epoch": 0.14, "learning_rate": 1.9327205679941096e-05, "loss": 0.8845, "step": 1036 }, { "epoch": 0.14, "learning_rate": 1.932558242727484e-05, "loss": 0.9553, "step": 1037 }, { "epoch": 0.14, "learning_rate": 1.932395728708834e-05, "loss": 0.9478, "step": 1038 }, { "epoch": 0.14, "learning_rate": 1.9322330259710522e-05, "loss": 0.9277, "step": 1039 }, { "epoch": 0.14, "learning_rate": 1.9320701345470704e-05, "loss": 0.9114, "step": 1040 }, { "epoch": 0.14, "learning_rate": 1.9319070544698578e-05, "loss": 0.9028, "step": 1041 }, { "epoch": 0.14, "learning_rate": 1.9317437857724228e-05, "loss": 0.8911, "step": 1042 }, { "epoch": 0.14, "learning_rate": 1.9315803284878113e-05, "loss": 0.9221, "step": 1043 }, { "epoch": 0.15, "learning_rate": 1.9314166826491066e-05, "loss": 0.8604, "step": 1044 }, { "epoch": 0.15, "learning_rate": 1.931252848289432e-05, "loss": 0.8303, "step": 1045 }, { "epoch": 0.15, "learning_rate": 1.9310888254419477e-05, "loss": 0.8757, "step": 1046 }, { "epoch": 0.15, "learning_rate": 1.9309246141398517e-05, "loss": 0.907, "step": 1047 }, { "epoch": 0.15, "learning_rate": 1.930760214416382e-05, "loss": 0.9897, "step": 1048 }, { "epoch": 0.15, "learning_rate": 1.930595626304812e-05, "loss": 0.9351, "step": 1049 }, { "epoch": 0.15, "learning_rate": 1.930430849838456e-05, "loss": 0.8997, "step": 1050 }, { "epoch": 0.15, "learning_rate": 1.9302658850506645e-05, "loss": 0.8542, "step": 1051 }, { "epoch": 0.15, "learning_rate": 1.930100731974827e-05, "loss": 0.9519, "step": 1052 }, { "epoch": 0.15, "learning_rate": 1.9299353906443708e-05, "loss": 0.9692, "step": 1053 }, { "epoch": 0.15, "learning_rate": 1.929769861092761e-05, "loss": 0.9321, "step": 1054 }, { "epoch": 0.15, "learning_rate": 1.929604143353502e-05, "loss": 0.9324, "step": 1055 }, { "epoch": 0.15, "learning_rate": 1.929438237460135e-05, "loss": 0.8684, "step": 1056 }, { "epoch": 0.15, "learning_rate": 1.9292721434462396e-05, "loss": 0.8286, "step": 1057 }, { "epoch": 0.15, "learning_rate": 1.9291058613454336e-05, "loss": 0.9016, "step": 1058 }, { "epoch": 0.15, "learning_rate": 1.9289393911913733e-05, "loss": 0.9507, "step": 1059 }, { "epoch": 0.15, "learning_rate": 1.9287727330177528e-05, "loss": 0.9109, "step": 1060 }, { "epoch": 0.15, "learning_rate": 1.9286058868583034e-05, "loss": 0.895, "step": 1061 }, { "epoch": 0.15, "learning_rate": 1.9284388527467953e-05, "loss": 0.6189, "step": 1062 }, { "epoch": 0.15, "learning_rate": 1.9282716307170374e-05, "loss": 0.597, "step": 1063 }, { "epoch": 0.15, "learning_rate": 1.928104220802875e-05, "loss": 0.6775, "step": 1064 }, { "epoch": 0.15, "learning_rate": 1.9279366230381927e-05, "loss": 0.8779, "step": 1065 }, { "epoch": 0.15, "learning_rate": 1.9277688374569124e-05, "loss": 0.9048, "step": 1066 }, { "epoch": 0.15, "learning_rate": 1.927600864092994e-05, "loss": 0.9583, "step": 1067 }, { "epoch": 0.15, "learning_rate": 1.927432702980437e-05, "loss": 0.9404, "step": 1068 }, { "epoch": 0.15, "learning_rate": 1.9272643541532764e-05, "loss": 0.8762, "step": 1069 }, { "epoch": 0.15, "learning_rate": 1.9270958176455866e-05, "loss": 0.8772, "step": 1070 }, { "epoch": 0.15, "learning_rate": 1.9269270934914797e-05, "loss": 0.9285, "step": 1071 }, { "epoch": 0.15, "learning_rate": 1.9267581817251065e-05, "loss": 0.9441, "step": 1072 }, { "epoch": 0.15, "learning_rate": 1.926589082380655e-05, "loss": 0.9036, "step": 1073 }, { "epoch": 0.15, "learning_rate": 1.926419795492351e-05, "loss": 0.9106, "step": 1074 }, { "epoch": 0.15, "learning_rate": 1.9262503210944583e-05, "loss": 0.9282, "step": 1075 }, { "epoch": 0.15, "learning_rate": 1.9260806592212796e-05, "loss": 0.926, "step": 1076 }, { "epoch": 0.15, "learning_rate": 1.9259108099071544e-05, "loss": 0.9426, "step": 1077 }, { "epoch": 0.15, "learning_rate": 1.9257407731864607e-05, "loss": 0.9146, "step": 1078 }, { "epoch": 0.15, "learning_rate": 1.925570549093615e-05, "loss": 0.8828, "step": 1079 }, { "epoch": 0.15, "learning_rate": 1.9254001376630698e-05, "loss": 0.8796, "step": 1080 }, { "epoch": 0.15, "learning_rate": 1.9252295389293176e-05, "loss": 0.9478, "step": 1081 }, { "epoch": 0.15, "learning_rate": 1.9250587529268882e-05, "loss": 0.8551, "step": 1082 }, { "epoch": 0.15, "learning_rate": 1.9248877796903483e-05, "loss": 0.9238, "step": 1083 }, { "epoch": 0.15, "learning_rate": 1.9247166192543038e-05, "loss": 0.9429, "step": 1084 }, { "epoch": 0.15, "learning_rate": 1.924545271653398e-05, "loss": 0.9185, "step": 1085 }, { "epoch": 0.15, "learning_rate": 1.924373736922312e-05, "loss": 0.6583, "step": 1086 }, { "epoch": 0.15, "learning_rate": 1.924202015095765e-05, "loss": 0.8536, "step": 1087 }, { "epoch": 0.15, "learning_rate": 1.9240301062085135e-05, "loss": 0.8979, "step": 1088 }, { "epoch": 0.15, "learning_rate": 1.9238580102953525e-05, "loss": 0.9978, "step": 1089 }, { "epoch": 0.15, "learning_rate": 1.923685727391115e-05, "loss": 0.917, "step": 1090 }, { "epoch": 0.15, "learning_rate": 1.9235132575306705e-05, "loss": 0.9004, "step": 1091 }, { "epoch": 0.15, "learning_rate": 1.9233406007489283e-05, "loss": 0.8723, "step": 1092 }, { "epoch": 0.15, "learning_rate": 1.9231677570808342e-05, "loss": 0.5665, "step": 1093 }, { "epoch": 0.15, "learning_rate": 1.9229947265613722e-05, "loss": 0.6462, "step": 1094 }, { "epoch": 0.15, "learning_rate": 1.9228215092255638e-05, "loss": 0.9194, "step": 1095 }, { "epoch": 0.15, "learning_rate": 1.922648105108469e-05, "loss": 0.9382, "step": 1096 }, { "epoch": 0.15, "learning_rate": 1.922474514245185e-05, "loss": 0.9031, "step": 1097 }, { "epoch": 0.15, "learning_rate": 1.922300736670847e-05, "loss": 0.8987, "step": 1098 }, { "epoch": 0.15, "learning_rate": 1.922126772420628e-05, "loss": 0.8936, "step": 1099 }, { "epoch": 0.15, "learning_rate": 1.9219526215297387e-05, "loss": 0.8674, "step": 1100 }, { "epoch": 0.15, "learning_rate": 1.9217782840334284e-05, "loss": 0.918, "step": 1101 }, { "epoch": 0.15, "learning_rate": 1.921603759966982e-05, "loss": 0.8989, "step": 1102 }, { "epoch": 0.15, "learning_rate": 1.921429049365725e-05, "loss": 0.9062, "step": 1103 }, { "epoch": 0.15, "learning_rate": 1.9212541522650182e-05, "loss": 0.8733, "step": 1104 }, { "epoch": 0.15, "learning_rate": 1.921079068700262e-05, "loss": 0.9028, "step": 1105 }, { "epoch": 0.15, "learning_rate": 1.9209037987068933e-05, "loss": 0.9783, "step": 1106 }, { "epoch": 0.15, "learning_rate": 1.9207283423203873e-05, "loss": 0.9424, "step": 1107 }, { "epoch": 0.15, "learning_rate": 1.9205526995762567e-05, "loss": 0.8958, "step": 1108 }, { "epoch": 0.15, "learning_rate": 1.920376870510052e-05, "loss": 0.5997, "step": 1109 }, { "epoch": 0.15, "learning_rate": 1.9202008551573614e-05, "loss": 0.6161, "step": 1110 }, { "epoch": 0.15, "learning_rate": 1.920024653553811e-05, "loss": 0.9448, "step": 1111 }, { "epoch": 0.15, "learning_rate": 1.9198482657350642e-05, "loss": 0.9207, "step": 1112 }, { "epoch": 0.15, "learning_rate": 1.9196716917368228e-05, "loss": 0.9529, "step": 1113 }, { "epoch": 0.15, "learning_rate": 1.9194949315948252e-05, "loss": 0.9329, "step": 1114 }, { "epoch": 0.15, "learning_rate": 1.9193179853448484e-05, "loss": 0.8833, "step": 1115 }, { "epoch": 0.16, "learning_rate": 1.9191408530227066e-05, "loss": 0.6733, "step": 1116 }, { "epoch": 0.16, "learning_rate": 1.918963534664252e-05, "loss": 0.9114, "step": 1117 }, { "epoch": 0.16, "learning_rate": 1.918786030305374e-05, "loss": 0.9263, "step": 1118 }, { "epoch": 0.16, "learning_rate": 1.9186083399819998e-05, "loss": 0.9453, "step": 1119 }, { "epoch": 0.16, "learning_rate": 1.9184304637300952e-05, "loss": 0.9016, "step": 1120 }, { "epoch": 0.16, "learning_rate": 1.9182524015856616e-05, "loss": 0.9531, "step": 1121 }, { "epoch": 0.16, "learning_rate": 1.91807415358474e-05, "loss": 0.9766, "step": 1122 }, { "epoch": 0.16, "learning_rate": 1.917895719763408e-05, "loss": 0.8367, "step": 1123 }, { "epoch": 0.16, "learning_rate": 1.917717100157781e-05, "loss": 0.9214, "step": 1124 }, { "epoch": 0.16, "learning_rate": 1.9175382948040125e-05, "loss": 0.8491, "step": 1125 }, { "epoch": 0.16, "learning_rate": 1.917359303738292e-05, "loss": 0.8491, "step": 1126 }, { "epoch": 0.16, "learning_rate": 1.917180126996849e-05, "loss": 0.6193, "step": 1127 }, { "epoch": 0.16, "learning_rate": 1.9170007646159484e-05, "loss": 0.915, "step": 1128 }, { "epoch": 0.16, "learning_rate": 1.916821216631894e-05, "loss": 0.9104, "step": 1129 }, { "epoch": 0.16, "learning_rate": 1.9166414830810266e-05, "loss": 0.9446, "step": 1130 }, { "epoch": 0.16, "learning_rate": 1.9164615639997248e-05, "loss": 0.9062, "step": 1131 }, { "epoch": 0.16, "learning_rate": 1.9162814594244045e-05, "loss": 0.947, "step": 1132 }, { "epoch": 0.16, "learning_rate": 1.9161011693915196e-05, "loss": 0.8818, "step": 1133 }, { "epoch": 0.16, "learning_rate": 1.915920693937561e-05, "loss": 0.866, "step": 1134 }, { "epoch": 0.16, "learning_rate": 1.9157400330990573e-05, "loss": 0.9424, "step": 1135 }, { "epoch": 0.16, "learning_rate": 1.915559186912575e-05, "loss": 0.9368, "step": 1136 }, { "epoch": 0.16, "learning_rate": 1.9153781554147173e-05, "loss": 0.8994, "step": 1137 }, { "epoch": 0.16, "learning_rate": 1.9151969386421256e-05, "loss": 0.8923, "step": 1138 }, { "epoch": 0.16, "learning_rate": 1.915015536631479e-05, "loss": 0.659, "step": 1139 }, { "epoch": 0.16, "learning_rate": 1.9148339494194933e-05, "loss": 0.9658, "step": 1140 }, { "epoch": 0.16, "learning_rate": 1.9146521770429223e-05, "loss": 0.9399, "step": 1141 }, { "epoch": 0.16, "learning_rate": 1.9144702195385573e-05, "loss": 0.8855, "step": 1142 }, { "epoch": 0.16, "learning_rate": 1.9142880769432266e-05, "loss": 0.9341, "step": 1143 }, { "epoch": 0.16, "learning_rate": 1.9141057492937964e-05, "loss": 0.929, "step": 1144 }, { "epoch": 0.16, "learning_rate": 1.9139232366271706e-05, "loss": 0.9512, "step": 1145 }, { "epoch": 0.16, "learning_rate": 1.91374053898029e-05, "loss": 0.9031, "step": 1146 }, { "epoch": 0.16, "learning_rate": 1.9135576563901327e-05, "loss": 0.9988, "step": 1147 }, { "epoch": 0.16, "learning_rate": 1.913374588893715e-05, "loss": 0.9155, "step": 1148 }, { "epoch": 0.16, "learning_rate": 1.91319133652809e-05, "loss": 0.9175, "step": 1149 }, { "epoch": 0.16, "learning_rate": 1.9130078993303484e-05, "loss": 0.8875, "step": 1150 }, { "epoch": 0.16, "learning_rate": 1.9128242773376188e-05, "loss": 0.896, "step": 1151 }, { "epoch": 0.16, "learning_rate": 1.912640470587066e-05, "loss": 0.901, "step": 1152 }, { "epoch": 0.16, "learning_rate": 1.9124564791158935e-05, "loss": 0.9004, "step": 1153 }, { "epoch": 0.16, "learning_rate": 1.9122723029613412e-05, "loss": 0.6396, "step": 1154 }, { "epoch": 0.16, "learning_rate": 1.912087942160687e-05, "loss": 0.9641, "step": 1155 }, { "epoch": 0.16, "learning_rate": 1.9119033967512462e-05, "loss": 0.9453, "step": 1156 }, { "epoch": 0.16, "learning_rate": 1.9117186667703708e-05, "loss": 0.9712, "step": 1157 }, { "epoch": 0.16, "learning_rate": 1.9115337522554508e-05, "loss": 0.8936, "step": 1158 }, { "epoch": 0.16, "learning_rate": 1.911348653243913e-05, "loss": 0.6582, "step": 1159 }, { "epoch": 0.16, "learning_rate": 1.9111633697732225e-05, "loss": 0.9482, "step": 1160 }, { "epoch": 0.16, "learning_rate": 1.910977901880881e-05, "loss": 0.8599, "step": 1161 }, { "epoch": 0.16, "learning_rate": 1.9107922496044273e-05, "loss": 0.8552, "step": 1162 }, { "epoch": 0.16, "learning_rate": 1.910606412981438e-05, "loss": 0.8586, "step": 1163 }, { "epoch": 0.16, "learning_rate": 1.910420392049527e-05, "loss": 0.8606, "step": 1164 }, { "epoch": 0.16, "learning_rate": 1.910234186846345e-05, "loss": 0.9158, "step": 1165 }, { "epoch": 0.16, "learning_rate": 1.910047797409581e-05, "loss": 0.874, "step": 1166 }, { "epoch": 0.16, "learning_rate": 1.9098612237769602e-05, "loss": 0.801, "step": 1167 }, { "epoch": 0.16, "learning_rate": 1.9096744659862457e-05, "loss": 0.9141, "step": 1168 }, { "epoch": 0.16, "learning_rate": 1.909487524075238e-05, "loss": 0.8591, "step": 1169 }, { "epoch": 0.16, "learning_rate": 1.909300398081774e-05, "loss": 0.8623, "step": 1170 }, { "epoch": 0.16, "learning_rate": 1.9091130880437284e-05, "loss": 0.8723, "step": 1171 }, { "epoch": 0.16, "learning_rate": 1.908925593999014e-05, "loss": 0.6192, "step": 1172 }, { "epoch": 0.16, "learning_rate": 1.9087379159855797e-05, "loss": 0.908, "step": 1173 }, { "epoch": 0.16, "learning_rate": 1.9085500540414117e-05, "loss": 0.928, "step": 1174 }, { "epoch": 0.16, "learning_rate": 1.908362008204534e-05, "loss": 0.8904, "step": 1175 }, { "epoch": 0.16, "learning_rate": 1.9081737785130074e-05, "loss": 0.8992, "step": 1176 }, { "epoch": 0.16, "learning_rate": 1.90798536500493e-05, "loss": 0.8967, "step": 1177 }, { "epoch": 0.16, "learning_rate": 1.907796767718437e-05, "loss": 0.8596, "step": 1178 }, { "epoch": 0.16, "learning_rate": 1.9076079866917013e-05, "loss": 0.9448, "step": 1179 }, { "epoch": 0.16, "learning_rate": 1.9074190219629328e-05, "loss": 0.602, "step": 1180 }, { "epoch": 0.16, "learning_rate": 1.9072298735703776e-05, "loss": 0.9856, "step": 1181 }, { "epoch": 0.16, "learning_rate": 1.9070405415523207e-05, "loss": 0.936, "step": 1182 }, { "epoch": 0.16, "learning_rate": 1.9068510259470826e-05, "loss": 0.3362, "step": 1183 }, { "epoch": 0.16, "learning_rate": 1.9066613267930223e-05, "loss": 0.8896, "step": 1184 }, { "epoch": 0.16, "learning_rate": 1.906471444128535e-05, "loss": 0.8533, "step": 1185 }, { "epoch": 0.16, "learning_rate": 1.9062813779920537e-05, "loss": 0.9355, "step": 1186 }, { "epoch": 0.16, "learning_rate": 1.9060911284220478e-05, "loss": 0.9285, "step": 1187 }, { "epoch": 0.17, "learning_rate": 1.9059006954570246e-05, "loss": 0.9458, "step": 1188 }, { "epoch": 0.17, "learning_rate": 1.905710079135528e-05, "loss": 0.8513, "step": 1189 }, { "epoch": 0.17, "learning_rate": 1.90551927949614e-05, "loss": 0.8916, "step": 1190 }, { "epoch": 0.17, "learning_rate": 1.9053282965774773e-05, "loss": 0.9231, "step": 1191 }, { "epoch": 0.17, "learning_rate": 1.905137130418197e-05, "loss": 0.9297, "step": 1192 }, { "epoch": 0.17, "learning_rate": 1.90494578105699e-05, "loss": 0.9382, "step": 1193 }, { "epoch": 0.17, "learning_rate": 1.9047542485325872e-05, "loss": 0.9197, "step": 1194 }, { "epoch": 0.17, "learning_rate": 1.9045625328837548e-05, "loss": 0.8997, "step": 1195 }, { "epoch": 0.17, "learning_rate": 1.9043706341492962e-05, "loss": 0.906, "step": 1196 }, { "epoch": 0.17, "learning_rate": 1.904178552368053e-05, "loss": 0.8975, "step": 1197 }, { "epoch": 0.17, "learning_rate": 1.9039862875789014e-05, "loss": 0.9155, "step": 1198 }, { "epoch": 0.17, "learning_rate": 1.903793839820758e-05, "loss": 0.9805, "step": 1199 }, { "epoch": 0.17, "learning_rate": 1.903601209132574e-05, "loss": 0.9153, "step": 1200 }, { "epoch": 0.17, "learning_rate": 1.9034083955533377e-05, "loss": 0.958, "step": 1201 }, { "epoch": 0.17, "learning_rate": 1.903215399122076e-05, "loss": 0.9133, "step": 1202 }, { "epoch": 0.17, "learning_rate": 1.903022219877851e-05, "loss": 0.9082, "step": 1203 }, { "epoch": 0.17, "learning_rate": 1.9028288578597635e-05, "loss": 0.8455, "step": 1204 }, { "epoch": 0.17, "learning_rate": 1.9026353131069498e-05, "loss": 0.9146, "step": 1205 }, { "epoch": 0.17, "learning_rate": 1.9024415856585844e-05, "loss": 0.9314, "step": 1206 }, { "epoch": 0.17, "learning_rate": 1.9022476755538777e-05, "loss": 0.937, "step": 1207 }, { "epoch": 0.17, "learning_rate": 1.9020535828320774e-05, "loss": 0.8748, "step": 1208 }, { "epoch": 0.17, "learning_rate": 1.901859307532469e-05, "loss": 0.9219, "step": 1209 }, { "epoch": 0.17, "learning_rate": 1.901664849694374e-05, "loss": 0.887, "step": 1210 }, { "epoch": 0.17, "learning_rate": 1.9014702093571508e-05, "loss": 0.9597, "step": 1211 }, { "epoch": 0.17, "learning_rate": 1.9012753865601953e-05, "loss": 0.8989, "step": 1212 }, { "epoch": 0.17, "learning_rate": 1.9010803813429405e-05, "loss": 0.9058, "step": 1213 }, { "epoch": 0.17, "learning_rate": 1.900885193744855e-05, "loss": 0.95, "step": 1214 }, { "epoch": 0.17, "learning_rate": 1.900689823805446e-05, "loss": 0.8875, "step": 1215 }, { "epoch": 0.17, "learning_rate": 1.900494271564257e-05, "loss": 0.5833, "step": 1216 }, { "epoch": 0.17, "learning_rate": 1.9002985370608675e-05, "loss": 0.886, "step": 1217 }, { "epoch": 0.17, "learning_rate": 1.9001026203348952e-05, "loss": 0.8533, "step": 1218 }, { "epoch": 0.17, "learning_rate": 1.899906521425994e-05, "loss": 0.9038, "step": 1219 }, { "epoch": 0.17, "learning_rate": 1.8997102403738543e-05, "loss": 1.0034, "step": 1220 }, { "epoch": 0.17, "learning_rate": 1.8995137772182047e-05, "loss": 0.9182, "step": 1221 }, { "epoch": 0.17, "learning_rate": 1.8993171319988092e-05, "loss": 0.9045, "step": 1222 }, { "epoch": 0.17, "learning_rate": 1.8991203047554693e-05, "loss": 0.9062, "step": 1223 }, { "epoch": 0.17, "learning_rate": 1.898923295528024e-05, "loss": 0.8997, "step": 1224 }, { "epoch": 0.17, "learning_rate": 1.8987261043563474e-05, "loss": 0.9868, "step": 1225 }, { "epoch": 0.17, "learning_rate": 1.898528731280352e-05, "loss": 0.9099, "step": 1226 }, { "epoch": 0.17, "learning_rate": 1.8983311763399867e-05, "loss": 0.9236, "step": 1227 }, { "epoch": 0.17, "learning_rate": 1.898133439575237e-05, "loss": 0.6219, "step": 1228 }, { "epoch": 0.17, "learning_rate": 1.897935521026125e-05, "loss": 0.9744, "step": 1229 }, { "epoch": 0.17, "learning_rate": 1.8977374207327104e-05, "loss": 0.9231, "step": 1230 }, { "epoch": 0.17, "learning_rate": 1.897539138735089e-05, "loss": 0.8716, "step": 1231 }, { "epoch": 0.17, "learning_rate": 1.897340675073393e-05, "loss": 0.887, "step": 1232 }, { "epoch": 0.17, "learning_rate": 1.8971420297877927e-05, "loss": 0.9497, "step": 1233 }, { "epoch": 0.17, "learning_rate": 1.896943202918494e-05, "loss": 0.9202, "step": 1234 }, { "epoch": 0.17, "learning_rate": 1.89674419450574e-05, "loss": 0.5646, "step": 1235 }, { "epoch": 0.17, "learning_rate": 1.8965450045898103e-05, "loss": 0.8928, "step": 1236 }, { "epoch": 0.17, "learning_rate": 1.8963456332110216e-05, "loss": 0.9324, "step": 1237 }, { "epoch": 0.17, "learning_rate": 1.8961460804097276e-05, "loss": 0.947, "step": 1238 }, { "epoch": 0.17, "learning_rate": 1.8959463462263175e-05, "loss": 0.9438, "step": 1239 }, { "epoch": 0.17, "learning_rate": 1.895746430701218e-05, "loss": 0.9104, "step": 1240 }, { "epoch": 0.17, "learning_rate": 1.895546333874893e-05, "loss": 0.8633, "step": 1241 }, { "epoch": 0.17, "learning_rate": 1.8953460557878425e-05, "loss": 0.615, "step": 1242 }, { "epoch": 0.17, "learning_rate": 1.8951455964806028e-05, "loss": 0.906, "step": 1243 }, { "epoch": 0.17, "learning_rate": 1.8949449559937482e-05, "loss": 0.937, "step": 1244 }, { "epoch": 0.17, "learning_rate": 1.8947441343678875e-05, "loss": 0.9243, "step": 1245 }, { "epoch": 0.17, "learning_rate": 1.8945431316436687e-05, "loss": 0.9236, "step": 1246 }, { "epoch": 0.17, "learning_rate": 1.8943419478617747e-05, "loss": 0.9404, "step": 1247 }, { "epoch": 0.17, "learning_rate": 1.8941405830629255e-05, "loss": 0.918, "step": 1248 }, { "epoch": 0.17, "learning_rate": 1.8939390372878784e-05, "loss": 0.9482, "step": 1249 }, { "epoch": 0.17, "learning_rate": 1.8937373105774258e-05, "loss": 0.9016, "step": 1250 }, { "epoch": 0.17, "learning_rate": 1.8935354029723984e-05, "loss": 0.9216, "step": 1251 }, { "epoch": 0.17, "learning_rate": 1.8933333145136626e-05, "loss": 0.8796, "step": 1252 }, { "epoch": 0.17, "learning_rate": 1.8931310452421216e-05, "loss": 0.896, "step": 1253 }, { "epoch": 0.17, "learning_rate": 1.892928595198715e-05, "loss": 0.8865, "step": 1254 }, { "epoch": 0.17, "learning_rate": 1.8927259644244195e-05, "loss": 0.95, "step": 1255 }, { "epoch": 0.17, "learning_rate": 1.892523152960248e-05, "loss": 0.9282, "step": 1256 }, { "epoch": 0.17, "learning_rate": 1.8923201608472496e-05, "loss": 0.896, "step": 1257 }, { "epoch": 0.17, "learning_rate": 1.8921169881265106e-05, "loss": 0.8777, "step": 1258 }, { "epoch": 0.17, "learning_rate": 1.891913634839154e-05, "loss": 0.9624, "step": 1259 }, { "epoch": 0.18, "learning_rate": 1.8917101010263388e-05, "loss": 0.9597, "step": 1260 }, { "epoch": 0.18, "learning_rate": 1.8915063867292603e-05, "loss": 0.9043, "step": 1261 }, { "epoch": 0.18, "learning_rate": 1.8913024919891515e-05, "loss": 0.8845, "step": 1262 }, { "epoch": 0.18, "learning_rate": 1.891098416847281e-05, "loss": 0.9263, "step": 1263 }, { "epoch": 0.18, "learning_rate": 1.8908941613449534e-05, "loss": 0.896, "step": 1264 }, { "epoch": 0.18, "learning_rate": 1.8906897255235112e-05, "loss": 0.9358, "step": 1265 }, { "epoch": 0.18, "learning_rate": 1.8904851094243324e-05, "loss": 0.9397, "step": 1266 }, { "epoch": 0.18, "learning_rate": 1.890280313088832e-05, "loss": 0.9421, "step": 1267 }, { "epoch": 0.18, "learning_rate": 1.8900753365584612e-05, "loss": 0.8212, "step": 1268 }, { "epoch": 0.18, "learning_rate": 1.889870179874708e-05, "loss": 0.9351, "step": 1269 }, { "epoch": 0.18, "learning_rate": 1.8896648430790958e-05, "loss": 0.8992, "step": 1270 }, { "epoch": 0.18, "learning_rate": 1.889459326213186e-05, "loss": 0.9385, "step": 1271 }, { "epoch": 0.18, "learning_rate": 1.8892536293185758e-05, "loss": 0.9094, "step": 1272 }, { "epoch": 0.18, "learning_rate": 1.889047752436898e-05, "loss": 0.8794, "step": 1273 }, { "epoch": 0.18, "learning_rate": 1.888841695609823e-05, "loss": 0.8816, "step": 1274 }, { "epoch": 0.18, "learning_rate": 1.8886354588790576e-05, "loss": 0.6218, "step": 1275 }, { "epoch": 0.18, "learning_rate": 1.888429042286344e-05, "loss": 0.6294, "step": 1276 }, { "epoch": 0.18, "learning_rate": 1.8882224458734612e-05, "loss": 0.969, "step": 1277 }, { "epoch": 0.18, "learning_rate": 1.8880156696822254e-05, "loss": 0.9109, "step": 1278 }, { "epoch": 0.18, "learning_rate": 1.887808713754489e-05, "loss": 0.9297, "step": 1279 }, { "epoch": 0.18, "learning_rate": 1.8876015781321393e-05, "loss": 0.9041, "step": 1280 }, { "epoch": 0.18, "learning_rate": 1.8873942628571018e-05, "loss": 0.8931, "step": 1281 }, { "epoch": 0.18, "learning_rate": 1.887186767971337e-05, "loss": 0.9409, "step": 1282 }, { "epoch": 0.18, "learning_rate": 1.8869790935168432e-05, "loss": 0.9414, "step": 1283 }, { "epoch": 0.18, "learning_rate": 1.8867712395356536e-05, "loss": 0.8965, "step": 1284 }, { "epoch": 0.18, "learning_rate": 1.8865632060698383e-05, "loss": 0.8889, "step": 1285 }, { "epoch": 0.18, "learning_rate": 1.8863549931615042e-05, "loss": 0.8994, "step": 1286 }, { "epoch": 0.18, "learning_rate": 1.8861466008527937e-05, "loss": 0.9414, "step": 1287 }, { "epoch": 0.18, "learning_rate": 1.885938029185886e-05, "loss": 0.8674, "step": 1288 }, { "epoch": 0.18, "learning_rate": 1.8857292782029963e-05, "loss": 0.929, "step": 1289 }, { "epoch": 0.18, "learning_rate": 1.885520347946377e-05, "loss": 0.9026, "step": 1290 }, { "epoch": 0.18, "learning_rate": 1.8853112384583153e-05, "loss": 0.801, "step": 1291 }, { "epoch": 0.18, "learning_rate": 1.885101949781136e-05, "loss": 0.8862, "step": 1292 }, { "epoch": 0.18, "learning_rate": 1.8848924819571994e-05, "loss": 0.8643, "step": 1293 }, { "epoch": 0.18, "learning_rate": 1.8846828350289022e-05, "loss": 0.9465, "step": 1294 }, { "epoch": 0.18, "learning_rate": 1.884473009038678e-05, "loss": 0.9504, "step": 1295 }, { "epoch": 0.18, "learning_rate": 1.8842630040289952e-05, "loss": 0.9348, "step": 1296 }, { "epoch": 0.18, "learning_rate": 1.8840528200423594e-05, "loss": 0.9185, "step": 1297 }, { "epoch": 0.18, "learning_rate": 1.8838424571213136e-05, "loss": 0.9109, "step": 1298 }, { "epoch": 0.18, "learning_rate": 1.8836319153084342e-05, "loss": 0.6053, "step": 1299 }, { "epoch": 0.18, "learning_rate": 1.8834211946463363e-05, "loss": 0.9233, "step": 1300 }, { "epoch": 0.18, "learning_rate": 1.88321029517767e-05, "loss": 0.9175, "step": 1301 }, { "epoch": 0.18, "learning_rate": 1.8829992169451217e-05, "loss": 0.9607, "step": 1302 }, { "epoch": 0.18, "learning_rate": 1.8827879599914143e-05, "loss": 0.8658, "step": 1303 }, { "epoch": 0.18, "learning_rate": 1.882576524359307e-05, "loss": 0.929, "step": 1304 }, { "epoch": 0.18, "learning_rate": 1.882364910091594e-05, "loss": 0.9363, "step": 1305 }, { "epoch": 0.18, "learning_rate": 1.882153117231108e-05, "loss": 0.9817, "step": 1306 }, { "epoch": 0.18, "learning_rate": 1.8819411458207147e-05, "loss": 0.8445, "step": 1307 }, { "epoch": 0.18, "learning_rate": 1.8817289959033187e-05, "loss": 0.8894, "step": 1308 }, { "epoch": 0.18, "learning_rate": 1.8815166675218595e-05, "loss": 0.912, "step": 1309 }, { "epoch": 0.18, "learning_rate": 1.8813041607193125e-05, "loss": 0.8806, "step": 1310 }, { "epoch": 0.18, "learning_rate": 1.88109147553869e-05, "loss": 0.5875, "step": 1311 }, { "epoch": 0.18, "learning_rate": 1.88087861202304e-05, "loss": 0.8806, "step": 1312 }, { "epoch": 0.18, "learning_rate": 1.880665570215446e-05, "loss": 0.9812, "step": 1313 }, { "epoch": 0.18, "learning_rate": 1.880452350159029e-05, "loss": 0.9612, "step": 1314 }, { "epoch": 0.18, "learning_rate": 1.8802389518969445e-05, "loss": 0.9097, "step": 1315 }, { "epoch": 0.18, "learning_rate": 1.8800253754723857e-05, "loss": 0.9314, "step": 1316 }, { "epoch": 0.18, "learning_rate": 1.8798116209285798e-05, "loss": 0.9685, "step": 1317 }, { "epoch": 0.18, "learning_rate": 1.8795976883087923e-05, "loss": 0.8999, "step": 1318 }, { "epoch": 0.18, "learning_rate": 1.879383577656323e-05, "loss": 0.9307, "step": 1319 }, { "epoch": 0.18, "learning_rate": 1.8791692890145084e-05, "loss": 0.9299, "step": 1320 }, { "epoch": 0.18, "learning_rate": 1.878954822426722e-05, "loss": 0.9077, "step": 1321 }, { "epoch": 0.18, "learning_rate": 1.878740177936371e-05, "loss": 0.9075, "step": 1322 }, { "epoch": 0.18, "learning_rate": 1.8785253555869013e-05, "loss": 0.9124, "step": 1323 }, { "epoch": 0.18, "learning_rate": 1.878310355421792e-05, "loss": 0.8373, "step": 1324 }, { "epoch": 0.18, "learning_rate": 1.878095177484561e-05, "loss": 0.8855, "step": 1325 }, { "epoch": 0.18, "learning_rate": 1.8778798218187598e-05, "loss": 0.6116, "step": 1326 }, { "epoch": 0.18, "learning_rate": 1.8776642884679778e-05, "loss": 0.9299, "step": 1327 }, { "epoch": 0.18, "learning_rate": 1.8774485774758387e-05, "loss": 0.6178, "step": 1328 }, { "epoch": 0.18, "learning_rate": 1.877232688886003e-05, "loss": 0.9824, "step": 1329 }, { "epoch": 0.18, "learning_rate": 1.877016622742168e-05, "loss": 0.9143, "step": 1330 }, { "epoch": 0.18, "learning_rate": 1.876800379088065e-05, "loss": 0.9614, "step": 1331 }, { "epoch": 0.19, "learning_rate": 1.8765839579674623e-05, "loss": 0.9788, "step": 1332 }, { "epoch": 0.19, "learning_rate": 1.8763673594241643e-05, "loss": 0.905, "step": 1333 }, { "epoch": 0.19, "learning_rate": 1.8761505835020113e-05, "loss": 0.662, "step": 1334 }, { "epoch": 0.19, "learning_rate": 1.875933630244879e-05, "loss": 0.8723, "step": 1335 }, { "epoch": 0.19, "learning_rate": 1.875716499696679e-05, "loss": 0.6104, "step": 1336 }, { "epoch": 0.19, "learning_rate": 1.8754991919013598e-05, "loss": 0.6065, "step": 1337 }, { "epoch": 0.19, "learning_rate": 1.8752817069029042e-05, "loss": 0.9158, "step": 1338 }, { "epoch": 0.19, "learning_rate": 1.8750640447453322e-05, "loss": 0.9316, "step": 1339 }, { "epoch": 0.19, "learning_rate": 1.874846205472699e-05, "loss": 0.9775, "step": 1340 }, { "epoch": 0.19, "learning_rate": 1.8746281891290956e-05, "loss": 0.9001, "step": 1341 }, { "epoch": 0.19, "learning_rate": 1.874409995758649e-05, "loss": 0.9194, "step": 1342 }, { "epoch": 0.19, "learning_rate": 1.8741916254055228e-05, "loss": 0.6205, "step": 1343 }, { "epoch": 0.19, "learning_rate": 1.873973078113915e-05, "loss": 0.9075, "step": 1344 }, { "epoch": 0.19, "learning_rate": 1.8737543539280598e-05, "loss": 0.9382, "step": 1345 }, { "epoch": 0.19, "learning_rate": 1.873535452892228e-05, "loss": 0.8977, "step": 1346 }, { "epoch": 0.19, "learning_rate": 1.8733163750507262e-05, "loss": 0.938, "step": 1347 }, { "epoch": 0.19, "learning_rate": 1.8730971204478956e-05, "loss": 0.915, "step": 1348 }, { "epoch": 0.19, "learning_rate": 1.872877689128114e-05, "loss": 0.8811, "step": 1349 }, { "epoch": 0.19, "learning_rate": 1.8726580811357942e-05, "loss": 0.8765, "step": 1350 }, { "epoch": 0.19, "learning_rate": 1.8724382965153864e-05, "loss": 0.9094, "step": 1351 }, { "epoch": 0.19, "learning_rate": 1.8722183353113753e-05, "loss": 0.8872, "step": 1352 }, { "epoch": 0.19, "learning_rate": 1.871998197568281e-05, "loss": 0.8802, "step": 1353 }, { "epoch": 0.19, "learning_rate": 1.8717778833306604e-05, "loss": 0.9255, "step": 1354 }, { "epoch": 0.19, "learning_rate": 1.8715573926431058e-05, "loss": 0.9446, "step": 1355 }, { "epoch": 0.19, "learning_rate": 1.8713367255502443e-05, "loss": 0.9148, "step": 1356 }, { "epoch": 0.19, "learning_rate": 1.8711158820967402e-05, "loss": 0.9126, "step": 1357 }, { "epoch": 0.19, "learning_rate": 1.8708948623272925e-05, "loss": 0.9497, "step": 1358 }, { "epoch": 0.19, "learning_rate": 1.870673666286636e-05, "loss": 0.9749, "step": 1359 }, { "epoch": 0.19, "learning_rate": 1.8704522940195418e-05, "loss": 0.6108, "step": 1360 }, { "epoch": 0.19, "learning_rate": 1.8702307455708152e-05, "loss": 0.9048, "step": 1361 }, { "epoch": 0.19, "learning_rate": 1.870009020985299e-05, "loss": 0.8589, "step": 1362 }, { "epoch": 0.19, "learning_rate": 1.8697871203078707e-05, "loss": 0.9194, "step": 1363 }, { "epoch": 0.19, "learning_rate": 1.8695650435834428e-05, "loss": 0.9104, "step": 1364 }, { "epoch": 0.19, "learning_rate": 1.8693427908569654e-05, "loss": 0.8987, "step": 1365 }, { "epoch": 0.19, "learning_rate": 1.8691203621734218e-05, "loss": 0.804, "step": 1366 }, { "epoch": 0.19, "learning_rate": 1.8688977575778327e-05, "loss": 0.8926, "step": 1367 }, { "epoch": 0.19, "learning_rate": 1.8686749771152537e-05, "loss": 0.9341, "step": 1368 }, { "epoch": 0.19, "learning_rate": 1.868452020830776e-05, "loss": 0.6069, "step": 1369 }, { "epoch": 0.19, "learning_rate": 1.8682288887695268e-05, "loss": 0.864, "step": 1370 }, { "epoch": 0.19, "learning_rate": 1.868005580976668e-05, "loss": 0.8669, "step": 1371 }, { "epoch": 0.19, "learning_rate": 1.8677820974973985e-05, "loss": 0.8599, "step": 1372 }, { "epoch": 0.19, "learning_rate": 1.8675584383769508e-05, "loss": 0.8787, "step": 1373 }, { "epoch": 0.19, "learning_rate": 1.8673346036605947e-05, "loss": 0.9243, "step": 1374 }, { "epoch": 0.19, "learning_rate": 1.867110593393635e-05, "loss": 0.95, "step": 1375 }, { "epoch": 0.19, "learning_rate": 1.8668864076214115e-05, "loss": 0.9683, "step": 1376 }, { "epoch": 0.19, "learning_rate": 1.8666620463893003e-05, "loss": 0.9578, "step": 1377 }, { "epoch": 0.19, "learning_rate": 1.8664375097427124e-05, "loss": 0.98, "step": 1378 }, { "epoch": 0.19, "learning_rate": 1.8662127977270947e-05, "loss": 0.8552, "step": 1379 }, { "epoch": 0.19, "learning_rate": 1.8659879103879294e-05, "loss": 0.5891, "step": 1380 }, { "epoch": 0.19, "learning_rate": 1.8657628477707343e-05, "loss": 0.8511, "step": 1381 }, { "epoch": 0.19, "learning_rate": 1.8655376099210623e-05, "loss": 0.9224, "step": 1382 }, { "epoch": 0.19, "learning_rate": 1.8653121968845027e-05, "loss": 0.9158, "step": 1383 }, { "epoch": 0.19, "learning_rate": 1.8650866087066793e-05, "loss": 0.8997, "step": 1384 }, { "epoch": 0.19, "learning_rate": 1.8648608454332513e-05, "loss": 0.9033, "step": 1385 }, { "epoch": 0.19, "learning_rate": 1.864634907109914e-05, "loss": 0.9324, "step": 1386 }, { "epoch": 0.19, "learning_rate": 1.8644087937823984e-05, "loss": 0.9016, "step": 1387 }, { "epoch": 0.19, "learning_rate": 1.8641825054964696e-05, "loss": 0.947, "step": 1388 }, { "epoch": 0.19, "learning_rate": 1.8639560422979296e-05, "loss": 0.8691, "step": 1389 }, { "epoch": 0.19, "learning_rate": 1.8637294042326144e-05, "loss": 0.8567, "step": 1390 }, { "epoch": 0.19, "learning_rate": 1.8635025913463965e-05, "loss": 0.9363, "step": 1391 }, { "epoch": 0.19, "learning_rate": 1.863275603685183e-05, "loss": 0.8955, "step": 1392 }, { "epoch": 0.19, "learning_rate": 1.8630484412949172e-05, "loss": 0.7911, "step": 1393 }, { "epoch": 0.19, "learning_rate": 1.8628211042215772e-05, "loss": 0.8452, "step": 1394 }, { "epoch": 0.19, "learning_rate": 1.8625935925111766e-05, "loss": 0.8706, "step": 1395 }, { "epoch": 0.19, "learning_rate": 1.8623659062097643e-05, "loss": 0.8882, "step": 1396 }, { "epoch": 0.19, "learning_rate": 1.862138045363424e-05, "loss": 0.8987, "step": 1397 }, { "epoch": 0.19, "learning_rate": 1.861910010018276e-05, "loss": 0.6302, "step": 1398 }, { "epoch": 0.19, "learning_rate": 1.861681800220475e-05, "loss": 0.8962, "step": 1399 }, { "epoch": 0.19, "learning_rate": 1.861453416016211e-05, "loss": 0.8708, "step": 1400 }, { "epoch": 0.19, "learning_rate": 1.8612248574517097e-05, "loss": 0.8613, "step": 1401 }, { "epoch": 0.19, "learning_rate": 1.860996124573232e-05, "loss": 0.8887, "step": 1402 }, { "epoch": 0.19, "learning_rate": 1.860767217427074e-05, "loss": 0.8823, "step": 1403 }, { "epoch": 0.2, "learning_rate": 1.860538136059567e-05, "loss": 0.947, "step": 1404 }, { "epoch": 0.2, "learning_rate": 1.8603088805170772e-05, "loss": 0.8506, "step": 1405 }, { "epoch": 0.2, "learning_rate": 1.860079450846007e-05, "loss": 0.6074, "step": 1406 }, { "epoch": 0.2, "learning_rate": 1.859849847092793e-05, "loss": 0.8822, "step": 1407 }, { "epoch": 0.2, "learning_rate": 1.8596200693039078e-05, "loss": 0.9038, "step": 1408 }, { "epoch": 0.2, "learning_rate": 1.8593901175258592e-05, "loss": 0.6552, "step": 1409 }, { "epoch": 0.2, "learning_rate": 1.85915999180519e-05, "loss": 0.9272, "step": 1410 }, { "epoch": 0.2, "learning_rate": 1.8589296921884782e-05, "loss": 0.6993, "step": 1411 }, { "epoch": 0.2, "learning_rate": 1.8586992187223367e-05, "loss": 0.8796, "step": 1412 }, { "epoch": 0.2, "learning_rate": 1.858468571453414e-05, "loss": 0.8721, "step": 1413 }, { "epoch": 0.2, "learning_rate": 1.8582377504283932e-05, "loss": 0.8352, "step": 1414 }, { "epoch": 0.2, "learning_rate": 1.858006755693994e-05, "loss": 0.8633, "step": 1415 }, { "epoch": 0.2, "learning_rate": 1.8577755872969696e-05, "loss": 0.8748, "step": 1416 }, { "epoch": 0.2, "learning_rate": 1.8575442452841096e-05, "loss": 0.8474, "step": 1417 }, { "epoch": 0.2, "learning_rate": 1.8573127297022373e-05, "loss": 0.9431, "step": 1418 }, { "epoch": 0.2, "learning_rate": 1.857081040598213e-05, "loss": 0.8936, "step": 1419 }, { "epoch": 0.2, "learning_rate": 1.85684917801893e-05, "loss": 0.9219, "step": 1420 }, { "epoch": 0.2, "learning_rate": 1.856617142011319e-05, "loss": 0.9519, "step": 1421 }, { "epoch": 0.2, "learning_rate": 1.856384932622344e-05, "loss": 0.6125, "step": 1422 }, { "epoch": 0.2, "learning_rate": 1.856152549899005e-05, "loss": 0.8845, "step": 1423 }, { "epoch": 0.2, "learning_rate": 1.8559199938883364e-05, "loss": 0.8916, "step": 1424 }, { "epoch": 0.2, "learning_rate": 1.8556872646374083e-05, "loss": 0.9561, "step": 1425 }, { "epoch": 0.2, "learning_rate": 1.855454362193326e-05, "loss": 0.9434, "step": 1426 }, { "epoch": 0.2, "learning_rate": 1.8552212866032294e-05, "loss": 0.9348, "step": 1427 }, { "epoch": 0.2, "learning_rate": 1.8549880379142934e-05, "loss": 0.8376, "step": 1428 }, { "epoch": 0.2, "learning_rate": 1.8547546161737276e-05, "loss": 0.9316, "step": 1429 }, { "epoch": 0.2, "learning_rate": 1.854521021428778e-05, "loss": 0.8784, "step": 1430 }, { "epoch": 0.2, "learning_rate": 1.8542872537267244e-05, "loss": 0.8784, "step": 1431 }, { "epoch": 0.2, "learning_rate": 1.854053313114882e-05, "loss": 0.9043, "step": 1432 }, { "epoch": 0.2, "learning_rate": 1.8538191996406e-05, "loss": 0.915, "step": 1433 }, { "epoch": 0.2, "learning_rate": 1.8535849133512657e-05, "loss": 0.907, "step": 1434 }, { "epoch": 0.2, "learning_rate": 1.853350454294297e-05, "loss": 0.8411, "step": 1435 }, { "epoch": 0.2, "learning_rate": 1.85311582251715e-05, "loss": 0.9121, "step": 1436 }, { "epoch": 0.2, "learning_rate": 1.852881018067315e-05, "loss": 0.7778, "step": 1437 }, { "epoch": 0.2, "learning_rate": 1.852646040992316e-05, "loss": 0.9155, "step": 1438 }, { "epoch": 0.2, "learning_rate": 1.8524108913397138e-05, "loss": 0.9197, "step": 1439 }, { "epoch": 0.2, "learning_rate": 1.8521755691571027e-05, "loss": 0.8755, "step": 1440 }, { "epoch": 0.2, "learning_rate": 1.851940074492113e-05, "loss": 0.8547, "step": 1441 }, { "epoch": 0.2, "learning_rate": 1.8517044073924092e-05, "loss": 0.8879, "step": 1442 }, { "epoch": 0.2, "learning_rate": 1.8514685679056908e-05, "loss": 0.6145, "step": 1443 }, { "epoch": 0.2, "learning_rate": 1.851232556079692e-05, "loss": 0.9341, "step": 1444 }, { "epoch": 0.2, "learning_rate": 1.8509963719621824e-05, "loss": 0.9177, "step": 1445 }, { "epoch": 0.2, "learning_rate": 1.8507600156009668e-05, "loss": 0.9155, "step": 1446 }, { "epoch": 0.2, "learning_rate": 1.850523487043883e-05, "loss": 0.8383, "step": 1447 }, { "epoch": 0.2, "learning_rate": 1.8502867863388064e-05, "loss": 0.9006, "step": 1448 }, { "epoch": 0.2, "learning_rate": 1.850049913533645e-05, "loss": 0.8386, "step": 1449 }, { "epoch": 0.2, "learning_rate": 1.849812868676342e-05, "loss": 0.8945, "step": 1450 }, { "epoch": 0.2, "learning_rate": 1.8495756518148766e-05, "loss": 0.6364, "step": 1451 }, { "epoch": 0.2, "learning_rate": 1.849338262997262e-05, "loss": 0.8994, "step": 1452 }, { "epoch": 0.2, "learning_rate": 1.849100702271546e-05, "loss": 0.8564, "step": 1453 }, { "epoch": 0.2, "learning_rate": 1.8488629696858116e-05, "loss": 0.9675, "step": 1454 }, { "epoch": 0.2, "learning_rate": 1.8486250652881763e-05, "loss": 0.8906, "step": 1455 }, { "epoch": 0.2, "learning_rate": 1.8483869891267928e-05, "loss": 0.9001, "step": 1456 }, { "epoch": 0.2, "learning_rate": 1.848148741249848e-05, "loss": 0.9277, "step": 1457 }, { "epoch": 0.2, "learning_rate": 1.8479103217055637e-05, "loss": 0.9092, "step": 1458 }, { "epoch": 0.2, "learning_rate": 1.8476717305421973e-05, "loss": 0.9065, "step": 1459 }, { "epoch": 0.2, "learning_rate": 1.8474329678080398e-05, "loss": 0.8491, "step": 1460 }, { "epoch": 0.2, "learning_rate": 1.847194033551417e-05, "loss": 0.918, "step": 1461 }, { "epoch": 0.2, "learning_rate": 1.8469549278206898e-05, "loss": 0.6068, "step": 1462 }, { "epoch": 0.2, "learning_rate": 1.8467156506642547e-05, "loss": 0.8511, "step": 1463 }, { "epoch": 0.2, "learning_rate": 1.846476202130541e-05, "loss": 0.958, "step": 1464 }, { "epoch": 0.2, "learning_rate": 1.8462365822680142e-05, "loss": 0.9077, "step": 1465 }, { "epoch": 0.2, "learning_rate": 1.8459967911251735e-05, "loss": 0.9319, "step": 1466 }, { "epoch": 0.2, "learning_rate": 1.8457568287505534e-05, "loss": 0.8281, "step": 1467 }, { "epoch": 0.2, "learning_rate": 1.845516695192723e-05, "loss": 0.6132, "step": 1468 }, { "epoch": 0.2, "learning_rate": 1.845276390500286e-05, "loss": 0.9299, "step": 1469 }, { "epoch": 0.2, "learning_rate": 1.84503591472188e-05, "loss": 0.6576, "step": 1470 }, { "epoch": 0.2, "learning_rate": 1.8447952679061783e-05, "loss": 0.865, "step": 1471 }, { "epoch": 0.2, "learning_rate": 1.8445544501018886e-05, "loss": 0.9116, "step": 1472 }, { "epoch": 0.2, "learning_rate": 1.8443134613577527e-05, "loss": 0.6255, "step": 1473 }, { "epoch": 0.2, "learning_rate": 1.8440723017225476e-05, "loss": 0.8335, "step": 1474 }, { "epoch": 0.2, "learning_rate": 1.843830971245084e-05, "loss": 0.9121, "step": 1475 }, { "epoch": 0.21, "learning_rate": 1.8435894699742088e-05, "loss": 0.9497, "step": 1476 }, { "epoch": 0.21, "learning_rate": 1.8433477979588012e-05, "loss": 0.9434, "step": 1477 }, { "epoch": 0.21, "learning_rate": 1.843105955247777e-05, "loss": 0.9321, "step": 1478 }, { "epoch": 0.21, "learning_rate": 1.8428639418900854e-05, "loss": 0.854, "step": 1479 }, { "epoch": 0.21, "learning_rate": 1.842621757934711e-05, "loss": 0.9402, "step": 1480 }, { "epoch": 0.21, "learning_rate": 1.8423794034306716e-05, "loss": 0.9045, "step": 1481 }, { "epoch": 0.21, "learning_rate": 1.842136878427021e-05, "loss": 0.6524, "step": 1482 }, { "epoch": 0.21, "learning_rate": 1.8418941829728467e-05, "loss": 0.8779, "step": 1483 }, { "epoch": 0.21, "learning_rate": 1.8416513171172705e-05, "loss": 0.9321, "step": 1484 }, { "epoch": 0.21, "learning_rate": 1.8414082809094495e-05, "loss": 0.8906, "step": 1485 }, { "epoch": 0.21, "learning_rate": 1.8411650743985743e-05, "loss": 0.9358, "step": 1486 }, { "epoch": 0.21, "learning_rate": 1.840921697633871e-05, "loss": 0.9226, "step": 1487 }, { "epoch": 0.21, "learning_rate": 1.8406781506645994e-05, "loss": 0.8967, "step": 1488 }, { "epoch": 0.21, "learning_rate": 1.840434433540054e-05, "loss": 0.8679, "step": 1489 }, { "epoch": 0.21, "learning_rate": 1.8401905463095638e-05, "loss": 0.6591, "step": 1490 }, { "epoch": 0.21, "learning_rate": 1.839946489022492e-05, "loss": 0.9204, "step": 1491 }, { "epoch": 0.21, "learning_rate": 1.8397022617282362e-05, "loss": 0.8813, "step": 1492 }, { "epoch": 0.21, "learning_rate": 1.8394578644762294e-05, "loss": 0.9343, "step": 1493 }, { "epoch": 0.21, "learning_rate": 1.8392132973159372e-05, "loss": 0.9272, "step": 1494 }, { "epoch": 0.21, "learning_rate": 1.8389685602968613e-05, "loss": 0.9058, "step": 1495 }, { "epoch": 0.21, "learning_rate": 1.8387236534685368e-05, "loss": 0.6442, "step": 1496 }, { "epoch": 0.21, "learning_rate": 1.838478576880533e-05, "loss": 0.929, "step": 1497 }, { "epoch": 0.21, "learning_rate": 1.8382333305824548e-05, "loss": 0.6129, "step": 1498 }, { "epoch": 0.21, "learning_rate": 1.8379879146239404e-05, "loss": 0.8735, "step": 1499 }, { "epoch": 0.21, "learning_rate": 1.837742329054662e-05, "loss": 0.8569, "step": 1500 }, { "epoch": 0.21, "learning_rate": 1.8374965739243275e-05, "loss": 0.8953, "step": 1501 }, { "epoch": 0.21, "learning_rate": 1.8372506492826778e-05, "loss": 0.8938, "step": 1502 }, { "epoch": 0.21, "learning_rate": 1.837004555179489e-05, "loss": 0.9448, "step": 1503 }, { "epoch": 0.21, "learning_rate": 1.8367582916645704e-05, "loss": 0.9478, "step": 1504 }, { "epoch": 0.21, "learning_rate": 1.8365118587877675e-05, "loss": 0.8566, "step": 1505 }, { "epoch": 0.21, "learning_rate": 1.836265256598958e-05, "loss": 0.9592, "step": 1506 }, { "epoch": 0.21, "learning_rate": 1.8360184851480548e-05, "loss": 0.8752, "step": 1507 }, { "epoch": 0.21, "learning_rate": 1.835771544485006e-05, "loss": 0.8298, "step": 1508 }, { "epoch": 0.21, "learning_rate": 1.8355244346597914e-05, "loss": 0.624, "step": 1509 }, { "epoch": 0.21, "learning_rate": 1.835277155722428e-05, "loss": 0.8955, "step": 1510 }, { "epoch": 0.21, "learning_rate": 1.835029707722965e-05, "loss": 0.8816, "step": 1511 }, { "epoch": 0.21, "learning_rate": 1.8347820907114867e-05, "loss": 0.9292, "step": 1512 }, { "epoch": 0.21, "learning_rate": 1.834534304738111e-05, "loss": 0.9448, "step": 1513 }, { "epoch": 0.21, "learning_rate": 1.8342863498529907e-05, "loss": 0.6082, "step": 1514 }, { "epoch": 0.21, "learning_rate": 1.834038226106313e-05, "loss": 0.8452, "step": 1515 }, { "epoch": 0.21, "learning_rate": 1.8337899335482974e-05, "loss": 0.905, "step": 1516 }, { "epoch": 0.21, "learning_rate": 1.8335414722292003e-05, "loss": 0.9028, "step": 1517 }, { "epoch": 0.21, "learning_rate": 1.8332928421993097e-05, "loss": 0.5543, "step": 1518 }, { "epoch": 0.21, "learning_rate": 1.8330440435089498e-05, "loss": 0.927, "step": 1519 }, { "epoch": 0.21, "learning_rate": 1.8327950762084773e-05, "loss": 0.9458, "step": 1520 }, { "epoch": 0.21, "learning_rate": 1.8325459403482844e-05, "loss": 0.9221, "step": 1521 }, { "epoch": 0.21, "learning_rate": 1.832296635978797e-05, "loss": 0.957, "step": 1522 }, { "epoch": 0.21, "learning_rate": 1.832047163150474e-05, "loss": 0.8977, "step": 1523 }, { "epoch": 0.21, "learning_rate": 1.8317975219138094e-05, "loss": 0.8794, "step": 1524 }, { "epoch": 0.21, "learning_rate": 1.831547712319332e-05, "loss": 0.9338, "step": 1525 }, { "epoch": 0.21, "learning_rate": 1.831297734417604e-05, "loss": 0.5948, "step": 1526 }, { "epoch": 0.21, "learning_rate": 1.83104758825922e-05, "loss": 0.9231, "step": 1527 }, { "epoch": 0.21, "learning_rate": 1.8307972738948116e-05, "loss": 0.864, "step": 1528 }, { "epoch": 0.21, "learning_rate": 1.8305467913750425e-05, "loss": 0.9587, "step": 1529 }, { "epoch": 0.21, "learning_rate": 1.8302961407506112e-05, "loss": 0.9558, "step": 1530 }, { "epoch": 0.21, "learning_rate": 1.8300453220722495e-05, "loss": 0.9304, "step": 1531 }, { "epoch": 0.21, "learning_rate": 1.829794335390724e-05, "loss": 0.9387, "step": 1532 }, { "epoch": 0.21, "learning_rate": 1.829543180756835e-05, "loss": 0.8896, "step": 1533 }, { "epoch": 0.21, "learning_rate": 1.8292918582214173e-05, "loss": 0.8931, "step": 1534 }, { "epoch": 0.21, "learning_rate": 1.829040367835338e-05, "loss": 0.9285, "step": 1535 }, { "epoch": 0.21, "learning_rate": 1.8287887096495006e-05, "loss": 0.8774, "step": 1536 }, { "epoch": 0.21, "learning_rate": 1.8285368837148403e-05, "loss": 0.8828, "step": 1537 }, { "epoch": 0.21, "learning_rate": 1.8282848900823282e-05, "loss": 0.9299, "step": 1538 }, { "epoch": 0.21, "learning_rate": 1.8280327288029677e-05, "loss": 0.5867, "step": 1539 }, { "epoch": 0.21, "learning_rate": 1.8277803999277973e-05, "loss": 0.9221, "step": 1540 }, { "epoch": 0.21, "learning_rate": 1.8275279035078887e-05, "loss": 0.8225, "step": 1541 }, { "epoch": 0.21, "learning_rate": 1.827275239594348e-05, "loss": 0.6019, "step": 1542 }, { "epoch": 0.21, "learning_rate": 1.8270224082383145e-05, "loss": 0.9424, "step": 1543 }, { "epoch": 0.21, "learning_rate": 1.8267694094909627e-05, "loss": 0.8101, "step": 1544 }, { "epoch": 0.21, "learning_rate": 1.8265162434034992e-05, "loss": 0.8503, "step": 1545 }, { "epoch": 0.21, "learning_rate": 1.826262910027166e-05, "loss": 0.842, "step": 1546 }, { "epoch": 0.21, "learning_rate": 1.8260094094132386e-05, "loss": 0.9187, "step": 1547 }, { "epoch": 0.22, "learning_rate": 1.8257557416130253e-05, "loss": 0.6396, "step": 1548 }, { "epoch": 0.22, "learning_rate": 1.8255019066778698e-05, "loss": 0.8762, "step": 1549 }, { "epoch": 0.22, "learning_rate": 1.8252479046591492e-05, "loss": 0.915, "step": 1550 }, { "epoch": 0.22, "learning_rate": 1.824993735608273e-05, "loss": 0.9082, "step": 1551 }, { "epoch": 0.22, "learning_rate": 1.8247393995766862e-05, "loss": 0.8782, "step": 1552 }, { "epoch": 0.22, "learning_rate": 1.8244848966158675e-05, "loss": 0.9214, "step": 1553 }, { "epoch": 0.22, "learning_rate": 1.8242302267773283e-05, "loss": 0.9495, "step": 1554 }, { "epoch": 0.22, "learning_rate": 1.8239753901126144e-05, "loss": 0.9075, "step": 1555 }, { "epoch": 0.22, "learning_rate": 1.8237203866733054e-05, "loss": 0.865, "step": 1556 }, { "epoch": 0.22, "learning_rate": 1.8234652165110146e-05, "loss": 0.8728, "step": 1557 }, { "epoch": 0.22, "learning_rate": 1.8232098796773897e-05, "loss": 0.668, "step": 1558 }, { "epoch": 0.22, "learning_rate": 1.8229543762241104e-05, "loss": 0.9023, "step": 1559 }, { "epoch": 0.22, "learning_rate": 1.822698706202892e-05, "loss": 0.9465, "step": 1560 }, { "epoch": 0.22, "learning_rate": 1.8224428696654825e-05, "loss": 0.8894, "step": 1561 }, { "epoch": 0.22, "learning_rate": 1.8221868666636635e-05, "loss": 0.9114, "step": 1562 }, { "epoch": 0.22, "learning_rate": 1.8219306972492513e-05, "loss": 0.5782, "step": 1563 }, { "epoch": 0.22, "learning_rate": 1.8216743614740947e-05, "loss": 0.8906, "step": 1564 }, { "epoch": 0.22, "learning_rate": 1.821417859390077e-05, "loss": 0.8794, "step": 1565 }, { "epoch": 0.22, "learning_rate": 1.8211611910491145e-05, "loss": 0.9111, "step": 1566 }, { "epoch": 0.22, "learning_rate": 1.8209043565031575e-05, "loss": 0.7937, "step": 1567 }, { "epoch": 0.22, "learning_rate": 1.8206473558041903e-05, "loss": 0.9729, "step": 1568 }, { "epoch": 0.22, "learning_rate": 1.82039018900423e-05, "loss": 0.9089, "step": 1569 }, { "epoch": 0.22, "learning_rate": 1.820132856155328e-05, "loss": 0.8867, "step": 1570 }, { "epoch": 0.22, "learning_rate": 1.8198753573095693e-05, "loss": 0.8994, "step": 1571 }, { "epoch": 0.22, "learning_rate": 1.8196176925190722e-05, "loss": 0.9238, "step": 1572 }, { "epoch": 0.22, "learning_rate": 1.819359861835988e-05, "loss": 0.6371, "step": 1573 }, { "epoch": 0.22, "learning_rate": 1.819101865312503e-05, "loss": 0.8914, "step": 1574 }, { "epoch": 0.22, "learning_rate": 1.8188437030008363e-05, "loss": 0.9116, "step": 1575 }, { "epoch": 0.22, "learning_rate": 1.8185853749532404e-05, "loss": 0.8625, "step": 1576 }, { "epoch": 0.22, "learning_rate": 1.8183268812220013e-05, "loss": 0.6238, "step": 1577 }, { "epoch": 0.22, "learning_rate": 1.8180682218594387e-05, "loss": 0.8577, "step": 1578 }, { "epoch": 0.22, "learning_rate": 1.8178093969179068e-05, "loss": 0.9861, "step": 1579 }, { "epoch": 0.22, "learning_rate": 1.817550406449791e-05, "loss": 0.9043, "step": 1580 }, { "epoch": 0.22, "learning_rate": 1.8172912505075128e-05, "loss": 0.9302, "step": 1581 }, { "epoch": 0.22, "learning_rate": 1.817031929143525e-05, "loss": 0.8518, "step": 1582 }, { "epoch": 0.22, "learning_rate": 1.816772442410316e-05, "loss": 0.96, "step": 1583 }, { "epoch": 0.22, "learning_rate": 1.8165127903604052e-05, "loss": 0.9478, "step": 1584 }, { "epoch": 0.22, "learning_rate": 1.8162529730463477e-05, "loss": 0.9954, "step": 1585 }, { "epoch": 0.22, "learning_rate": 1.815992990520731e-05, "loss": 0.8552, "step": 1586 }, { "epoch": 0.22, "learning_rate": 1.8157328428361763e-05, "loss": 0.9004, "step": 1587 }, { "epoch": 0.22, "learning_rate": 1.8154725300453377e-05, "loss": 0.8667, "step": 1588 }, { "epoch": 0.22, "learning_rate": 1.8152120522009034e-05, "loss": 0.8635, "step": 1589 }, { "epoch": 0.22, "learning_rate": 1.814951409355595e-05, "loss": 0.8589, "step": 1590 }, { "epoch": 0.22, "learning_rate": 1.8146906015621666e-05, "loss": 0.916, "step": 1591 }, { "epoch": 0.22, "learning_rate": 1.8144296288734068e-05, "loss": 0.8987, "step": 1592 }, { "epoch": 0.22, "learning_rate": 1.814168491342137e-05, "loss": 0.8425, "step": 1593 }, { "epoch": 0.22, "learning_rate": 1.8139071890212117e-05, "loss": 0.8696, "step": 1594 }, { "epoch": 0.22, "learning_rate": 1.8136457219635197e-05, "loss": 0.8577, "step": 1595 }, { "epoch": 0.22, "learning_rate": 1.8133840902219822e-05, "loss": 0.9116, "step": 1596 }, { "epoch": 0.22, "learning_rate": 1.8131222938495545e-05, "loss": 0.8763, "step": 1597 }, { "epoch": 0.22, "learning_rate": 1.812860332899224e-05, "loss": 0.6262, "step": 1598 }, { "epoch": 0.22, "learning_rate": 1.812598207424013e-05, "loss": 0.9346, "step": 1599 }, { "epoch": 0.22, "learning_rate": 1.8123359174769763e-05, "loss": 0.8096, "step": 1600 }, { "epoch": 0.22, "learning_rate": 1.8120734631112015e-05, "loss": 0.6482, "step": 1601 }, { "epoch": 0.22, "learning_rate": 1.8118108443798102e-05, "loss": 0.9087, "step": 1602 }, { "epoch": 0.22, "learning_rate": 1.8115480613359574e-05, "loss": 0.8923, "step": 1603 }, { "epoch": 0.22, "learning_rate": 1.8112851140328304e-05, "loss": 0.8889, "step": 1604 }, { "epoch": 0.22, "learning_rate": 1.811022002523651e-05, "loss": 0.886, "step": 1605 }, { "epoch": 0.22, "learning_rate": 1.810758726861673e-05, "loss": 0.8987, "step": 1606 }, { "epoch": 0.22, "learning_rate": 1.8104952871001847e-05, "loss": 0.8833, "step": 1607 }, { "epoch": 0.22, "learning_rate": 1.8102316832925063e-05, "loss": 0.9053, "step": 1608 }, { "epoch": 0.22, "learning_rate": 1.8099679154919922e-05, "loss": 0.9014, "step": 1609 }, { "epoch": 0.22, "learning_rate": 1.8097039837520296e-05, "loss": 0.894, "step": 1610 }, { "epoch": 0.22, "learning_rate": 1.809439888126039e-05, "loss": 0.9282, "step": 1611 }, { "epoch": 0.22, "learning_rate": 1.8091756286674735e-05, "loss": 0.9333, "step": 1612 }, { "epoch": 0.22, "learning_rate": 1.8089112054298202e-05, "loss": 0.8899, "step": 1613 }, { "epoch": 0.22, "learning_rate": 1.8086466184665994e-05, "loss": 0.8396, "step": 1614 }, { "epoch": 0.22, "learning_rate": 1.8083818678313634e-05, "loss": 0.8701, "step": 1615 }, { "epoch": 0.22, "learning_rate": 1.8081169535776987e-05, "loss": 0.8264, "step": 1616 }, { "epoch": 0.22, "learning_rate": 1.8078518757592247e-05, "loss": 0.9438, "step": 1617 }, { "epoch": 0.22, "learning_rate": 1.807586634429594e-05, "loss": 0.9453, "step": 1618 }, { "epoch": 0.22, "learning_rate": 1.8073212296424914e-05, "loss": 0.9294, "step": 1619 }, { "epoch": 0.23, "learning_rate": 1.8070556614516358e-05, "loss": 0.6453, "step": 1620 }, { "epoch": 0.23, "learning_rate": 1.806789929910779e-05, "loss": 0.9722, "step": 1621 }, { "epoch": 0.23, "learning_rate": 1.8065240350737052e-05, "loss": 0.8508, "step": 1622 }, { "epoch": 0.23, "learning_rate": 1.806257976994233e-05, "loss": 0.8457, "step": 1623 }, { "epoch": 0.23, "learning_rate": 1.805991755726212e-05, "loss": 0.9297, "step": 1624 }, { "epoch": 0.23, "learning_rate": 1.8057253713235273e-05, "loss": 0.8342, "step": 1625 }, { "epoch": 0.23, "learning_rate": 1.8054588238400952e-05, "loss": 0.9014, "step": 1626 }, { "epoch": 0.23, "learning_rate": 1.8051921133298652e-05, "loss": 0.9197, "step": 1627 }, { "epoch": 0.23, "learning_rate": 1.8049252398468207e-05, "loss": 0.8889, "step": 1628 }, { "epoch": 0.23, "learning_rate": 1.8046582034449774e-05, "loss": 0.928, "step": 1629 }, { "epoch": 0.23, "learning_rate": 1.8043910041783836e-05, "loss": 0.906, "step": 1630 }, { "epoch": 0.23, "learning_rate": 1.8041236421011216e-05, "loss": 0.9094, "step": 1631 }, { "epoch": 0.23, "learning_rate": 1.803856117267306e-05, "loss": 0.8408, "step": 1632 }, { "epoch": 0.23, "learning_rate": 1.8035884297310846e-05, "loss": 0.9736, "step": 1633 }, { "epoch": 0.23, "learning_rate": 1.803320579546638e-05, "loss": 0.8658, "step": 1634 }, { "epoch": 0.23, "learning_rate": 1.8030525667681793e-05, "loss": 0.8091, "step": 1635 }, { "epoch": 0.23, "learning_rate": 1.8027843914499553e-05, "loss": 0.8137, "step": 1636 }, { "epoch": 0.23, "learning_rate": 1.8025160536462454e-05, "loss": 0.9404, "step": 1637 }, { "epoch": 0.23, "learning_rate": 1.8022475534113614e-05, "loss": 0.96, "step": 1638 }, { "epoch": 0.23, "learning_rate": 1.801978890799649e-05, "loss": 0.9089, "step": 1639 }, { "epoch": 0.23, "learning_rate": 1.8017100658654857e-05, "loss": 0.8782, "step": 1640 }, { "epoch": 0.23, "learning_rate": 1.8014410786632822e-05, "loss": 0.9114, "step": 1641 }, { "epoch": 0.23, "learning_rate": 1.8011719292474823e-05, "loss": 0.9058, "step": 1642 }, { "epoch": 0.23, "learning_rate": 1.800902617672563e-05, "loss": 0.9124, "step": 1643 }, { "epoch": 0.23, "learning_rate": 1.8006331439930328e-05, "loss": 0.9375, "step": 1644 }, { "epoch": 0.23, "learning_rate": 1.800363508263434e-05, "loss": 0.9302, "step": 1645 }, { "epoch": 0.23, "learning_rate": 1.800093710538342e-05, "loss": 0.8745, "step": 1646 }, { "epoch": 0.23, "learning_rate": 1.7998237508723642e-05, "loss": 0.8789, "step": 1647 }, { "epoch": 0.23, "learning_rate": 1.7995536293201413e-05, "loss": 0.8987, "step": 1648 }, { "epoch": 0.23, "learning_rate": 1.7992833459363462e-05, "loss": 0.9395, "step": 1649 }, { "epoch": 0.23, "learning_rate": 1.799012900775685e-05, "loss": 0.6224, "step": 1650 }, { "epoch": 0.23, "learning_rate": 1.7987422938928968e-05, "loss": 0.9155, "step": 1651 }, { "epoch": 0.23, "learning_rate": 1.7984715253427523e-05, "loss": 0.9148, "step": 1652 }, { "epoch": 0.23, "learning_rate": 1.7982005951800564e-05, "loss": 0.8865, "step": 1653 }, { "epoch": 0.23, "learning_rate": 1.7979295034596456e-05, "loss": 0.8591, "step": 1654 }, { "epoch": 0.23, "learning_rate": 1.79765825023639e-05, "loss": 0.8562, "step": 1655 }, { "epoch": 0.23, "learning_rate": 1.797386835565192e-05, "loss": 0.8694, "step": 1656 }, { "epoch": 0.23, "learning_rate": 1.7971152595009854e-05, "loss": 0.8679, "step": 1657 }, { "epoch": 0.23, "learning_rate": 1.796843522098739e-05, "loss": 0.8645, "step": 1658 }, { "epoch": 0.23, "learning_rate": 1.7965716234134527e-05, "loss": 0.9382, "step": 1659 }, { "epoch": 0.23, "learning_rate": 1.7962995635001593e-05, "loss": 0.8623, "step": 1660 }, { "epoch": 0.23, "learning_rate": 1.796027342413925e-05, "loss": 0.9424, "step": 1661 }, { "epoch": 0.23, "learning_rate": 1.7957549602098472e-05, "loss": 0.8604, "step": 1662 }, { "epoch": 0.23, "learning_rate": 1.7954824169430573e-05, "loss": 0.916, "step": 1663 }, { "epoch": 0.23, "learning_rate": 1.7952097126687186e-05, "loss": 0.9124, "step": 1664 }, { "epoch": 0.23, "learning_rate": 1.7949368474420267e-05, "loss": 0.8596, "step": 1665 }, { "epoch": 0.23, "learning_rate": 1.794663821318211e-05, "loss": 0.8774, "step": 1666 }, { "epoch": 0.23, "learning_rate": 1.7943906343525314e-05, "loss": 0.9099, "step": 1667 }, { "epoch": 0.23, "learning_rate": 1.7941172866002826e-05, "loss": 0.875, "step": 1668 }, { "epoch": 0.23, "learning_rate": 1.793843778116791e-05, "loss": 0.9109, "step": 1669 }, { "epoch": 0.23, "learning_rate": 1.7935701089574142e-05, "loss": 0.8682, "step": 1670 }, { "epoch": 0.23, "learning_rate": 1.7932962791775447e-05, "loss": 0.6907, "step": 1671 }, { "epoch": 0.23, "learning_rate": 1.7930222888326058e-05, "loss": 0.8225, "step": 1672 }, { "epoch": 0.23, "learning_rate": 1.7927481379780536e-05, "loss": 0.8975, "step": 1673 }, { "epoch": 0.23, "learning_rate": 1.7924738266693774e-05, "loss": 0.8884, "step": 1674 }, { "epoch": 0.23, "learning_rate": 1.7921993549620977e-05, "loss": 0.8718, "step": 1675 }, { "epoch": 0.23, "learning_rate": 1.791924722911769e-05, "loss": 0.8577, "step": 1676 }, { "epoch": 0.23, "learning_rate": 1.7916499305739772e-05, "loss": 0.9524, "step": 1677 }, { "epoch": 0.23, "learning_rate": 1.791374978004341e-05, "loss": 0.5669, "step": 1678 }, { "epoch": 0.23, "learning_rate": 1.7910998652585112e-05, "loss": 0.9148, "step": 1679 }, { "epoch": 0.23, "learning_rate": 1.7908245923921718e-05, "loss": 0.5535, "step": 1680 }, { "epoch": 0.23, "learning_rate": 1.7905491594610382e-05, "loss": 0.9043, "step": 1681 }, { "epoch": 0.23, "learning_rate": 1.7902735665208587e-05, "loss": 0.8994, "step": 1682 }, { "epoch": 0.23, "learning_rate": 1.789997813627414e-05, "loss": 0.9075, "step": 1683 }, { "epoch": 0.23, "learning_rate": 1.7897219008365176e-05, "loss": 0.8999, "step": 1684 }, { "epoch": 0.23, "learning_rate": 1.7894458282040146e-05, "loss": 0.8425, "step": 1685 }, { "epoch": 0.23, "learning_rate": 1.7891695957857823e-05, "loss": 0.8745, "step": 1686 }, { "epoch": 0.23, "learning_rate": 1.7888932036377316e-05, "loss": 0.8914, "step": 1687 }, { "epoch": 0.23, "learning_rate": 1.7886166518158045e-05, "loss": 0.8472, "step": 1688 }, { "epoch": 0.23, "learning_rate": 1.7883399403759758e-05, "loss": 0.8135, "step": 1689 }, { "epoch": 0.23, "learning_rate": 1.7880630693742523e-05, "loss": 0.8906, "step": 1690 }, { "epoch": 0.23, "learning_rate": 1.787786038866674e-05, "loss": 0.8977, "step": 1691 }, { "epoch": 0.24, "learning_rate": 1.7875088489093122e-05, "loss": 0.9045, "step": 1692 }, { "epoch": 0.24, "learning_rate": 1.7872314995582706e-05, "loss": 0.9087, "step": 1693 }, { "epoch": 0.24, "learning_rate": 1.7869539908696857e-05, "loss": 0.8796, "step": 1694 }, { "epoch": 0.24, "learning_rate": 1.7866763228997257e-05, "loss": 0.5994, "step": 1695 }, { "epoch": 0.24, "learning_rate": 1.7863984957045915e-05, "loss": 0.8389, "step": 1696 }, { "epoch": 0.24, "learning_rate": 1.7861205093405157e-05, "loss": 0.9001, "step": 1697 }, { "epoch": 0.24, "learning_rate": 1.7858423638637636e-05, "loss": 0.8638, "step": 1698 }, { "epoch": 0.24, "learning_rate": 1.7855640593306323e-05, "loss": 0.9067, "step": 1699 }, { "epoch": 0.24, "learning_rate": 1.7852855957974517e-05, "loss": 0.8958, "step": 1700 }, { "epoch": 0.24, "learning_rate": 1.785006973320583e-05, "loss": 0.8677, "step": 1701 }, { "epoch": 0.24, "learning_rate": 1.7847281919564205e-05, "loss": 0.8555, "step": 1702 }, { "epoch": 0.24, "learning_rate": 1.7844492517613902e-05, "loss": 0.8196, "step": 1703 }, { "epoch": 0.24, "learning_rate": 1.7841701527919497e-05, "loss": 0.9551, "step": 1704 }, { "epoch": 0.24, "learning_rate": 1.7838908951045898e-05, "loss": 0.9248, "step": 1705 }, { "epoch": 0.24, "learning_rate": 1.783611478755833e-05, "loss": 0.9473, "step": 1706 }, { "epoch": 0.24, "learning_rate": 1.7833319038022333e-05, "loss": 0.8462, "step": 1707 }, { "epoch": 0.24, "learning_rate": 1.783052170300378e-05, "loss": 0.9292, "step": 1708 }, { "epoch": 0.24, "learning_rate": 1.7827722783068853e-05, "loss": 0.9084, "step": 1709 }, { "epoch": 0.24, "learning_rate": 1.7824922278784065e-05, "loss": 0.8408, "step": 1710 }, { "epoch": 0.24, "learning_rate": 1.7822120190716242e-05, "loss": 0.8733, "step": 1711 }, { "epoch": 0.24, "learning_rate": 1.781931651943253e-05, "loss": 0.8809, "step": 1712 }, { "epoch": 0.24, "learning_rate": 1.7816511265500405e-05, "loss": 0.6726, "step": 1713 }, { "epoch": 0.24, "learning_rate": 1.7813704429487656e-05, "loss": 0.9187, "step": 1714 }, { "epoch": 0.24, "learning_rate": 1.7810896011962387e-05, "loss": 0.7107, "step": 1715 }, { "epoch": 0.24, "learning_rate": 1.7808086013493036e-05, "loss": 0.9133, "step": 1716 }, { "epoch": 0.24, "learning_rate": 1.7805274434648353e-05, "loss": 0.9109, "step": 1717 }, { "epoch": 0.24, "learning_rate": 1.7802461275997403e-05, "loss": 0.8794, "step": 1718 }, { "epoch": 0.24, "learning_rate": 1.779964653810958e-05, "loss": 0.9438, "step": 1719 }, { "epoch": 0.24, "learning_rate": 1.7796830221554594e-05, "loss": 0.925, "step": 1720 }, { "epoch": 0.24, "learning_rate": 1.779401232690247e-05, "loss": 0.8896, "step": 1721 }, { "epoch": 0.24, "learning_rate": 1.779119285472356e-05, "loss": 0.8745, "step": 1722 }, { "epoch": 0.24, "learning_rate": 1.778837180558853e-05, "loss": 0.8477, "step": 1723 }, { "epoch": 0.24, "learning_rate": 1.7785549180068375e-05, "loss": 0.9282, "step": 1724 }, { "epoch": 0.24, "learning_rate": 1.7782724978734388e-05, "loss": 0.9248, "step": 1725 }, { "epoch": 0.24, "learning_rate": 1.7779899202158206e-05, "loss": 0.8818, "step": 1726 }, { "epoch": 0.24, "learning_rate": 1.7777071850911762e-05, "loss": 0.8625, "step": 1727 }, { "epoch": 0.24, "learning_rate": 1.777424292556733e-05, "loss": 0.8904, "step": 1728 }, { "epoch": 0.24, "learning_rate": 1.7771412426697482e-05, "loss": 0.8672, "step": 1729 }, { "epoch": 0.24, "learning_rate": 1.7768580354875126e-05, "loss": 0.8528, "step": 1730 }, { "epoch": 0.24, "learning_rate": 1.776574671067347e-05, "loss": 0.8928, "step": 1731 }, { "epoch": 0.24, "learning_rate": 1.776291149466606e-05, "loss": 0.8921, "step": 1732 }, { "epoch": 0.24, "learning_rate": 1.7760074707426747e-05, "loss": 0.9355, "step": 1733 }, { "epoch": 0.24, "learning_rate": 1.77572363495297e-05, "loss": 0.9236, "step": 1734 }, { "epoch": 0.24, "learning_rate": 1.7754396421549412e-05, "loss": 0.9626, "step": 1735 }, { "epoch": 0.24, "learning_rate": 1.7751554924060696e-05, "loss": 0.9048, "step": 1736 }, { "epoch": 0.24, "learning_rate": 1.7748711857638672e-05, "loss": 0.9172, "step": 1737 }, { "epoch": 0.24, "learning_rate": 1.7745867222858785e-05, "loss": 0.8896, "step": 1738 }, { "epoch": 0.24, "learning_rate": 1.7743021020296797e-05, "loss": 0.9626, "step": 1739 }, { "epoch": 0.24, "learning_rate": 1.7740173250528784e-05, "loss": 0.9307, "step": 1740 }, { "epoch": 0.24, "learning_rate": 1.773732391413114e-05, "loss": 0.925, "step": 1741 }, { "epoch": 0.24, "learning_rate": 1.7734473011680585e-05, "loss": 0.8977, "step": 1742 }, { "epoch": 0.24, "learning_rate": 1.773162054375414e-05, "loss": 0.8579, "step": 1743 }, { "epoch": 0.24, "learning_rate": 1.7728766510929158e-05, "loss": 0.8418, "step": 1744 }, { "epoch": 0.24, "learning_rate": 1.7725910913783297e-05, "loss": 0.9011, "step": 1745 }, { "epoch": 0.24, "learning_rate": 1.772305375289454e-05, "loss": 0.8931, "step": 1746 }, { "epoch": 0.24, "learning_rate": 1.7720195028841184e-05, "loss": 0.9023, "step": 1747 }, { "epoch": 0.24, "learning_rate": 1.7717334742201836e-05, "loss": 0.8848, "step": 1748 }, { "epoch": 0.24, "learning_rate": 1.7714472893555434e-05, "loss": 0.9016, "step": 1749 }, { "epoch": 0.24, "learning_rate": 1.7711609483481212e-05, "loss": 0.8894, "step": 1750 }, { "epoch": 0.24, "learning_rate": 1.7708744512558738e-05, "loss": 0.8921, "step": 1751 }, { "epoch": 0.24, "learning_rate": 1.7705877981367887e-05, "loss": 0.8892, "step": 1752 }, { "epoch": 0.24, "learning_rate": 1.7703009890488852e-05, "loss": 0.8687, "step": 1753 }, { "epoch": 0.24, "learning_rate": 1.7700140240502147e-05, "loss": 0.885, "step": 1754 }, { "epoch": 0.24, "learning_rate": 1.7697269031988588e-05, "loss": 0.9155, "step": 1755 }, { "epoch": 0.24, "learning_rate": 1.769439626552932e-05, "loss": 0.8962, "step": 1756 }, { "epoch": 0.24, "learning_rate": 1.769152194170579e-05, "loss": 0.9346, "step": 1757 }, { "epoch": 0.24, "learning_rate": 1.7688646061099774e-05, "loss": 0.8816, "step": 1758 }, { "epoch": 0.24, "learning_rate": 1.768576862429336e-05, "loss": 0.9106, "step": 1759 }, { "epoch": 0.24, "learning_rate": 1.768288963186894e-05, "loss": 0.875, "step": 1760 }, { "epoch": 0.24, "learning_rate": 1.7680009084409237e-05, "loss": 0.8989, "step": 1761 }, { "epoch": 0.24, "learning_rate": 1.7677126982497278e-05, "loss": 0.866, "step": 1762 }, { "epoch": 0.24, "learning_rate": 1.7674243326716402e-05, "loss": 0.3667, "step": 1763 }, { "epoch": 0.25, "learning_rate": 1.7671358117650278e-05, "loss": 0.8774, "step": 1764 }, { "epoch": 0.25, "learning_rate": 1.766847135588287e-05, "loss": 0.9058, "step": 1765 }, { "epoch": 0.25, "learning_rate": 1.766558304199847e-05, "loss": 0.9346, "step": 1766 }, { "epoch": 0.25, "learning_rate": 1.7662693176581677e-05, "loss": 0.8782, "step": 1767 }, { "epoch": 0.25, "learning_rate": 1.7659801760217413e-05, "loss": 0.9302, "step": 1768 }, { "epoch": 0.25, "learning_rate": 1.76569087934909e-05, "loss": 0.9202, "step": 1769 }, { "epoch": 0.25, "learning_rate": 1.7654014276987684e-05, "loss": 0.6621, "step": 1770 }, { "epoch": 0.25, "learning_rate": 1.7651118211293626e-05, "loss": 0.8657, "step": 1771 }, { "epoch": 0.25, "learning_rate": 1.764822059699489e-05, "loss": 0.9131, "step": 1772 }, { "epoch": 0.25, "learning_rate": 1.7645321434677965e-05, "loss": 0.9583, "step": 1773 }, { "epoch": 0.25, "learning_rate": 1.7642420724929645e-05, "loss": 0.8872, "step": 1774 }, { "epoch": 0.25, "learning_rate": 1.763951846833704e-05, "loss": 0.9822, "step": 1775 }, { "epoch": 0.25, "learning_rate": 1.7636614665487584e-05, "loss": 0.9368, "step": 1776 }, { "epoch": 0.25, "learning_rate": 1.7633709316969e-05, "loss": 0.8665, "step": 1777 }, { "epoch": 0.25, "learning_rate": 1.7630802423369343e-05, "loss": 0.9683, "step": 1778 }, { "epoch": 0.25, "learning_rate": 1.762789398527698e-05, "loss": 0.8582, "step": 1779 }, { "epoch": 0.25, "learning_rate": 1.7624984003280573e-05, "loss": 0.8945, "step": 1780 }, { "epoch": 0.25, "learning_rate": 1.7622072477969127e-05, "loss": 0.9387, "step": 1781 }, { "epoch": 0.25, "learning_rate": 1.7619159409931925e-05, "loss": 0.8912, "step": 1782 }, { "epoch": 0.25, "learning_rate": 1.761624479975859e-05, "loss": 0.8715, "step": 1783 }, { "epoch": 0.25, "learning_rate": 1.7613328648039042e-05, "loss": 0.9038, "step": 1784 }, { "epoch": 0.25, "learning_rate": 1.7610410955363515e-05, "loss": 0.9126, "step": 1785 }, { "epoch": 0.25, "learning_rate": 1.7607491722322564e-05, "loss": 0.856, "step": 1786 }, { "epoch": 0.25, "learning_rate": 1.760457094950704e-05, "loss": 0.9072, "step": 1787 }, { "epoch": 0.25, "learning_rate": 1.760164863750812e-05, "loss": 0.5761, "step": 1788 }, { "epoch": 0.25, "learning_rate": 1.7598724786917288e-05, "loss": 0.884, "step": 1789 }, { "epoch": 0.25, "learning_rate": 1.7595799398326333e-05, "loss": 0.8448, "step": 1790 }, { "epoch": 0.25, "learning_rate": 1.7592872472327363e-05, "loss": 0.9343, "step": 1791 }, { "epoch": 0.25, "learning_rate": 1.75899440095128e-05, "loss": 0.8654, "step": 1792 }, { "epoch": 0.25, "learning_rate": 1.758701401047536e-05, "loss": 0.8838, "step": 1793 }, { "epoch": 0.25, "learning_rate": 1.7584082475808094e-05, "loss": 0.8782, "step": 1794 }, { "epoch": 0.25, "learning_rate": 1.7581149406104347e-05, "loss": 0.8618, "step": 1795 }, { "epoch": 0.25, "learning_rate": 1.757821480195778e-05, "loss": 0.8582, "step": 1796 }, { "epoch": 0.25, "learning_rate": 1.7575278663962362e-05, "loss": 0.9358, "step": 1797 }, { "epoch": 0.25, "learning_rate": 1.7572340992712372e-05, "loss": 0.8774, "step": 1798 }, { "epoch": 0.25, "learning_rate": 1.7569401788802408e-05, "loss": 0.8848, "step": 1799 }, { "epoch": 0.25, "learning_rate": 1.7566461052827373e-05, "loss": 0.8472, "step": 1800 }, { "epoch": 0.25, "learning_rate": 1.756351878538247e-05, "loss": 0.8521, "step": 1801 }, { "epoch": 0.25, "learning_rate": 1.756057498706323e-05, "loss": 0.6842, "step": 1802 }, { "epoch": 0.25, "learning_rate": 1.7557629658465475e-05, "loss": 0.835, "step": 1803 }, { "epoch": 0.25, "learning_rate": 1.7554682800185358e-05, "loss": 0.8875, "step": 1804 }, { "epoch": 0.25, "learning_rate": 1.755173441281932e-05, "loss": 0.9346, "step": 1805 }, { "epoch": 0.25, "learning_rate": 1.7548784496964134e-05, "loss": 0.8555, "step": 1806 }, { "epoch": 0.25, "learning_rate": 1.7545833053216855e-05, "loss": 0.8962, "step": 1807 }, { "epoch": 0.25, "learning_rate": 1.7542880082174874e-05, "loss": 0.8252, "step": 1808 }, { "epoch": 0.25, "learning_rate": 1.7539925584435874e-05, "loss": 0.9121, "step": 1809 }, { "epoch": 0.25, "learning_rate": 1.7536969560597853e-05, "loss": 0.8953, "step": 1810 }, { "epoch": 0.25, "learning_rate": 1.753401201125912e-05, "loss": 0.5925, "step": 1811 }, { "epoch": 0.25, "learning_rate": 1.7531052937018286e-05, "loss": 0.9209, "step": 1812 }, { "epoch": 0.25, "learning_rate": 1.7528092338474275e-05, "loss": 0.8914, "step": 1813 }, { "epoch": 0.25, "learning_rate": 1.7525130216226323e-05, "loss": 0.8875, "step": 1814 }, { "epoch": 0.25, "learning_rate": 1.7522166570873965e-05, "loss": 0.9346, "step": 1815 }, { "epoch": 0.25, "learning_rate": 1.7519201403017056e-05, "loss": 0.917, "step": 1816 }, { "epoch": 0.25, "learning_rate": 1.7516234713255755e-05, "loss": 0.9414, "step": 1817 }, { "epoch": 0.25, "learning_rate": 1.7513266502190518e-05, "loss": 0.9353, "step": 1818 }, { "epoch": 0.25, "learning_rate": 1.751029677042212e-05, "loss": 0.925, "step": 1819 }, { "epoch": 0.25, "learning_rate": 1.7507325518551652e-05, "loss": 0.8577, "step": 1820 }, { "epoch": 0.25, "learning_rate": 1.7504352747180492e-05, "loss": 0.8516, "step": 1821 }, { "epoch": 0.25, "learning_rate": 1.750137845691034e-05, "loss": 0.9128, "step": 1822 }, { "epoch": 0.25, "learning_rate": 1.7498402648343193e-05, "loss": 0.9048, "step": 1823 }, { "epoch": 0.25, "learning_rate": 1.749542532208137e-05, "loss": 0.8335, "step": 1824 }, { "epoch": 0.25, "learning_rate": 1.7492446478727492e-05, "loss": 0.8569, "step": 1825 }, { "epoch": 0.25, "learning_rate": 1.7489466118884472e-05, "loss": 0.835, "step": 1826 }, { "epoch": 0.25, "learning_rate": 1.748648424315555e-05, "loss": 0.884, "step": 1827 }, { "epoch": 0.25, "learning_rate": 1.7483500852144265e-05, "loss": 0.9141, "step": 1828 }, { "epoch": 0.25, "learning_rate": 1.748051594645446e-05, "loss": 0.8792, "step": 1829 }, { "epoch": 0.25, "learning_rate": 1.747752952669029e-05, "loss": 0.6168, "step": 1830 }, { "epoch": 0.25, "learning_rate": 1.7474541593456208e-05, "loss": 0.9148, "step": 1831 }, { "epoch": 0.25, "learning_rate": 1.7471552147356983e-05, "loss": 0.9551, "step": 1832 }, { "epoch": 0.25, "learning_rate": 1.7468561188997686e-05, "loss": 0.8567, "step": 1833 }, { "epoch": 0.25, "learning_rate": 1.7465568718983694e-05, "loss": 0.8843, "step": 1834 }, { "epoch": 0.25, "learning_rate": 1.7462574737920687e-05, "loss": 0.8574, "step": 1835 }, { "epoch": 0.26, "learning_rate": 1.7459579246414655e-05, "loss": 0.9011, "step": 1836 }, { "epoch": 0.26, "learning_rate": 1.7456582245071896e-05, "loss": 0.9067, "step": 1837 }, { "epoch": 0.26, "learning_rate": 1.7453583734499008e-05, "loss": 0.8625, "step": 1838 }, { "epoch": 0.26, "learning_rate": 1.74505837153029e-05, "loss": 0.915, "step": 1839 }, { "epoch": 0.26, "learning_rate": 1.7447582188090777e-05, "loss": 0.817, "step": 1840 }, { "epoch": 0.26, "learning_rate": 1.744457915347016e-05, "loss": 0.8738, "step": 1841 }, { "epoch": 0.26, "learning_rate": 1.744157461204887e-05, "loss": 0.8718, "step": 1842 }, { "epoch": 0.26, "learning_rate": 1.743856856443503e-05, "loss": 0.897, "step": 1843 }, { "epoch": 0.26, "learning_rate": 1.743556101123707e-05, "loss": 0.8062, "step": 1844 }, { "epoch": 0.26, "learning_rate": 1.7432551953063738e-05, "loss": 0.8918, "step": 1845 }, { "epoch": 0.26, "learning_rate": 1.7429541390524058e-05, "loss": 0.939, "step": 1846 }, { "epoch": 0.26, "learning_rate": 1.742652932422739e-05, "loss": 0.8855, "step": 1847 }, { "epoch": 0.26, "learning_rate": 1.7423515754783373e-05, "loss": 0.884, "step": 1848 }, { "epoch": 0.26, "learning_rate": 1.7420500682801963e-05, "loss": 0.8684, "step": 1849 }, { "epoch": 0.26, "learning_rate": 1.741748410889342e-05, "loss": 0.9016, "step": 1850 }, { "epoch": 0.26, "learning_rate": 1.7414466033668307e-05, "loss": 0.8777, "step": 1851 }, { "epoch": 0.26, "learning_rate": 1.7411446457737485e-05, "loss": 0.8906, "step": 1852 }, { "epoch": 0.26, "learning_rate": 1.7408425381712127e-05, "loss": 0.905, "step": 1853 }, { "epoch": 0.26, "learning_rate": 1.7405402806203703e-05, "loss": 0.9077, "step": 1854 }, { "epoch": 0.26, "learning_rate": 1.7402378731823996e-05, "loss": 0.8929, "step": 1855 }, { "epoch": 0.26, "learning_rate": 1.739935315918508e-05, "loss": 0.9456, "step": 1856 }, { "epoch": 0.26, "learning_rate": 1.7396326088899336e-05, "loss": 0.8579, "step": 1857 }, { "epoch": 0.26, "learning_rate": 1.7393297521579457e-05, "loss": 0.6005, "step": 1858 }, { "epoch": 0.26, "learning_rate": 1.7390267457838426e-05, "loss": 0.6041, "step": 1859 }, { "epoch": 0.26, "learning_rate": 1.738723589828954e-05, "loss": 0.9417, "step": 1860 }, { "epoch": 0.26, "learning_rate": 1.7384202843546394e-05, "loss": 0.8984, "step": 1861 }, { "epoch": 0.26, "learning_rate": 1.7381168294222882e-05, "loss": 0.8912, "step": 1862 }, { "epoch": 0.26, "learning_rate": 1.737813225093321e-05, "loss": 0.8945, "step": 1863 }, { "epoch": 0.26, "learning_rate": 1.7375094714291872e-05, "loss": 0.9019, "step": 1864 }, { "epoch": 0.26, "learning_rate": 1.7372055684913676e-05, "loss": 0.8752, "step": 1865 }, { "epoch": 0.26, "learning_rate": 1.736901516341373e-05, "loss": 0.9277, "step": 1866 }, { "epoch": 0.26, "learning_rate": 1.7365973150407446e-05, "loss": 0.895, "step": 1867 }, { "epoch": 0.26, "learning_rate": 1.736292964651053e-05, "loss": 0.8977, "step": 1868 }, { "epoch": 0.26, "learning_rate": 1.7359884652338995e-05, "loss": 0.8489, "step": 1869 }, { "epoch": 0.26, "learning_rate": 1.7356838168509155e-05, "loss": 0.6279, "step": 1870 }, { "epoch": 0.26, "learning_rate": 1.735379019563763e-05, "loss": 0.8745, "step": 1871 }, { "epoch": 0.26, "learning_rate": 1.7350740734341332e-05, "loss": 0.9055, "step": 1872 }, { "epoch": 0.26, "learning_rate": 1.734768978523748e-05, "loss": 0.9265, "step": 1873 }, { "epoch": 0.26, "learning_rate": 1.7344637348943596e-05, "loss": 0.8657, "step": 1874 }, { "epoch": 0.26, "learning_rate": 1.73415834260775e-05, "loss": 0.7988, "step": 1875 }, { "epoch": 0.26, "learning_rate": 1.7338528017257307e-05, "loss": 0.5874, "step": 1876 }, { "epoch": 0.26, "learning_rate": 1.7335471123101447e-05, "loss": 0.9336, "step": 1877 }, { "epoch": 0.26, "learning_rate": 1.733241274422864e-05, "loss": 0.925, "step": 1878 }, { "epoch": 0.26, "learning_rate": 1.732935288125791e-05, "loss": 0.9109, "step": 1879 }, { "epoch": 0.26, "learning_rate": 1.7326291534808576e-05, "loss": 0.9038, "step": 1880 }, { "epoch": 0.26, "learning_rate": 1.7323228705500268e-05, "loss": 0.8879, "step": 1881 }, { "epoch": 0.26, "learning_rate": 1.732016439395291e-05, "loss": 0.894, "step": 1882 }, { "epoch": 0.26, "learning_rate": 1.731709860078672e-05, "loss": 0.9397, "step": 1883 }, { "epoch": 0.26, "learning_rate": 1.7314031326622225e-05, "loss": 0.9358, "step": 1884 }, { "epoch": 0.26, "learning_rate": 1.7310962572080252e-05, "loss": 0.8257, "step": 1885 }, { "epoch": 0.26, "learning_rate": 1.730789233778192e-05, "loss": 0.8823, "step": 1886 }, { "epoch": 0.26, "learning_rate": 1.730482062434865e-05, "loss": 0.8923, "step": 1887 }, { "epoch": 0.26, "learning_rate": 1.7301747432402174e-05, "loss": 0.8499, "step": 1888 }, { "epoch": 0.26, "learning_rate": 1.7298672762564502e-05, "loss": 0.8953, "step": 1889 }, { "epoch": 0.26, "learning_rate": 1.729559661545796e-05, "loss": 0.8455, "step": 1890 }, { "epoch": 0.26, "learning_rate": 1.729251899170517e-05, "loss": 0.8228, "step": 1891 }, { "epoch": 0.26, "learning_rate": 1.7289439891929042e-05, "loss": 0.8721, "step": 1892 }, { "epoch": 0.26, "learning_rate": 1.7286359316752804e-05, "loss": 0.8862, "step": 1893 }, { "epoch": 0.26, "learning_rate": 1.7283277266799964e-05, "loss": 0.8745, "step": 1894 }, { "epoch": 0.26, "learning_rate": 1.7280193742694336e-05, "loss": 0.8997, "step": 1895 }, { "epoch": 0.26, "learning_rate": 1.727710874506004e-05, "loss": 0.8567, "step": 1896 }, { "epoch": 0.26, "learning_rate": 1.7274022274521475e-05, "loss": 0.8394, "step": 1897 }, { "epoch": 0.26, "learning_rate": 1.7270934331703365e-05, "loss": 0.8557, "step": 1898 }, { "epoch": 0.26, "learning_rate": 1.7267844917230702e-05, "loss": 0.9531, "step": 1899 }, { "epoch": 0.26, "learning_rate": 1.7264754031728802e-05, "loss": 0.8937, "step": 1900 }, { "epoch": 0.26, "learning_rate": 1.7261661675823266e-05, "loss": 0.8417, "step": 1901 }, { "epoch": 0.26, "learning_rate": 1.725856785013999e-05, "loss": 0.8506, "step": 1902 }, { "epoch": 0.26, "learning_rate": 1.7255472555305172e-05, "loss": 0.9126, "step": 1903 }, { "epoch": 0.26, "learning_rate": 1.7252375791945312e-05, "loss": 0.858, "step": 1904 }, { "epoch": 0.26, "learning_rate": 1.7249277560687196e-05, "loss": 0.8838, "step": 1905 }, { "epoch": 0.26, "learning_rate": 1.7246177862157918e-05, "loss": 0.8811, "step": 1906 }, { "epoch": 0.26, "learning_rate": 1.7243076696984864e-05, "loss": 0.8894, "step": 1907 }, { "epoch": 0.27, "learning_rate": 1.7239974065795713e-05, "loss": 0.8489, "step": 1908 }, { "epoch": 0.27, "learning_rate": 1.723686996921845e-05, "loss": 0.9072, "step": 1909 }, { "epoch": 0.27, "learning_rate": 1.7233764407881352e-05, "loss": 0.8889, "step": 1910 }, { "epoch": 0.27, "learning_rate": 1.723065738241299e-05, "loss": 0.905, "step": 1911 }, { "epoch": 0.27, "learning_rate": 1.722754889344223e-05, "loss": 0.8406, "step": 1912 }, { "epoch": 0.27, "learning_rate": 1.722443894159824e-05, "loss": 0.8748, "step": 1913 }, { "epoch": 0.27, "learning_rate": 1.722132752751049e-05, "loss": 0.8293, "step": 1914 }, { "epoch": 0.27, "learning_rate": 1.7218214651808725e-05, "loss": 0.9285, "step": 1915 }, { "epoch": 0.27, "learning_rate": 1.7215100315123003e-05, "loss": 0.9111, "step": 1916 }, { "epoch": 0.27, "learning_rate": 1.7211984518083674e-05, "loss": 0.5946, "step": 1917 }, { "epoch": 0.27, "learning_rate": 1.7208867261321387e-05, "loss": 0.8413, "step": 1918 }, { "epoch": 0.27, "learning_rate": 1.7205748545467075e-05, "loss": 0.9106, "step": 1919 }, { "epoch": 0.27, "learning_rate": 1.7202628371151975e-05, "loss": 0.8317, "step": 1920 }, { "epoch": 0.27, "learning_rate": 1.7199506739007624e-05, "loss": 0.8765, "step": 1921 }, { "epoch": 0.27, "learning_rate": 1.719638364966584e-05, "loss": 0.9111, "step": 1922 }, { "epoch": 0.27, "learning_rate": 1.719325910375875e-05, "loss": 0.8962, "step": 1923 }, { "epoch": 0.27, "learning_rate": 1.7190133101918765e-05, "loss": 0.9553, "step": 1924 }, { "epoch": 0.27, "learning_rate": 1.7187005644778593e-05, "loss": 0.9041, "step": 1925 }, { "epoch": 0.27, "learning_rate": 1.7183876732971248e-05, "loss": 0.6466, "step": 1926 }, { "epoch": 0.27, "learning_rate": 1.718074636713002e-05, "loss": 0.8838, "step": 1927 }, { "epoch": 0.27, "learning_rate": 1.717761454788851e-05, "loss": 0.9546, "step": 1928 }, { "epoch": 0.27, "learning_rate": 1.7174481275880604e-05, "loss": 0.9172, "step": 1929 }, { "epoch": 0.27, "learning_rate": 1.717134655174048e-05, "loss": 0.7808, "step": 1930 }, { "epoch": 0.27, "learning_rate": 1.7168210376102612e-05, "loss": 0.9099, "step": 1931 }, { "epoch": 0.27, "learning_rate": 1.7165072749601776e-05, "loss": 0.9539, "step": 1932 }, { "epoch": 0.27, "learning_rate": 1.7161933672873032e-05, "loss": 0.6477, "step": 1933 }, { "epoch": 0.27, "learning_rate": 1.7158793146551736e-05, "loss": 0.8684, "step": 1934 }, { "epoch": 0.27, "learning_rate": 1.7155651171273543e-05, "loss": 0.9294, "step": 1935 }, { "epoch": 0.27, "learning_rate": 1.7152507747674388e-05, "loss": 0.897, "step": 1936 }, { "epoch": 0.27, "learning_rate": 1.7149362876390514e-05, "loss": 0.8655, "step": 1937 }, { "epoch": 0.27, "learning_rate": 1.7146216558058447e-05, "loss": 0.8237, "step": 1938 }, { "epoch": 0.27, "learning_rate": 1.7143068793315013e-05, "loss": 0.9097, "step": 1939 }, { "epoch": 0.27, "learning_rate": 1.7139919582797323e-05, "loss": 0.9097, "step": 1940 }, { "epoch": 0.27, "learning_rate": 1.7136768927142786e-05, "loss": 0.8582, "step": 1941 }, { "epoch": 0.27, "learning_rate": 1.7133616826989104e-05, "loss": 0.9177, "step": 1942 }, { "epoch": 0.27, "learning_rate": 1.7130463282974267e-05, "loss": 0.9214, "step": 1943 }, { "epoch": 0.27, "learning_rate": 1.7127308295736563e-05, "loss": 0.8356, "step": 1944 }, { "epoch": 0.27, "learning_rate": 1.7124151865914566e-05, "loss": 0.9399, "step": 1945 }, { "epoch": 0.27, "learning_rate": 1.7120993994147146e-05, "loss": 0.8417, "step": 1946 }, { "epoch": 0.27, "learning_rate": 1.7117834681073467e-05, "loss": 0.8629, "step": 1947 }, { "epoch": 0.27, "learning_rate": 1.7114673927332975e-05, "loss": 0.5888, "step": 1948 }, { "epoch": 0.27, "learning_rate": 1.7111511733565424e-05, "loss": 0.8823, "step": 1949 }, { "epoch": 0.27, "learning_rate": 1.7108348100410838e-05, "loss": 0.8512, "step": 1950 }, { "epoch": 0.27, "learning_rate": 1.710518302850955e-05, "loss": 0.6288, "step": 1951 }, { "epoch": 0.27, "learning_rate": 1.7102016518502176e-05, "loss": 0.938, "step": 1952 }, { "epoch": 0.27, "learning_rate": 1.709884857102963e-05, "loss": 0.8599, "step": 1953 }, { "epoch": 0.27, "learning_rate": 1.7095679186733108e-05, "loss": 0.8691, "step": 1954 }, { "epoch": 0.27, "learning_rate": 1.70925083662541e-05, "loss": 0.9463, "step": 1955 }, { "epoch": 0.27, "learning_rate": 1.708933611023439e-05, "loss": 0.9309, "step": 1956 }, { "epoch": 0.27, "learning_rate": 1.7086162419316053e-05, "loss": 0.8271, "step": 1957 }, { "epoch": 0.27, "learning_rate": 1.7082987294141444e-05, "loss": 0.873, "step": 1958 }, { "epoch": 0.27, "learning_rate": 1.707981073535322e-05, "loss": 0.9302, "step": 1959 }, { "epoch": 0.27, "learning_rate": 1.707663274359433e-05, "loss": 0.9067, "step": 1960 }, { "epoch": 0.27, "learning_rate": 1.7073453319508e-05, "loss": 0.9001, "step": 1961 }, { "epoch": 0.27, "learning_rate": 1.707027246373775e-05, "loss": 0.9465, "step": 1962 }, { "epoch": 0.27, "learning_rate": 1.7067090176927402e-05, "loss": 0.9038, "step": 1963 }, { "epoch": 0.27, "learning_rate": 1.7063906459721055e-05, "loss": 0.917, "step": 1964 }, { "epoch": 0.27, "learning_rate": 1.7060721312763096e-05, "loss": 0.3792, "step": 1965 }, { "epoch": 0.27, "learning_rate": 1.7057534736698212e-05, "loss": 0.8455, "step": 1966 }, { "epoch": 0.27, "learning_rate": 1.7054346732171373e-05, "loss": 0.8585, "step": 1967 }, { "epoch": 0.27, "learning_rate": 1.7051157299827833e-05, "loss": 0.6499, "step": 1968 }, { "epoch": 0.27, "learning_rate": 1.704796644031315e-05, "loss": 0.6447, "step": 1969 }, { "epoch": 0.27, "learning_rate": 1.704477415427316e-05, "loss": 0.8433, "step": 1970 }, { "epoch": 0.27, "learning_rate": 1.7041580442353983e-05, "loss": 0.8945, "step": 1971 }, { "epoch": 0.27, "learning_rate": 1.7038385305202036e-05, "loss": 0.938, "step": 1972 }, { "epoch": 0.27, "learning_rate": 1.7035188743464023e-05, "loss": 1.0042, "step": 1973 }, { "epoch": 0.27, "learning_rate": 1.7031990757786942e-05, "loss": 0.9531, "step": 1974 }, { "epoch": 0.27, "learning_rate": 1.7028791348818062e-05, "loss": 0.9368, "step": 1975 }, { "epoch": 0.27, "learning_rate": 1.702559051720496e-05, "loss": 0.8813, "step": 1976 }, { "epoch": 0.27, "learning_rate": 1.702238826359549e-05, "loss": 0.8645, "step": 1977 }, { "epoch": 0.27, "learning_rate": 1.701918458863779e-05, "loss": 0.8467, "step": 1978 }, { "epoch": 0.27, "learning_rate": 1.7015979492980297e-05, "loss": 0.8033, "step": 1979 }, { "epoch": 0.28, "learning_rate": 1.701277297727173e-05, "loss": 0.916, "step": 1980 }, { "epoch": 0.28, "learning_rate": 1.7009565042161097e-05, "loss": 0.8572, "step": 1981 }, { "epoch": 0.28, "learning_rate": 1.7006355688297686e-05, "loss": 0.9712, "step": 1982 }, { "epoch": 0.28, "learning_rate": 1.700314491633108e-05, "loss": 0.8613, "step": 1983 }, { "epoch": 0.28, "learning_rate": 1.6999932726911153e-05, "loss": 0.8394, "step": 1984 }, { "epoch": 0.28, "learning_rate": 1.699671912068805e-05, "loss": 0.9575, "step": 1985 }, { "epoch": 0.28, "learning_rate": 1.699350409831222e-05, "loss": 0.8838, "step": 1986 }, { "epoch": 0.28, "learning_rate": 1.6990287660434388e-05, "loss": 0.8984, "step": 1987 }, { "epoch": 0.28, "learning_rate": 1.698706980770557e-05, "loss": 0.9263, "step": 1988 }, { "epoch": 0.28, "learning_rate": 1.698385054077707e-05, "loss": 0.6022, "step": 1989 }, { "epoch": 0.28, "learning_rate": 1.698062986030047e-05, "loss": 0.894, "step": 1990 }, { "epoch": 0.28, "learning_rate": 1.697740776692764e-05, "loss": 0.8567, "step": 1991 }, { "epoch": 0.28, "learning_rate": 1.697418426131075e-05, "loss": 0.8262, "step": 1992 }, { "epoch": 0.28, "learning_rate": 1.6970959344102237e-05, "loss": 0.9109, "step": 1993 }, { "epoch": 0.28, "learning_rate": 1.696773301595484e-05, "loss": 0.8491, "step": 1994 }, { "epoch": 0.28, "learning_rate": 1.6964505277521567e-05, "loss": 0.9717, "step": 1995 }, { "epoch": 0.28, "learning_rate": 1.6961276129455722e-05, "loss": 0.8965, "step": 1996 }, { "epoch": 0.28, "learning_rate": 1.69580455724109e-05, "loss": 0.8667, "step": 1997 }, { "epoch": 0.28, "learning_rate": 1.6954813607040962e-05, "loss": 0.8901, "step": 1998 }, { "epoch": 0.28, "learning_rate": 1.6951580234000073e-05, "loss": 0.8826, "step": 1999 }, { "epoch": 0.28, "learning_rate": 1.6948345453942674e-05, "loss": 0.8599, "step": 2000 }, { "epoch": 0.28, "learning_rate": 1.694510926752349e-05, "loss": 0.8602, "step": 2001 }, { "epoch": 0.28, "learning_rate": 1.6941871675397538e-05, "loss": 0.8945, "step": 2002 }, { "epoch": 0.28, "learning_rate": 1.6938632678220106e-05, "loss": 0.7883, "step": 2003 }, { "epoch": 0.28, "learning_rate": 1.6935392276646783e-05, "loss": 0.9001, "step": 2004 }, { "epoch": 0.28, "learning_rate": 1.6932150471333432e-05, "loss": 0.884, "step": 2005 }, { "epoch": 0.28, "learning_rate": 1.6928907262936197e-05, "loss": 0.9023, "step": 2006 }, { "epoch": 0.28, "learning_rate": 1.6925662652111515e-05, "loss": 0.8433, "step": 2007 }, { "epoch": 0.28, "learning_rate": 1.692241663951611e-05, "loss": 0.8594, "step": 2008 }, { "epoch": 0.28, "learning_rate": 1.6919169225806967e-05, "loss": 0.8674, "step": 2009 }, { "epoch": 0.28, "learning_rate": 1.6915920411641387e-05, "loss": 0.8738, "step": 2010 }, { "epoch": 0.28, "learning_rate": 1.6912670197676927e-05, "loss": 0.8596, "step": 2011 }, { "epoch": 0.28, "learning_rate": 1.690941858457144e-05, "loss": 0.9023, "step": 2012 }, { "epoch": 0.28, "learning_rate": 1.6906165572983062e-05, "loss": 0.8601, "step": 2013 }, { "epoch": 0.28, "learning_rate": 1.690291116357021e-05, "loss": 0.8792, "step": 2014 }, { "epoch": 0.28, "learning_rate": 1.6899655356991584e-05, "loss": 0.9194, "step": 2015 }, { "epoch": 0.28, "learning_rate": 1.6896398153906165e-05, "loss": 0.8667, "step": 2016 }, { "epoch": 0.28, "learning_rate": 1.6893139554973225e-05, "loss": 0.6409, "step": 2017 }, { "epoch": 0.28, "learning_rate": 1.6889879560852307e-05, "loss": 0.8606, "step": 2018 }, { "epoch": 0.28, "learning_rate": 1.6886618172203243e-05, "loss": 0.8823, "step": 2019 }, { "epoch": 0.28, "learning_rate": 1.6883355389686142e-05, "loss": 0.8994, "step": 2020 }, { "epoch": 0.28, "learning_rate": 1.6880091213961403e-05, "loss": 0.8828, "step": 2021 }, { "epoch": 0.28, "learning_rate": 1.6876825645689708e-05, "loss": 0.9146, "step": 2022 }, { "epoch": 0.28, "learning_rate": 1.6873558685532007e-05, "loss": 0.866, "step": 2023 }, { "epoch": 0.28, "learning_rate": 1.687029033414954e-05, "loss": 0.8638, "step": 2024 }, { "epoch": 0.28, "learning_rate": 1.6867020592203838e-05, "loss": 0.856, "step": 2025 }, { "epoch": 0.28, "learning_rate": 1.68637494603567e-05, "loss": 0.9165, "step": 2026 }, { "epoch": 0.28, "learning_rate": 1.686047693927021e-05, "loss": 0.6021, "step": 2027 }, { "epoch": 0.28, "learning_rate": 1.6857203029606736e-05, "loss": 0.8804, "step": 2028 }, { "epoch": 0.28, "learning_rate": 1.6853927732028918e-05, "loss": 0.823, "step": 2029 }, { "epoch": 0.28, "learning_rate": 1.6850651047199695e-05, "loss": 0.9109, "step": 2030 }, { "epoch": 0.28, "learning_rate": 1.684737297578227e-05, "loss": 0.8867, "step": 2031 }, { "epoch": 0.28, "learning_rate": 1.6844093518440133e-05, "loss": 0.8667, "step": 2032 }, { "epoch": 0.28, "learning_rate": 1.6840812675837054e-05, "loss": 0.8826, "step": 2033 }, { "epoch": 0.28, "learning_rate": 1.6837530448637087e-05, "loss": 0.8708, "step": 2034 }, { "epoch": 0.28, "learning_rate": 1.6834246837504556e-05, "loss": 0.8987, "step": 2035 }, { "epoch": 0.28, "learning_rate": 1.683096184310408e-05, "loss": 0.8518, "step": 2036 }, { "epoch": 0.28, "learning_rate": 1.682767546610054e-05, "loss": 0.681, "step": 2037 }, { "epoch": 0.28, "learning_rate": 1.6824387707159112e-05, "loss": 0.9094, "step": 2038 }, { "epoch": 0.28, "learning_rate": 1.682109856694525e-05, "loss": 0.8669, "step": 2039 }, { "epoch": 0.28, "learning_rate": 1.6817808046124676e-05, "loss": 0.6469, "step": 2040 }, { "epoch": 0.28, "learning_rate": 1.6814516145363404e-05, "loss": 0.9275, "step": 2041 }, { "epoch": 0.28, "learning_rate": 1.681122286532772e-05, "loss": 0.9717, "step": 2042 }, { "epoch": 0.28, "learning_rate": 1.6807928206684196e-05, "loss": 0.8879, "step": 2043 }, { "epoch": 0.28, "learning_rate": 1.6804632170099675e-05, "loss": 0.6145, "step": 2044 }, { "epoch": 0.28, "learning_rate": 1.680133475624129e-05, "loss": 0.8572, "step": 2045 }, { "epoch": 0.28, "learning_rate": 1.6798035965776433e-05, "loss": 0.821, "step": 2046 }, { "epoch": 0.28, "learning_rate": 1.679473579937279e-05, "loss": 0.9465, "step": 2047 }, { "epoch": 0.28, "learning_rate": 1.6791434257698332e-05, "loss": 0.6235, "step": 2048 }, { "epoch": 0.28, "learning_rate": 1.6788131341421292e-05, "loss": 0.9329, "step": 2049 }, { "epoch": 0.28, "learning_rate": 1.6784827051210192e-05, "loss": 0.8601, "step": 2050 }, { "epoch": 0.28, "learning_rate": 1.678152138773382e-05, "loss": 0.8726, "step": 2051 }, { "epoch": 0.29, "learning_rate": 1.677821435166126e-05, "loss": 0.9285, "step": 2052 }, { "epoch": 0.29, "learning_rate": 1.6774905943661857e-05, "loss": 0.8762, "step": 2053 }, { "epoch": 0.29, "learning_rate": 1.6771596164405246e-05, "loss": 0.9146, "step": 2054 }, { "epoch": 0.29, "learning_rate": 1.6768285014561332e-05, "loss": 0.8506, "step": 2055 }, { "epoch": 0.29, "learning_rate": 1.6764972494800296e-05, "loss": 0.9099, "step": 2056 }, { "epoch": 0.29, "learning_rate": 1.6761658605792605e-05, "loss": 0.8364, "step": 2057 }, { "epoch": 0.29, "learning_rate": 1.6758343348208996e-05, "loss": 0.8232, "step": 2058 }, { "epoch": 0.29, "learning_rate": 1.6755026722720487e-05, "loss": 0.8623, "step": 2059 }, { "epoch": 0.29, "learning_rate": 1.675170872999837e-05, "loss": 0.7898, "step": 2060 }, { "epoch": 0.29, "learning_rate": 1.6748389370714212e-05, "loss": 0.9148, "step": 2061 }, { "epoch": 0.29, "learning_rate": 1.6745068645539865e-05, "loss": 0.8948, "step": 2062 }, { "epoch": 0.29, "learning_rate": 1.6741746555147445e-05, "loss": 0.9299, "step": 2063 }, { "epoch": 0.29, "learning_rate": 1.6738423100209353e-05, "loss": 0.8391, "step": 2064 }, { "epoch": 0.29, "learning_rate": 1.6735098281398273e-05, "loss": 0.8896, "step": 2065 }, { "epoch": 0.29, "learning_rate": 1.673177209938714e-05, "loss": 0.8337, "step": 2066 }, { "epoch": 0.29, "learning_rate": 1.6728444554849194e-05, "loss": 0.8755, "step": 2067 }, { "epoch": 0.29, "learning_rate": 1.6725115648457936e-05, "loss": 0.9175, "step": 2068 }, { "epoch": 0.29, "learning_rate": 1.672178538088714e-05, "loss": 0.8865, "step": 2069 }, { "epoch": 0.29, "learning_rate": 1.6718453752810863e-05, "loss": 0.7913, "step": 2070 }, { "epoch": 0.29, "learning_rate": 1.6715120764903433e-05, "loss": 0.9128, "step": 2071 }, { "epoch": 0.29, "learning_rate": 1.671178641783946e-05, "loss": 0.892, "step": 2072 }, { "epoch": 0.29, "learning_rate": 1.6708450712293815e-05, "loss": 0.9438, "step": 2073 }, { "epoch": 0.29, "learning_rate": 1.670511364894166e-05, "loss": 0.8555, "step": 2074 }, { "epoch": 0.29, "learning_rate": 1.6701775228458425e-05, "loss": 0.8604, "step": 2075 }, { "epoch": 0.29, "learning_rate": 1.6698435451519808e-05, "loss": 0.8672, "step": 2076 }, { "epoch": 0.29, "learning_rate": 1.669509431880179e-05, "loss": 0.9006, "step": 2077 }, { "epoch": 0.29, "learning_rate": 1.669175183098063e-05, "loss": 0.9238, "step": 2078 }, { "epoch": 0.29, "learning_rate": 1.668840798873285e-05, "loss": 0.8447, "step": 2079 }, { "epoch": 0.29, "learning_rate": 1.6685062792735255e-05, "loss": 0.6191, "step": 2080 }, { "epoch": 0.29, "learning_rate": 1.6681716243664915e-05, "loss": 0.8584, "step": 2081 }, { "epoch": 0.29, "learning_rate": 1.6678368342199185e-05, "loss": 0.8303, "step": 2082 }, { "epoch": 0.29, "learning_rate": 1.6675019089015686e-05, "loss": 0.9451, "step": 2083 }, { "epoch": 0.29, "learning_rate": 1.6671668484792315e-05, "loss": 0.8982, "step": 2084 }, { "epoch": 0.29, "learning_rate": 1.6668316530207244e-05, "loss": 0.8621, "step": 2085 }, { "epoch": 0.29, "learning_rate": 1.6664963225938916e-05, "loss": 0.9119, "step": 2086 }, { "epoch": 0.29, "learning_rate": 1.6661608572666045e-05, "loss": 0.8833, "step": 2087 }, { "epoch": 0.29, "learning_rate": 1.6658252571067626e-05, "loss": 0.8752, "step": 2088 }, { "epoch": 0.29, "learning_rate": 1.6654895221822918e-05, "loss": 0.8787, "step": 2089 }, { "epoch": 0.29, "learning_rate": 1.6651536525611455e-05, "loss": 0.8477, "step": 2090 }, { "epoch": 0.29, "learning_rate": 1.6648176483113053e-05, "loss": 0.9148, "step": 2091 }, { "epoch": 0.29, "learning_rate": 1.6644815095007784e-05, "loss": 0.8682, "step": 2092 }, { "epoch": 0.29, "learning_rate": 1.6641452361976e-05, "loss": 0.9438, "step": 2093 }, { "epoch": 0.29, "learning_rate": 1.6638088284698337e-05, "loss": 0.8525, "step": 2094 }, { "epoch": 0.29, "learning_rate": 1.6634722863855684e-05, "loss": 0.5983, "step": 2095 }, { "epoch": 0.29, "learning_rate": 1.6631356100129212e-05, "loss": 0.7493, "step": 2096 }, { "epoch": 0.29, "learning_rate": 1.662798799420036e-05, "loss": 0.8657, "step": 2097 }, { "epoch": 0.29, "learning_rate": 1.6624618546750842e-05, "loss": 0.8215, "step": 2098 }, { "epoch": 0.29, "learning_rate": 1.6621247758462647e-05, "loss": 0.8611, "step": 2099 }, { "epoch": 0.29, "learning_rate": 1.6617875630018025e-05, "loss": 0.663, "step": 2100 }, { "epoch": 0.29, "learning_rate": 1.6614502162099508e-05, "loss": 0.8511, "step": 2101 }, { "epoch": 0.29, "learning_rate": 1.6611127355389883e-05, "loss": 0.832, "step": 2102 }, { "epoch": 0.29, "learning_rate": 1.660775121057223e-05, "loss": 0.6108, "step": 2103 }, { "epoch": 0.29, "learning_rate": 1.6604373728329888e-05, "loss": 0.9121, "step": 2104 }, { "epoch": 0.29, "learning_rate": 1.660099490934646e-05, "loss": 0.929, "step": 2105 }, { "epoch": 0.29, "learning_rate": 1.6597614754305838e-05, "loss": 0.8262, "step": 2106 }, { "epoch": 0.29, "learning_rate": 1.6594233263892164e-05, "loss": 0.6232, "step": 2107 }, { "epoch": 0.29, "learning_rate": 1.6590850438789864e-05, "loss": 0.3757, "step": 2108 }, { "epoch": 0.29, "learning_rate": 1.658746627968363e-05, "loss": 0.8125, "step": 2109 }, { "epoch": 0.29, "learning_rate": 1.658408078725842e-05, "loss": 0.8831, "step": 2110 }, { "epoch": 0.29, "learning_rate": 1.6580693962199473e-05, "loss": 0.9067, "step": 2111 }, { "epoch": 0.29, "learning_rate": 1.6577305805192283e-05, "loss": 0.9084, "step": 2112 }, { "epoch": 0.29, "learning_rate": 1.6573916316922623e-05, "loss": 0.9749, "step": 2113 }, { "epoch": 0.29, "learning_rate": 1.657052549807654e-05, "loss": 0.8706, "step": 2114 }, { "epoch": 0.29, "learning_rate": 1.6567133349340334e-05, "loss": 0.8262, "step": 2115 }, { "epoch": 0.29, "learning_rate": 1.6563739871400593e-05, "loss": 0.5912, "step": 2116 }, { "epoch": 0.29, "learning_rate": 1.656034506494416e-05, "loss": 0.894, "step": 2117 }, { "epoch": 0.29, "learning_rate": 1.655694893065815e-05, "loss": 0.8923, "step": 2118 }, { "epoch": 0.29, "learning_rate": 1.6553551469229954e-05, "loss": 0.917, "step": 2119 }, { "epoch": 0.29, "learning_rate": 1.6550152681347223e-05, "loss": 0.8833, "step": 2120 }, { "epoch": 0.29, "learning_rate": 1.6546752567697884e-05, "loss": 0.9314, "step": 2121 }, { "epoch": 0.29, "learning_rate": 1.654335112897012e-05, "loss": 0.9021, "step": 2122 }, { "epoch": 0.29, "learning_rate": 1.6539948365852397e-05, "loss": 0.6023, "step": 2123 }, { "epoch": 0.3, "learning_rate": 1.6536544279033443e-05, "loss": 0.8442, "step": 2124 }, { "epoch": 0.3, "learning_rate": 1.653313886920225e-05, "loss": 0.853, "step": 2125 }, { "epoch": 0.3, "learning_rate": 1.652973213704808e-05, "loss": 0.8789, "step": 2126 }, { "epoch": 0.3, "learning_rate": 1.652632408326047e-05, "loss": 0.8867, "step": 2127 }, { "epoch": 0.3, "learning_rate": 1.652291470852921e-05, "loss": 0.9287, "step": 2128 }, { "epoch": 0.3, "learning_rate": 1.6519504013544373e-05, "loss": 0.8623, "step": 2129 }, { "epoch": 0.3, "learning_rate": 1.6516091998996287e-05, "loss": 0.8716, "step": 2130 }, { "epoch": 0.3, "learning_rate": 1.6512678665575554e-05, "loss": 0.9802, "step": 2131 }, { "epoch": 0.3, "learning_rate": 1.650926401397304e-05, "loss": 0.936, "step": 2132 }, { "epoch": 0.3, "learning_rate": 1.6505848044879876e-05, "loss": 0.5864, "step": 2133 }, { "epoch": 0.3, "learning_rate": 1.6502430758987472e-05, "loss": 0.8645, "step": 2134 }, { "epoch": 0.3, "learning_rate": 1.6499012156987486e-05, "loss": 0.917, "step": 2135 }, { "epoch": 0.3, "learning_rate": 1.6495592239571854e-05, "loss": 0.885, "step": 2136 }, { "epoch": 0.3, "learning_rate": 1.649217100743277e-05, "loss": 0.8826, "step": 2137 }, { "epoch": 0.3, "learning_rate": 1.6488748461262713e-05, "loss": 0.9043, "step": 2138 }, { "epoch": 0.3, "learning_rate": 1.64853246017544e-05, "loss": 0.8091, "step": 2139 }, { "epoch": 0.3, "learning_rate": 1.6481899429600836e-05, "loss": 0.8997, "step": 2140 }, { "epoch": 0.3, "learning_rate": 1.6478472945495284e-05, "loss": 0.897, "step": 2141 }, { "epoch": 0.3, "learning_rate": 1.647504515013127e-05, "loss": 0.8704, "step": 2142 }, { "epoch": 0.3, "learning_rate": 1.647161604420259e-05, "loss": 0.5754, "step": 2143 }, { "epoch": 0.3, "learning_rate": 1.6468185628403303e-05, "loss": 0.8721, "step": 2144 }, { "epoch": 0.3, "learning_rate": 1.646475390342773e-05, "loss": 0.9028, "step": 2145 }, { "epoch": 0.3, "learning_rate": 1.6461320869970466e-05, "loss": 0.8955, "step": 2146 }, { "epoch": 0.3, "learning_rate": 1.645788652872636e-05, "loss": 0.9312, "step": 2147 }, { "epoch": 0.3, "learning_rate": 1.645445088039054e-05, "loss": 0.8914, "step": 2148 }, { "epoch": 0.3, "learning_rate": 1.6451013925658375e-05, "loss": 0.9185, "step": 2149 }, { "epoch": 0.3, "learning_rate": 1.6447575665225524e-05, "loss": 0.8774, "step": 2150 }, { "epoch": 0.3, "learning_rate": 1.6444136099787894e-05, "loss": 0.8589, "step": 2151 }, { "epoch": 0.3, "learning_rate": 1.6440695230041666e-05, "loss": 0.791, "step": 2152 }, { "epoch": 0.3, "learning_rate": 1.6437253056683276e-05, "loss": 0.818, "step": 2153 }, { "epoch": 0.3, "learning_rate": 1.6433809580409432e-05, "loss": 0.8821, "step": 2154 }, { "epoch": 0.3, "learning_rate": 1.6430364801917095e-05, "loss": 0.8201, "step": 2155 }, { "epoch": 0.3, "learning_rate": 1.6426918721903504e-05, "loss": 0.9321, "step": 2156 }, { "epoch": 0.3, "learning_rate": 1.642347134106615e-05, "loss": 0.874, "step": 2157 }, { "epoch": 0.3, "learning_rate": 1.6420022660102793e-05, "loss": 0.8889, "step": 2158 }, { "epoch": 0.3, "learning_rate": 1.6416572679711453e-05, "loss": 0.8997, "step": 2159 }, { "epoch": 0.3, "learning_rate": 1.6413121400590413e-05, "loss": 0.8994, "step": 2160 }, { "epoch": 0.3, "learning_rate": 1.6409668823438223e-05, "loss": 0.804, "step": 2161 }, { "epoch": 0.3, "learning_rate": 1.640621494895369e-05, "loss": 0.8716, "step": 2162 }, { "epoch": 0.3, "learning_rate": 1.6402759777835888e-05, "loss": 0.9307, "step": 2163 }, { "epoch": 0.3, "learning_rate": 1.6399303310784153e-05, "loss": 0.8857, "step": 2164 }, { "epoch": 0.3, "learning_rate": 1.6395845548498082e-05, "loss": 0.675, "step": 2165 }, { "epoch": 0.3, "learning_rate": 1.639238649167753e-05, "loss": 0.885, "step": 2166 }, { "epoch": 0.3, "learning_rate": 1.6388926141022627e-05, "loss": 0.8672, "step": 2167 }, { "epoch": 0.3, "learning_rate": 1.638546449723375e-05, "loss": 0.9182, "step": 2168 }, { "epoch": 0.3, "learning_rate": 1.6382001561011543e-05, "loss": 0.886, "step": 2169 }, { "epoch": 0.3, "learning_rate": 1.6378537333056913e-05, "loss": 0.8318, "step": 2170 }, { "epoch": 0.3, "learning_rate": 1.6375071814071035e-05, "loss": 0.8792, "step": 2171 }, { "epoch": 0.3, "learning_rate": 1.6371605004755332e-05, "loss": 0.8955, "step": 2172 }, { "epoch": 0.3, "learning_rate": 1.6368136905811493e-05, "loss": 0.8667, "step": 2173 }, { "epoch": 0.3, "learning_rate": 1.6364667517941476e-05, "loss": 0.8982, "step": 2174 }, { "epoch": 0.3, "learning_rate": 1.6361196841847484e-05, "loss": 0.8752, "step": 2175 }, { "epoch": 0.3, "learning_rate": 1.6357724878232e-05, "loss": 0.8616, "step": 2176 }, { "epoch": 0.3, "learning_rate": 1.6354251627797754e-05, "loss": 0.6151, "step": 2177 }, { "epoch": 0.3, "learning_rate": 1.635077709124774e-05, "loss": 0.8682, "step": 2178 }, { "epoch": 0.3, "learning_rate": 1.634730126928521e-05, "loss": 0.8987, "step": 2179 }, { "epoch": 0.3, "learning_rate": 1.6343824162613683e-05, "loss": 0.8794, "step": 2180 }, { "epoch": 0.3, "learning_rate": 1.634034577193693e-05, "loss": 0.8569, "step": 2181 }, { "epoch": 0.3, "learning_rate": 1.633686609795899e-05, "loss": 0.8977, "step": 2182 }, { "epoch": 0.3, "learning_rate": 1.6333385141384152e-05, "loss": 0.9128, "step": 2183 }, { "epoch": 0.3, "learning_rate": 1.6329902902916976e-05, "loss": 0.9285, "step": 2184 }, { "epoch": 0.3, "learning_rate": 1.632641938326227e-05, "loss": 0.8945, "step": 2185 }, { "epoch": 0.3, "learning_rate": 1.632293458312511e-05, "loss": 0.8967, "step": 2186 }, { "epoch": 0.3, "learning_rate": 1.6319448503210825e-05, "loss": 0.9336, "step": 2187 }, { "epoch": 0.3, "learning_rate": 1.631596114422501e-05, "loss": 0.8948, "step": 2188 }, { "epoch": 0.3, "learning_rate": 1.631247250687351e-05, "loss": 0.9197, "step": 2189 }, { "epoch": 0.3, "learning_rate": 1.630898259186244e-05, "loss": 0.8311, "step": 2190 }, { "epoch": 0.3, "learning_rate": 1.630549139989816e-05, "loss": 0.8616, "step": 2191 }, { "epoch": 0.3, "learning_rate": 1.63019989316873e-05, "loss": 0.8503, "step": 2192 }, { "epoch": 0.3, "learning_rate": 1.6298505187936743e-05, "loss": 0.8794, "step": 2193 }, { "epoch": 0.3, "learning_rate": 1.629501016935363e-05, "loss": 0.9622, "step": 2194 }, { "epoch": 0.3, "learning_rate": 1.6291513876645362e-05, "loss": 0.9146, "step": 2195 }, { "epoch": 0.31, "learning_rate": 1.62880163105196e-05, "loss": 0.9287, "step": 2196 }, { "epoch": 0.31, "learning_rate": 1.6284517471684252e-05, "loss": 0.8604, "step": 2197 }, { "epoch": 0.31, "learning_rate": 1.6281017360847503e-05, "loss": 0.5972, "step": 2198 }, { "epoch": 0.31, "learning_rate": 1.627751597871777e-05, "loss": 0.873, "step": 2199 }, { "epoch": 0.31, "learning_rate": 1.6274013326003753e-05, "loss": 0.9119, "step": 2200 }, { "epoch": 0.31, "learning_rate": 1.627050940341439e-05, "loss": 0.9387, "step": 2201 }, { "epoch": 0.31, "learning_rate": 1.6267004211658886e-05, "loss": 0.8657, "step": 2202 }, { "epoch": 0.31, "learning_rate": 1.62634977514467e-05, "loss": 0.8806, "step": 2203 }, { "epoch": 0.31, "learning_rate": 1.6259990023487552e-05, "loss": 0.8779, "step": 2204 }, { "epoch": 0.31, "learning_rate": 1.6256481028491407e-05, "loss": 0.5063, "step": 2205 }, { "epoch": 0.31, "learning_rate": 1.6252970767168497e-05, "loss": 0.9236, "step": 2206 }, { "epoch": 0.31, "learning_rate": 1.624945924022931e-05, "loss": 0.8882, "step": 2207 }, { "epoch": 0.31, "learning_rate": 1.6245946448384584e-05, "loss": 0.8992, "step": 2208 }, { "epoch": 0.31, "learning_rate": 1.624243239234532e-05, "loss": 0.6711, "step": 2209 }, { "epoch": 0.31, "learning_rate": 1.6238917072822768e-05, "loss": 0.5667, "step": 2210 }, { "epoch": 0.31, "learning_rate": 1.623540049052844e-05, "loss": 0.8281, "step": 2211 }, { "epoch": 0.31, "learning_rate": 1.6231882646174094e-05, "loss": 0.9016, "step": 2212 }, { "epoch": 0.31, "learning_rate": 1.622836354047176e-05, "loss": 0.8831, "step": 2213 }, { "epoch": 0.31, "learning_rate": 1.622484317413371e-05, "loss": 0.8816, "step": 2214 }, { "epoch": 0.31, "learning_rate": 1.6221321547872468e-05, "loss": 0.9419, "step": 2215 }, { "epoch": 0.31, "learning_rate": 1.6217798662400826e-05, "loss": 0.9202, "step": 2216 }, { "epoch": 0.31, "learning_rate": 1.6214274518431825e-05, "loss": 0.8157, "step": 2217 }, { "epoch": 0.31, "learning_rate": 1.621074911667876e-05, "loss": 0.8557, "step": 2218 }, { "epoch": 0.31, "learning_rate": 1.6207222457855176e-05, "loss": 0.863, "step": 2219 }, { "epoch": 0.31, "learning_rate": 1.6203694542674882e-05, "loss": 0.9111, "step": 2220 }, { "epoch": 0.31, "learning_rate": 1.6200165371851935e-05, "loss": 0.8372, "step": 2221 }, { "epoch": 0.31, "learning_rate": 1.6196634946100647e-05, "loss": 0.6097, "step": 2222 }, { "epoch": 0.31, "learning_rate": 1.6193103266135584e-05, "loss": 0.8987, "step": 2223 }, { "epoch": 0.31, "learning_rate": 1.6189570332671573e-05, "loss": 0.8784, "step": 2224 }, { "epoch": 0.31, "learning_rate": 1.6186036146423678e-05, "loss": 0.926, "step": 2225 }, { "epoch": 0.31, "learning_rate": 1.618250070810723e-05, "loss": 0.8735, "step": 2226 }, { "epoch": 0.31, "learning_rate": 1.6178964018437814e-05, "loss": 0.9006, "step": 2227 }, { "epoch": 0.31, "learning_rate": 1.6175426078131267e-05, "loss": 0.9009, "step": 2228 }, { "epoch": 0.31, "learning_rate": 1.6171886887903668e-05, "loss": 0.8948, "step": 2229 }, { "epoch": 0.31, "learning_rate": 1.616834644847136e-05, "loss": 0.8936, "step": 2230 }, { "epoch": 0.31, "learning_rate": 1.616480476055094e-05, "loss": 0.8503, "step": 2231 }, { "epoch": 0.31, "learning_rate": 1.616126182485925e-05, "loss": 0.5869, "step": 2232 }, { "epoch": 0.31, "learning_rate": 1.6157717642113396e-05, "loss": 0.8823, "step": 2233 }, { "epoch": 0.31, "learning_rate": 1.615417221303072e-05, "loss": 0.9224, "step": 2234 }, { "epoch": 0.31, "learning_rate": 1.6150625538328828e-05, "loss": 0.8591, "step": 2235 }, { "epoch": 0.31, "learning_rate": 1.6147077618725578e-05, "loss": 0.8113, "step": 2236 }, { "epoch": 0.31, "learning_rate": 1.6143528454939077e-05, "loss": 0.8472, "step": 2237 }, { "epoch": 0.31, "learning_rate": 1.6139978047687685e-05, "loss": 0.895, "step": 2238 }, { "epoch": 0.31, "learning_rate": 1.6136426397690007e-05, "loss": 0.9072, "step": 2239 }, { "epoch": 0.31, "learning_rate": 1.6132873505664912e-05, "loss": 0.8591, "step": 2240 }, { "epoch": 0.31, "learning_rate": 1.6129319372331513e-05, "loss": 0.9736, "step": 2241 }, { "epoch": 0.31, "learning_rate": 1.6125763998409173e-05, "loss": 0.8291, "step": 2242 }, { "epoch": 0.31, "learning_rate": 1.6122207384617507e-05, "loss": 0.9333, "step": 2243 }, { "epoch": 0.31, "learning_rate": 1.6118649531676387e-05, "loss": 0.8643, "step": 2244 }, { "epoch": 0.31, "learning_rate": 1.6115090440305927e-05, "loss": 0.9021, "step": 2245 }, { "epoch": 0.31, "learning_rate": 1.6111530111226497e-05, "loss": 0.8887, "step": 2246 }, { "epoch": 0.31, "learning_rate": 1.6107968545158717e-05, "loss": 0.8572, "step": 2247 }, { "epoch": 0.31, "learning_rate": 1.610440574282345e-05, "loss": 0.8711, "step": 2248 }, { "epoch": 0.31, "learning_rate": 1.6100841704941828e-05, "loss": 0.8518, "step": 2249 }, { "epoch": 0.31, "learning_rate": 1.609727643223521e-05, "loss": 0.8696, "step": 2250 }, { "epoch": 0.31, "learning_rate": 1.6093709925425222e-05, "loss": 0.9482, "step": 2251 }, { "epoch": 0.31, "learning_rate": 1.609014218523373e-05, "loss": 0.8696, "step": 2252 }, { "epoch": 0.31, "learning_rate": 1.6086573212382855e-05, "loss": 0.8755, "step": 2253 }, { "epoch": 0.31, "learning_rate": 1.6083003007594965e-05, "loss": 0.8674, "step": 2254 }, { "epoch": 0.31, "learning_rate": 1.6079431571592675e-05, "loss": 0.8989, "step": 2255 }, { "epoch": 0.31, "learning_rate": 1.6075858905098856e-05, "loss": 0.7062, "step": 2256 }, { "epoch": 0.31, "learning_rate": 1.6072285008836628e-05, "loss": 0.8657, "step": 2257 }, { "epoch": 0.31, "learning_rate": 1.606870988352935e-05, "loss": 0.8267, "step": 2258 }, { "epoch": 0.31, "learning_rate": 1.6065133529900637e-05, "loss": 0.9907, "step": 2259 }, { "epoch": 0.31, "learning_rate": 1.6061555948674352e-05, "loss": 0.936, "step": 2260 }, { "epoch": 0.31, "learning_rate": 1.605797714057461e-05, "loss": 0.8545, "step": 2261 }, { "epoch": 0.31, "learning_rate": 1.605439710632576e-05, "loss": 0.884, "step": 2262 }, { "epoch": 0.31, "learning_rate": 1.605081584665242e-05, "loss": 0.9404, "step": 2263 }, { "epoch": 0.31, "learning_rate": 1.604723336227944e-05, "loss": 0.8782, "step": 2264 }, { "epoch": 0.31, "learning_rate": 1.6043649653931926e-05, "loss": 0.8826, "step": 2265 }, { "epoch": 0.31, "learning_rate": 1.6040064722335227e-05, "loss": 0.8833, "step": 2266 }, { "epoch": 0.31, "learning_rate": 1.6036478568214944e-05, "loss": 0.8589, "step": 2267 }, { "epoch": 0.32, "learning_rate": 1.6032891192296922e-05, "loss": 0.9448, "step": 2268 }, { "epoch": 0.32, "learning_rate": 1.6029302595307255e-05, "loss": 0.7927, "step": 2269 }, { "epoch": 0.32, "learning_rate": 1.6025712777972285e-05, "loss": 0.8289, "step": 2270 }, { "epoch": 0.32, "learning_rate": 1.6022121741018596e-05, "loss": 0.8538, "step": 2271 }, { "epoch": 0.32, "learning_rate": 1.6018529485173024e-05, "loss": 0.8635, "step": 2272 }, { "epoch": 0.32, "learning_rate": 1.601493601116265e-05, "loss": 0.8999, "step": 2273 }, { "epoch": 0.32, "learning_rate": 1.6011341319714804e-05, "loss": 0.865, "step": 2274 }, { "epoch": 0.32, "learning_rate": 1.6007745411557062e-05, "loss": 0.8621, "step": 2275 }, { "epoch": 0.32, "learning_rate": 1.6004148287417235e-05, "loss": 0.8561, "step": 2276 }, { "epoch": 0.32, "learning_rate": 1.60005499480234e-05, "loss": 0.8374, "step": 2277 }, { "epoch": 0.32, "learning_rate": 1.599695039410386e-05, "loss": 0.9299, "step": 2278 }, { "epoch": 0.32, "learning_rate": 1.5993349626387186e-05, "loss": 0.8691, "step": 2279 }, { "epoch": 0.32, "learning_rate": 1.598974764560217e-05, "loss": 0.9143, "step": 2280 }, { "epoch": 0.32, "learning_rate": 1.5986144452477865e-05, "loss": 0.6305, "step": 2281 }, { "epoch": 0.32, "learning_rate": 1.5982540047743565e-05, "loss": 0.8896, "step": 2282 }, { "epoch": 0.32, "learning_rate": 1.5978934432128817e-05, "loss": 0.8385, "step": 2283 }, { "epoch": 0.32, "learning_rate": 1.59753276063634e-05, "loss": 0.908, "step": 2284 }, { "epoch": 0.32, "learning_rate": 1.5971719571177346e-05, "loss": 0.8809, "step": 2285 }, { "epoch": 0.32, "learning_rate": 1.5968110327300925e-05, "loss": 0.8245, "step": 2286 }, { "epoch": 0.32, "learning_rate": 1.5964499875464665e-05, "loss": 0.8914, "step": 2287 }, { "epoch": 0.32, "learning_rate": 1.5960888216399326e-05, "loss": 0.6082, "step": 2288 }, { "epoch": 0.32, "learning_rate": 1.5957275350835916e-05, "loss": 0.8796, "step": 2289 }, { "epoch": 0.32, "learning_rate": 1.5953661279505686e-05, "loss": 0.8552, "step": 2290 }, { "epoch": 0.32, "learning_rate": 1.595004600314014e-05, "loss": 0.8867, "step": 2291 }, { "epoch": 0.32, "learning_rate": 1.5946429522471013e-05, "loss": 0.8997, "step": 2292 }, { "epoch": 0.32, "learning_rate": 1.5942811838230285e-05, "loss": 0.5768, "step": 2293 }, { "epoch": 0.32, "learning_rate": 1.5939192951150196e-05, "loss": 0.884, "step": 2294 }, { "epoch": 0.32, "learning_rate": 1.5935572861963208e-05, "loss": 0.8792, "step": 2295 }, { "epoch": 0.32, "learning_rate": 1.5931951571402035e-05, "loss": 0.8728, "step": 2296 }, { "epoch": 0.32, "learning_rate": 1.5928329080199638e-05, "loss": 0.8755, "step": 2297 }, { "epoch": 0.32, "learning_rate": 1.592470538908922e-05, "loss": 0.9373, "step": 2298 }, { "epoch": 0.32, "learning_rate": 1.5921080498804226e-05, "loss": 0.8984, "step": 2299 }, { "epoch": 0.32, "learning_rate": 1.5917454410078335e-05, "loss": 0.929, "step": 2300 }, { "epoch": 0.32, "learning_rate": 1.591382712364548e-05, "loss": 0.8931, "step": 2301 }, { "epoch": 0.32, "learning_rate": 1.5910198640239835e-05, "loss": 0.8804, "step": 2302 }, { "epoch": 0.32, "learning_rate": 1.590656896059581e-05, "loss": 0.9514, "step": 2303 }, { "epoch": 0.32, "learning_rate": 1.5902938085448064e-05, "loss": 0.9031, "step": 2304 }, { "epoch": 0.32, "learning_rate": 1.589930601553149e-05, "loss": 0.886, "step": 2305 }, { "epoch": 0.32, "learning_rate": 1.5895672751581232e-05, "loss": 0.8214, "step": 2306 }, { "epoch": 0.32, "learning_rate": 1.589203829433267e-05, "loss": 0.8901, "step": 2307 }, { "epoch": 0.32, "learning_rate": 1.5888402644521428e-05, "loss": 0.9312, "step": 2308 }, { "epoch": 0.32, "learning_rate": 1.588476580288337e-05, "loss": 0.8948, "step": 2309 }, { "epoch": 0.32, "learning_rate": 1.5881127770154597e-05, "loss": 0.8457, "step": 2310 }, { "epoch": 0.32, "learning_rate": 1.5877488547071464e-05, "loss": 0.8442, "step": 2311 }, { "epoch": 0.32, "learning_rate": 1.5873848134370554e-05, "loss": 0.8406, "step": 2312 }, { "epoch": 0.32, "learning_rate": 1.587020653278869e-05, "loss": 0.8647, "step": 2313 }, { "epoch": 0.32, "learning_rate": 1.586656374306295e-05, "loss": 0.8806, "step": 2314 }, { "epoch": 0.32, "learning_rate": 1.586291976593064e-05, "loss": 0.8843, "step": 2315 }, { "epoch": 0.32, "learning_rate": 1.5859274602129303e-05, "loss": 0.8303, "step": 2316 }, { "epoch": 0.32, "learning_rate": 1.585562825239674e-05, "loss": 0.8721, "step": 2317 }, { "epoch": 0.32, "learning_rate": 1.5851980717470973e-05, "loss": 0.9336, "step": 2318 }, { "epoch": 0.32, "learning_rate": 1.584833199809028e-05, "loss": 0.6141, "step": 2319 }, { "epoch": 0.32, "learning_rate": 1.584468209499316e-05, "loss": 0.8422, "step": 2320 }, { "epoch": 0.32, "learning_rate": 1.584103100891837e-05, "loss": 0.8706, "step": 2321 }, { "epoch": 0.32, "learning_rate": 1.5837378740604896e-05, "loss": 0.78, "step": 2322 }, { "epoch": 0.32, "learning_rate": 1.5833725290791963e-05, "loss": 0.876, "step": 2323 }, { "epoch": 0.32, "learning_rate": 1.5830070660219042e-05, "loss": 0.8657, "step": 2324 }, { "epoch": 0.32, "learning_rate": 1.5826414849625837e-05, "loss": 0.8777, "step": 2325 }, { "epoch": 0.32, "learning_rate": 1.5822757859752295e-05, "loss": 0.8445, "step": 2326 }, { "epoch": 0.32, "learning_rate": 1.58190996913386e-05, "loss": 0.9294, "step": 2327 }, { "epoch": 0.32, "learning_rate": 1.5815440345125167e-05, "loss": 0.9055, "step": 2328 }, { "epoch": 0.32, "learning_rate": 1.5811779821852663e-05, "loss": 0.928, "step": 2329 }, { "epoch": 0.32, "learning_rate": 1.580811812226199e-05, "loss": 0.9182, "step": 2330 }, { "epoch": 0.32, "learning_rate": 1.5804455247094277e-05, "loss": 0.9089, "step": 2331 }, { "epoch": 0.32, "learning_rate": 1.5800791197090904e-05, "loss": 0.8362, "step": 2332 }, { "epoch": 0.32, "learning_rate": 1.5797125972993475e-05, "loss": 0.8672, "step": 2333 }, { "epoch": 0.32, "learning_rate": 1.5793459575543853e-05, "loss": 0.5988, "step": 2334 }, { "epoch": 0.32, "learning_rate": 1.578979200548412e-05, "loss": 0.9102, "step": 2335 }, { "epoch": 0.32, "learning_rate": 1.5786123263556596e-05, "loss": 0.8882, "step": 2336 }, { "epoch": 0.32, "learning_rate": 1.5782453350503848e-05, "loss": 0.9075, "step": 2337 }, { "epoch": 0.32, "learning_rate": 1.5778782267068675e-05, "loss": 0.929, "step": 2338 }, { "epoch": 0.32, "learning_rate": 1.577511001399411e-05, "loss": 0.9285, "step": 2339 }, { "epoch": 0.33, "learning_rate": 1.5771436592023434e-05, "loss": 0.873, "step": 2340 }, { "epoch": 0.33, "learning_rate": 1.5767762001900147e-05, "loss": 0.9075, "step": 2341 }, { "epoch": 0.33, "learning_rate": 1.5764086244368e-05, "loss": 0.8826, "step": 2342 }, { "epoch": 0.33, "learning_rate": 1.576040932017097e-05, "loss": 0.8411, "step": 2343 }, { "epoch": 0.33, "learning_rate": 1.5756731230053284e-05, "loss": 0.8582, "step": 2344 }, { "epoch": 0.33, "learning_rate": 1.575305197475939e-05, "loss": 0.8904, "step": 2345 }, { "epoch": 0.33, "learning_rate": 1.5749371555033978e-05, "loss": 0.8955, "step": 2346 }, { "epoch": 0.33, "learning_rate": 1.5745689971621977e-05, "loss": 0.9314, "step": 2347 }, { "epoch": 0.33, "learning_rate": 1.5742007225268543e-05, "loss": 0.9058, "step": 2348 }, { "epoch": 0.33, "learning_rate": 1.5738323316719078e-05, "loss": 0.8896, "step": 2349 }, { "epoch": 0.33, "learning_rate": 1.5734638246719214e-05, "loss": 0.9221, "step": 2350 }, { "epoch": 0.33, "learning_rate": 1.5730952016014816e-05, "loss": 0.9048, "step": 2351 }, { "epoch": 0.33, "learning_rate": 1.5727264625351986e-05, "loss": 0.8689, "step": 2352 }, { "epoch": 0.33, "learning_rate": 1.5723576075477057e-05, "loss": 0.8821, "step": 2353 }, { "epoch": 0.33, "learning_rate": 1.571988636713661e-05, "loss": 0.8569, "step": 2354 }, { "epoch": 0.33, "learning_rate": 1.571619550107744e-05, "loss": 0.8142, "step": 2355 }, { "epoch": 0.33, "learning_rate": 1.5712503478046595e-05, "loss": 0.8965, "step": 2356 }, { "epoch": 0.33, "learning_rate": 1.5708810298791345e-05, "loss": 0.8619, "step": 2357 }, { "epoch": 0.33, "learning_rate": 1.57051159640592e-05, "loss": 0.9011, "step": 2358 }, { "epoch": 0.33, "learning_rate": 1.57014204745979e-05, "loss": 0.8501, "step": 2359 }, { "epoch": 0.33, "learning_rate": 1.569772383115543e-05, "loss": 0.866, "step": 2360 }, { "epoch": 0.33, "learning_rate": 1.5694026034479984e-05, "loss": 0.9363, "step": 2361 }, { "epoch": 0.33, "learning_rate": 1.5690327085320018e-05, "loss": 0.9023, "step": 2362 }, { "epoch": 0.33, "learning_rate": 1.5686626984424203e-05, "loss": 0.9116, "step": 2363 }, { "epoch": 0.33, "learning_rate": 1.568292573254145e-05, "loss": 0.855, "step": 2364 }, { "epoch": 0.33, "learning_rate": 1.5679223330420895e-05, "loss": 0.6228, "step": 2365 }, { "epoch": 0.33, "learning_rate": 1.5675519778811922e-05, "loss": 0.8779, "step": 2366 }, { "epoch": 0.33, "learning_rate": 1.5671815078464134e-05, "loss": 0.8468, "step": 2367 }, { "epoch": 0.33, "learning_rate": 1.5668109230127367e-05, "loss": 0.8867, "step": 2368 }, { "epoch": 0.33, "learning_rate": 1.5664402234551704e-05, "loss": 0.8943, "step": 2369 }, { "epoch": 0.33, "learning_rate": 1.5660694092487444e-05, "loss": 0.9436, "step": 2370 }, { "epoch": 0.33, "learning_rate": 1.5656984804685124e-05, "loss": 0.9153, "step": 2371 }, { "epoch": 0.33, "learning_rate": 1.5653274371895515e-05, "loss": 0.9104, "step": 2372 }, { "epoch": 0.33, "learning_rate": 1.5649562794869615e-05, "loss": 0.9556, "step": 2373 }, { "epoch": 0.33, "learning_rate": 1.5645850074358656e-05, "loss": 0.5979, "step": 2374 }, { "epoch": 0.33, "learning_rate": 1.56421362111141e-05, "loss": 0.8401, "step": 2375 }, { "epoch": 0.33, "learning_rate": 1.5638421205887645e-05, "loss": 0.8608, "step": 2376 }, { "epoch": 0.33, "learning_rate": 1.5634705059431218e-05, "loss": 0.845, "step": 2377 }, { "epoch": 0.33, "learning_rate": 1.5630987772496973e-05, "loss": 0.8639, "step": 2378 }, { "epoch": 0.33, "learning_rate": 1.56272693458373e-05, "loss": 0.915, "step": 2379 }, { "epoch": 0.33, "learning_rate": 1.5623549780204814e-05, "loss": 0.9377, "step": 2380 }, { "epoch": 0.33, "learning_rate": 1.5619829076352365e-05, "loss": 0.848, "step": 2381 }, { "epoch": 0.33, "learning_rate": 1.5616107235033032e-05, "loss": 0.8142, "step": 2382 }, { "epoch": 0.33, "learning_rate": 1.561238425700013e-05, "loss": 0.8059, "step": 2383 }, { "epoch": 0.33, "learning_rate": 1.5608660143007194e-05, "loss": 0.8518, "step": 2384 }, { "epoch": 0.33, "learning_rate": 1.5604934893807994e-05, "loss": 0.928, "step": 2385 }, { "epoch": 0.33, "learning_rate": 1.560120851015653e-05, "loss": 0.8701, "step": 2386 }, { "epoch": 0.33, "learning_rate": 1.5597480992807032e-05, "loss": 0.9033, "step": 2387 }, { "epoch": 0.33, "learning_rate": 1.5593752342513956e-05, "loss": 0.8291, "step": 2388 }, { "epoch": 0.33, "learning_rate": 1.5590022560031993e-05, "loss": 0.8728, "step": 2389 }, { "epoch": 0.33, "learning_rate": 1.5586291646116053e-05, "loss": 0.8921, "step": 2390 }, { "epoch": 0.33, "learning_rate": 1.5582559601521295e-05, "loss": 0.8965, "step": 2391 }, { "epoch": 0.33, "learning_rate": 1.557882642700308e-05, "loss": 0.606, "step": 2392 }, { "epoch": 0.33, "learning_rate": 1.5575092123317017e-05, "loss": 0.8745, "step": 2393 }, { "epoch": 0.33, "learning_rate": 1.5571356691218937e-05, "loss": 0.9231, "step": 2394 }, { "epoch": 0.33, "learning_rate": 1.5567620131464902e-05, "loss": 0.854, "step": 2395 }, { "epoch": 0.33, "learning_rate": 1.5563882444811203e-05, "loss": 0.8145, "step": 2396 }, { "epoch": 0.33, "learning_rate": 1.5560143632014357e-05, "loss": 0.9231, "step": 2397 }, { "epoch": 0.33, "learning_rate": 1.5556403693831098e-05, "loss": 0.9194, "step": 2398 }, { "epoch": 0.33, "learning_rate": 1.5552662631018408e-05, "loss": 0.8459, "step": 2399 }, { "epoch": 0.33, "learning_rate": 1.5548920444333488e-05, "loss": 0.8438, "step": 2400 }, { "epoch": 0.33, "learning_rate": 1.554517713453376e-05, "loss": 0.926, "step": 2401 }, { "epoch": 0.33, "learning_rate": 1.5541432702376885e-05, "loss": 0.9207, "step": 2402 }, { "epoch": 0.33, "learning_rate": 1.553768714862074e-05, "loss": 0.6213, "step": 2403 }, { "epoch": 0.33, "learning_rate": 1.5533940474023435e-05, "loss": 0.5657, "step": 2404 }, { "epoch": 0.33, "learning_rate": 1.5530192679343304e-05, "loss": 0.8464, "step": 2405 }, { "epoch": 0.33, "learning_rate": 1.5526443765338915e-05, "loss": 0.8474, "step": 2406 }, { "epoch": 0.33, "learning_rate": 1.5522693732769057e-05, "loss": 0.897, "step": 2407 }, { "epoch": 0.33, "learning_rate": 1.551894258239274e-05, "loss": 0.5815, "step": 2408 }, { "epoch": 0.33, "learning_rate": 1.551519031496921e-05, "loss": 0.8489, "step": 2409 }, { "epoch": 0.33, "learning_rate": 1.5511436931257933e-05, "loss": 0.9604, "step": 2410 }, { "epoch": 0.33, "learning_rate": 1.5507682432018605e-05, "loss": 0.8475, "step": 2411 }, { "epoch": 0.34, "learning_rate": 1.5503926818011142e-05, "loss": 0.8555, "step": 2412 }, { "epoch": 0.34, "learning_rate": 1.5500170089995695e-05, "loss": 0.8131, "step": 2413 }, { "epoch": 0.34, "learning_rate": 1.5496412248732627e-05, "loss": 0.8535, "step": 2414 }, { "epoch": 0.34, "learning_rate": 1.5492653294982544e-05, "loss": 0.8777, "step": 2415 }, { "epoch": 0.34, "learning_rate": 1.5488893229506258e-05, "loss": 0.8661, "step": 2416 }, { "epoch": 0.34, "learning_rate": 1.5485132053064818e-05, "loss": 0.8887, "step": 2417 }, { "epoch": 0.34, "learning_rate": 1.5481369766419496e-05, "loss": 0.8818, "step": 2418 }, { "epoch": 0.34, "learning_rate": 1.547760637033179e-05, "loss": 0.8381, "step": 2419 }, { "epoch": 0.34, "learning_rate": 1.5473841865563416e-05, "loss": 0.9197, "step": 2420 }, { "epoch": 0.34, "learning_rate": 1.5470076252876327e-05, "loss": 0.5701, "step": 2421 }, { "epoch": 0.34, "learning_rate": 1.546630953303268e-05, "loss": 0.8613, "step": 2422 }, { "epoch": 0.34, "learning_rate": 1.5462541706794878e-05, "loss": 0.8496, "step": 2423 }, { "epoch": 0.34, "learning_rate": 1.545877277492553e-05, "loss": 0.8708, "step": 2424 }, { "epoch": 0.34, "learning_rate": 1.5455002738187485e-05, "loss": 0.9497, "step": 2425 }, { "epoch": 0.34, "learning_rate": 1.5451231597343803e-05, "loss": 0.8169, "step": 2426 }, { "epoch": 0.34, "learning_rate": 1.5447459353157772e-05, "loss": 0.8787, "step": 2427 }, { "epoch": 0.34, "learning_rate": 1.5443686006392904e-05, "loss": 0.8394, "step": 2428 }, { "epoch": 0.34, "learning_rate": 1.5439911557812935e-05, "loss": 0.9314, "step": 2429 }, { "epoch": 0.34, "learning_rate": 1.5436136008181818e-05, "loss": 0.8354, "step": 2430 }, { "epoch": 0.34, "learning_rate": 1.5432359358263738e-05, "loss": 0.906, "step": 2431 }, { "epoch": 0.34, "learning_rate": 1.5428581608823096e-05, "loss": 0.9519, "step": 2432 }, { "epoch": 0.34, "learning_rate": 1.5424802760624515e-05, "loss": 0.8782, "step": 2433 }, { "epoch": 0.34, "learning_rate": 1.5421022814432845e-05, "loss": 0.7942, "step": 2434 }, { "epoch": 0.34, "learning_rate": 1.5417241771013164e-05, "loss": 0.8799, "step": 2435 }, { "epoch": 0.34, "learning_rate": 1.541345963113075e-05, "loss": 0.8591, "step": 2436 }, { "epoch": 0.34, "learning_rate": 1.540967639555113e-05, "loss": 0.8691, "step": 2437 }, { "epoch": 0.34, "learning_rate": 1.5405892065040027e-05, "loss": 0.8313, "step": 2438 }, { "epoch": 0.34, "learning_rate": 1.540210664036341e-05, "loss": 0.8494, "step": 2439 }, { "epoch": 0.34, "learning_rate": 1.5398320122287454e-05, "loss": 0.9089, "step": 2440 }, { "epoch": 0.34, "learning_rate": 1.5394532511578556e-05, "loss": 0.5983, "step": 2441 }, { "epoch": 0.34, "learning_rate": 1.5390743809003342e-05, "loss": 0.8379, "step": 2442 }, { "epoch": 0.34, "learning_rate": 1.5386954015328658e-05, "loss": 0.8672, "step": 2443 }, { "epoch": 0.34, "learning_rate": 1.5383163131321553e-05, "loss": 0.9084, "step": 2444 }, { "epoch": 0.34, "learning_rate": 1.5379371157749327e-05, "loss": 0.8901, "step": 2445 }, { "epoch": 0.34, "learning_rate": 1.5375578095379476e-05, "loss": 0.8569, "step": 2446 }, { "epoch": 0.34, "learning_rate": 1.5371783944979732e-05, "loss": 0.8657, "step": 2447 }, { "epoch": 0.34, "learning_rate": 1.536798870731803e-05, "loss": 0.8979, "step": 2448 }, { "epoch": 0.34, "learning_rate": 1.536419238316254e-05, "loss": 0.8721, "step": 2449 }, { "epoch": 0.34, "learning_rate": 1.5360394973281646e-05, "loss": 0.8706, "step": 2450 }, { "epoch": 0.34, "learning_rate": 1.5356596478443955e-05, "loss": 0.9104, "step": 2451 }, { "epoch": 0.34, "learning_rate": 1.5352796899418295e-05, "loss": 0.8447, "step": 2452 }, { "epoch": 0.34, "learning_rate": 1.53489962369737e-05, "loss": 0.8877, "step": 2453 }, { "epoch": 0.34, "learning_rate": 1.5345194491879443e-05, "loss": 0.7969, "step": 2454 }, { "epoch": 0.34, "learning_rate": 1.5341391664904998e-05, "loss": 0.8545, "step": 2455 }, { "epoch": 0.34, "learning_rate": 1.533758775682007e-05, "loss": 0.8496, "step": 2456 }, { "epoch": 0.34, "learning_rate": 1.5333782768394584e-05, "loss": 0.6077, "step": 2457 }, { "epoch": 0.34, "learning_rate": 1.532997670039867e-05, "loss": 0.895, "step": 2458 }, { "epoch": 0.34, "learning_rate": 1.5326169553602693e-05, "loss": 0.8906, "step": 2459 }, { "epoch": 0.34, "learning_rate": 1.5322361328777225e-05, "loss": 0.8567, "step": 2460 }, { "epoch": 0.34, "learning_rate": 1.531855202669306e-05, "loss": 0.8962, "step": 2461 }, { "epoch": 0.34, "learning_rate": 1.5314741648121208e-05, "loss": 0.894, "step": 2462 }, { "epoch": 0.34, "learning_rate": 1.5310930193832904e-05, "loss": 0.7681, "step": 2463 }, { "epoch": 0.34, "learning_rate": 1.530711766459959e-05, "loss": 0.574, "step": 2464 }, { "epoch": 0.34, "learning_rate": 1.530330406119293e-05, "loss": 0.9297, "step": 2465 }, { "epoch": 0.34, "learning_rate": 1.5299489384384813e-05, "loss": 0.9221, "step": 2466 }, { "epoch": 0.34, "learning_rate": 1.529567363494734e-05, "loss": 0.8958, "step": 2467 }, { "epoch": 0.34, "learning_rate": 1.5291856813652813e-05, "loss": 0.8193, "step": 2468 }, { "epoch": 0.34, "learning_rate": 1.5288038921273783e-05, "loss": 0.8738, "step": 2469 }, { "epoch": 0.34, "learning_rate": 1.5284219958582992e-05, "loss": 0.8604, "step": 2470 }, { "epoch": 0.34, "learning_rate": 1.528039992635341e-05, "loss": 0.8307, "step": 2471 }, { "epoch": 0.34, "learning_rate": 1.527657882535822e-05, "loss": 0.8491, "step": 2472 }, { "epoch": 0.34, "learning_rate": 1.527275665637082e-05, "loss": 0.9287, "step": 2473 }, { "epoch": 0.34, "learning_rate": 1.5268933420164828e-05, "loss": 0.8557, "step": 2474 }, { "epoch": 0.34, "learning_rate": 1.5265109117514073e-05, "loss": 0.8555, "step": 2475 }, { "epoch": 0.34, "learning_rate": 1.5261283749192608e-05, "loss": 0.9412, "step": 2476 }, { "epoch": 0.34, "learning_rate": 1.5257457315974696e-05, "loss": 0.8691, "step": 2477 }, { "epoch": 0.34, "learning_rate": 1.5253629818634814e-05, "loss": 0.8823, "step": 2478 }, { "epoch": 0.34, "learning_rate": 1.5249801257947657e-05, "loss": 0.8518, "step": 2479 }, { "epoch": 0.34, "learning_rate": 1.5245971634688137e-05, "loss": 0.9333, "step": 2480 }, { "epoch": 0.34, "learning_rate": 1.5242140949631377e-05, "loss": 0.8625, "step": 2481 }, { "epoch": 0.34, "learning_rate": 1.5238309203552714e-05, "loss": 0.8748, "step": 2482 }, { "epoch": 0.34, "learning_rate": 1.5234476397227709e-05, "loss": 0.8545, "step": 2483 }, { "epoch": 0.35, "learning_rate": 1.523064253143213e-05, "loss": 0.8516, "step": 2484 }, { "epoch": 0.35, "learning_rate": 1.5226807606941953e-05, "loss": 0.9333, "step": 2485 }, { "epoch": 0.35, "learning_rate": 1.5222971624533384e-05, "loss": 0.8123, "step": 2486 }, { "epoch": 0.35, "learning_rate": 1.5219134584982835e-05, "loss": 0.8723, "step": 2487 }, { "epoch": 0.35, "learning_rate": 1.5215296489066926e-05, "loss": 0.8767, "step": 2488 }, { "epoch": 0.35, "learning_rate": 1.5211457337562503e-05, "loss": 0.9321, "step": 2489 }, { "epoch": 0.35, "learning_rate": 1.5207617131246615e-05, "loss": 0.9375, "step": 2490 }, { "epoch": 0.35, "learning_rate": 1.5203775870896528e-05, "loss": 0.6686, "step": 2491 }, { "epoch": 0.35, "learning_rate": 1.5199933557289732e-05, "loss": 0.9148, "step": 2492 }, { "epoch": 0.35, "learning_rate": 1.5196090191203911e-05, "loss": 0.9092, "step": 2493 }, { "epoch": 0.35, "learning_rate": 1.5192245773416971e-05, "loss": 0.8513, "step": 2494 }, { "epoch": 0.35, "learning_rate": 1.5188400304707038e-05, "loss": 0.8921, "step": 2495 }, { "epoch": 0.35, "learning_rate": 1.5184553785852439e-05, "loss": 0.8579, "step": 2496 }, { "epoch": 0.35, "learning_rate": 1.518070621763172e-05, "loss": 0.8909, "step": 2497 }, { "epoch": 0.35, "learning_rate": 1.517685760082364e-05, "loss": 0.9387, "step": 2498 }, { "epoch": 0.35, "learning_rate": 1.5173007936207164e-05, "loss": 0.9321, "step": 2499 }, { "epoch": 0.35, "learning_rate": 1.5169157224561476e-05, "loss": 0.6267, "step": 2500 }, { "epoch": 0.35, "learning_rate": 1.516530546666597e-05, "loss": 0.834, "step": 2501 }, { "epoch": 0.35, "learning_rate": 1.5161452663300252e-05, "loss": 0.864, "step": 2502 }, { "epoch": 0.35, "learning_rate": 1.5157598815244136e-05, "loss": 0.8635, "step": 2503 }, { "epoch": 0.35, "learning_rate": 1.515374392327765e-05, "loss": 0.8097, "step": 2504 }, { "epoch": 0.35, "learning_rate": 1.5149887988181035e-05, "loss": 0.9192, "step": 2505 }, { "epoch": 0.35, "learning_rate": 1.5146031010734738e-05, "loss": 0.8396, "step": 2506 }, { "epoch": 0.35, "learning_rate": 1.5142172991719426e-05, "loss": 0.8081, "step": 2507 }, { "epoch": 0.35, "learning_rate": 1.5138313931915968e-05, "loss": 0.8794, "step": 2508 }, { "epoch": 0.35, "learning_rate": 1.5134453832105449e-05, "loss": 0.9548, "step": 2509 }, { "epoch": 0.35, "learning_rate": 1.513059269306916e-05, "loss": 0.8967, "step": 2510 }, { "epoch": 0.35, "learning_rate": 1.5126730515588603e-05, "loss": 0.8899, "step": 2511 }, { "epoch": 0.35, "learning_rate": 1.5122867300445499e-05, "loss": 0.9475, "step": 2512 }, { "epoch": 0.35, "learning_rate": 1.5119003048421767e-05, "loss": 0.6841, "step": 2513 }, { "epoch": 0.35, "learning_rate": 1.5115137760299541e-05, "loss": 0.9062, "step": 2514 }, { "epoch": 0.35, "learning_rate": 1.5111271436861165e-05, "loss": 0.8999, "step": 2515 }, { "epoch": 0.35, "learning_rate": 1.5107404078889192e-05, "loss": 0.8315, "step": 2516 }, { "epoch": 0.35, "learning_rate": 1.5103535687166386e-05, "loss": 0.9097, "step": 2517 }, { "epoch": 0.35, "learning_rate": 1.5099666262475716e-05, "loss": 0.8843, "step": 2518 }, { "epoch": 0.35, "learning_rate": 1.5095795805600366e-05, "loss": 0.9348, "step": 2519 }, { "epoch": 0.35, "learning_rate": 1.5091924317323725e-05, "loss": 0.8467, "step": 2520 }, { "epoch": 0.35, "learning_rate": 1.508805179842939e-05, "loss": 0.926, "step": 2521 }, { "epoch": 0.35, "learning_rate": 1.5084178249701168e-05, "loss": 0.8108, "step": 2522 }, { "epoch": 0.35, "learning_rate": 1.5080303671923075e-05, "loss": 0.886, "step": 2523 }, { "epoch": 0.35, "learning_rate": 1.5076428065879338e-05, "loss": 0.5991, "step": 2524 }, { "epoch": 0.35, "learning_rate": 1.5072551432354385e-05, "loss": 0.6451, "step": 2525 }, { "epoch": 0.35, "learning_rate": 1.5068673772132856e-05, "loss": 0.9353, "step": 2526 }, { "epoch": 0.35, "learning_rate": 1.5064795085999599e-05, "loss": 0.8848, "step": 2527 }, { "epoch": 0.35, "learning_rate": 1.5060915374739673e-05, "loss": 0.8699, "step": 2528 }, { "epoch": 0.35, "learning_rate": 1.5057034639138337e-05, "loss": 0.8472, "step": 2529 }, { "epoch": 0.35, "learning_rate": 1.5053152879981064e-05, "loss": 0.9182, "step": 2530 }, { "epoch": 0.35, "learning_rate": 1.5049270098053526e-05, "loss": 0.8459, "step": 2531 }, { "epoch": 0.35, "learning_rate": 1.5045386294141615e-05, "loss": 0.8335, "step": 2532 }, { "epoch": 0.35, "learning_rate": 1.5041501469031419e-05, "loss": 0.8037, "step": 2533 }, { "epoch": 0.35, "learning_rate": 1.5037615623509232e-05, "loss": 0.8611, "step": 2534 }, { "epoch": 0.35, "learning_rate": 1.503372875836156e-05, "loss": 0.8846, "step": 2535 }, { "epoch": 0.35, "learning_rate": 1.5029840874375117e-05, "loss": 0.8984, "step": 2536 }, { "epoch": 0.35, "learning_rate": 1.5025951972336819e-05, "loss": 0.9309, "step": 2537 }, { "epoch": 0.35, "learning_rate": 1.502206205303379e-05, "loss": 0.6497, "step": 2538 }, { "epoch": 0.35, "learning_rate": 1.5018171117253357e-05, "loss": 0.7817, "step": 2539 }, { "epoch": 0.35, "learning_rate": 1.5014279165783054e-05, "loss": 0.8569, "step": 2540 }, { "epoch": 0.35, "learning_rate": 1.5010386199410625e-05, "loss": 0.8477, "step": 2541 }, { "epoch": 0.35, "learning_rate": 1.5006492218924011e-05, "loss": 0.8652, "step": 2542 }, { "epoch": 0.35, "learning_rate": 1.5002597225111368e-05, "loss": 0.863, "step": 2543 }, { "epoch": 0.35, "learning_rate": 1.499870121876105e-05, "loss": 0.5551, "step": 2544 }, { "epoch": 0.35, "learning_rate": 1.4994804200661612e-05, "loss": 0.8984, "step": 2545 }, { "epoch": 0.35, "learning_rate": 1.4990906171601828e-05, "loss": 0.8811, "step": 2546 }, { "epoch": 0.35, "learning_rate": 1.4987007132370668e-05, "loss": 0.8765, "step": 2547 }, { "epoch": 0.35, "learning_rate": 1.4983107083757304e-05, "loss": 0.8994, "step": 2548 }, { "epoch": 0.35, "learning_rate": 1.4979206026551114e-05, "loss": 0.8708, "step": 2549 }, { "epoch": 0.35, "learning_rate": 1.4975303961541685e-05, "loss": 0.8574, "step": 2550 }, { "epoch": 0.35, "learning_rate": 1.49714008895188e-05, "loss": 0.7961, "step": 2551 }, { "epoch": 0.35, "learning_rate": 1.4967496811272456e-05, "loss": 0.8628, "step": 2552 }, { "epoch": 0.35, "learning_rate": 1.4963591727592844e-05, "loss": 0.8386, "step": 2553 }, { "epoch": 0.35, "learning_rate": 1.495968563927036e-05, "loss": 0.8237, "step": 2554 }, { "epoch": 0.35, "learning_rate": 1.4955778547095609e-05, "loss": 0.8669, "step": 2555 }, { "epoch": 0.36, "learning_rate": 1.4951870451859397e-05, "loss": 0.905, "step": 2556 }, { "epoch": 0.36, "learning_rate": 1.4947961354352728e-05, "loss": 0.957, "step": 2557 }, { "epoch": 0.36, "learning_rate": 1.4944051255366816e-05, "loss": 0.877, "step": 2558 }, { "epoch": 0.36, "learning_rate": 1.4940140155693074e-05, "loss": 0.8923, "step": 2559 }, { "epoch": 0.36, "learning_rate": 1.4936228056123117e-05, "loss": 0.9473, "step": 2560 }, { "epoch": 0.36, "learning_rate": 1.4932314957448762e-05, "loss": 0.8792, "step": 2561 }, { "epoch": 0.36, "learning_rate": 1.492840086046203e-05, "loss": 0.9006, "step": 2562 }, { "epoch": 0.36, "learning_rate": 1.4924485765955146e-05, "loss": 0.8525, "step": 2563 }, { "epoch": 0.36, "learning_rate": 1.4920569674720536e-05, "loss": 0.9136, "step": 2564 }, { "epoch": 0.36, "learning_rate": 1.4916652587550819e-05, "loss": 0.8323, "step": 2565 }, { "epoch": 0.36, "learning_rate": 1.4912734505238829e-05, "loss": 0.8789, "step": 2566 }, { "epoch": 0.36, "learning_rate": 1.4908815428577592e-05, "loss": 0.8896, "step": 2567 }, { "epoch": 0.36, "learning_rate": 1.4904895358360343e-05, "loss": 0.8872, "step": 2568 }, { "epoch": 0.36, "learning_rate": 1.490097429538051e-05, "loss": 0.9287, "step": 2569 }, { "epoch": 0.36, "learning_rate": 1.4897052240431724e-05, "loss": 0.8894, "step": 2570 }, { "epoch": 0.36, "learning_rate": 1.4893129194307822e-05, "loss": 0.8872, "step": 2571 }, { "epoch": 0.36, "learning_rate": 1.4889205157802834e-05, "loss": 0.6173, "step": 2572 }, { "epoch": 0.36, "learning_rate": 1.4885280131710999e-05, "loss": 0.8445, "step": 2573 }, { "epoch": 0.36, "learning_rate": 1.4881354116826752e-05, "loss": 0.8313, "step": 2574 }, { "epoch": 0.36, "learning_rate": 1.4877427113944722e-05, "loss": 0.887, "step": 2575 }, { "epoch": 0.36, "learning_rate": 1.4873499123859749e-05, "loss": 0.8748, "step": 2576 }, { "epoch": 0.36, "learning_rate": 1.4869570147366864e-05, "loss": 0.928, "step": 2577 }, { "epoch": 0.36, "learning_rate": 1.4865640185261303e-05, "loss": 0.8589, "step": 2578 }, { "epoch": 0.36, "learning_rate": 1.4861709238338502e-05, "loss": 0.5645, "step": 2579 }, { "epoch": 0.36, "learning_rate": 1.485777730739409e-05, "loss": 0.8899, "step": 2580 }, { "epoch": 0.36, "learning_rate": 1.4853844393223903e-05, "loss": 0.9023, "step": 2581 }, { "epoch": 0.36, "learning_rate": 1.4849910496623968e-05, "loss": 0.8533, "step": 2582 }, { "epoch": 0.36, "learning_rate": 1.4845975618390518e-05, "loss": 0.8208, "step": 2583 }, { "epoch": 0.36, "learning_rate": 1.4842039759319983e-05, "loss": 0.8579, "step": 2584 }, { "epoch": 0.36, "learning_rate": 1.4838102920208987e-05, "loss": 0.8285, "step": 2585 }, { "epoch": 0.36, "learning_rate": 1.4834165101854359e-05, "loss": 0.8738, "step": 2586 }, { "epoch": 0.36, "learning_rate": 1.4830226305053117e-05, "loss": 0.8728, "step": 2587 }, { "epoch": 0.36, "learning_rate": 1.4826286530602491e-05, "loss": 0.8652, "step": 2588 }, { "epoch": 0.36, "learning_rate": 1.4822345779299898e-05, "loss": 0.8835, "step": 2589 }, { "epoch": 0.36, "learning_rate": 1.4818404051942952e-05, "loss": 0.823, "step": 2590 }, { "epoch": 0.36, "learning_rate": 1.481446134932947e-05, "loss": 0.8545, "step": 2591 }, { "epoch": 0.36, "learning_rate": 1.4810517672257465e-05, "loss": 0.8589, "step": 2592 }, { "epoch": 0.36, "learning_rate": 1.4806573021525146e-05, "loss": 0.8796, "step": 2593 }, { "epoch": 0.36, "learning_rate": 1.4802627397930924e-05, "loss": 0.8765, "step": 2594 }, { "epoch": 0.36, "learning_rate": 1.4798680802273395e-05, "loss": 0.8965, "step": 2595 }, { "epoch": 0.36, "learning_rate": 1.4794733235351367e-05, "loss": 0.8882, "step": 2596 }, { "epoch": 0.36, "learning_rate": 1.479078469796383e-05, "loss": 0.8975, "step": 2597 }, { "epoch": 0.36, "learning_rate": 1.478683519090998e-05, "loss": 0.8787, "step": 2598 }, { "epoch": 0.36, "learning_rate": 1.4782884714989215e-05, "loss": 0.948, "step": 2599 }, { "epoch": 0.36, "learning_rate": 1.4778933271001106e-05, "loss": 0.8896, "step": 2600 }, { "epoch": 0.36, "learning_rate": 1.4774980859745445e-05, "loss": 0.8943, "step": 2601 }, { "epoch": 0.36, "learning_rate": 1.4771027482022207e-05, "loss": 0.8706, "step": 2602 }, { "epoch": 0.36, "learning_rate": 1.4767073138631562e-05, "loss": 0.9053, "step": 2603 }, { "epoch": 0.36, "learning_rate": 1.4763117830373887e-05, "loss": 0.8914, "step": 2604 }, { "epoch": 0.36, "learning_rate": 1.4759161558049737e-05, "loss": 0.8853, "step": 2605 }, { "epoch": 0.36, "learning_rate": 1.4755204322459875e-05, "loss": 0.8882, "step": 2606 }, { "epoch": 0.36, "learning_rate": 1.4751246124405251e-05, "loss": 0.8225, "step": 2607 }, { "epoch": 0.36, "learning_rate": 1.474728696468702e-05, "loss": 0.8689, "step": 2608 }, { "epoch": 0.36, "learning_rate": 1.4743326844106524e-05, "loss": 0.8823, "step": 2609 }, { "epoch": 0.36, "learning_rate": 1.47393657634653e-05, "loss": 0.8672, "step": 2610 }, { "epoch": 0.36, "learning_rate": 1.4735403723565074e-05, "loss": 0.9138, "step": 2611 }, { "epoch": 0.36, "learning_rate": 1.4731440725207782e-05, "loss": 0.8643, "step": 2612 }, { "epoch": 0.36, "learning_rate": 1.472747676919554e-05, "loss": 0.8713, "step": 2613 }, { "epoch": 0.36, "learning_rate": 1.472351185633066e-05, "loss": 0.884, "step": 2614 }, { "epoch": 0.36, "learning_rate": 1.4719545987415655e-05, "loss": 0.8975, "step": 2615 }, { "epoch": 0.36, "learning_rate": 1.4715579163253225e-05, "loss": 0.8459, "step": 2616 }, { "epoch": 0.36, "learning_rate": 1.471161138464626e-05, "loss": 0.5673, "step": 2617 }, { "epoch": 0.36, "learning_rate": 1.4707642652397854e-05, "loss": 0.8447, "step": 2618 }, { "epoch": 0.36, "learning_rate": 1.4703672967311281e-05, "loss": 0.8467, "step": 2619 }, { "epoch": 0.36, "learning_rate": 1.4699702330190026e-05, "loss": 0.8572, "step": 2620 }, { "epoch": 0.36, "learning_rate": 1.4695730741837746e-05, "loss": 0.8392, "step": 2621 }, { "epoch": 0.36, "learning_rate": 1.46917582030583e-05, "loss": 0.832, "step": 2622 }, { "epoch": 0.36, "learning_rate": 1.4687784714655745e-05, "loss": 0.804, "step": 2623 }, { "epoch": 0.36, "learning_rate": 1.4683810277434321e-05, "loss": 0.811, "step": 2624 }, { "epoch": 0.36, "learning_rate": 1.4679834892198463e-05, "loss": 0.9539, "step": 2625 }, { "epoch": 0.36, "learning_rate": 1.46758585597528e-05, "loss": 0.8505, "step": 2626 }, { "epoch": 0.36, "learning_rate": 1.4671881280902152e-05, "loss": 0.7764, "step": 2627 }, { "epoch": 0.37, "learning_rate": 1.4667903056451526e-05, "loss": 0.8904, "step": 2628 }, { "epoch": 0.37, "learning_rate": 1.466392388720613e-05, "loss": 0.9028, "step": 2629 }, { "epoch": 0.37, "learning_rate": 1.4659943773971354e-05, "loss": 0.6566, "step": 2630 }, { "epoch": 0.37, "learning_rate": 1.4655962717552783e-05, "loss": 0.876, "step": 2631 }, { "epoch": 0.37, "learning_rate": 1.4651980718756189e-05, "loss": 0.8601, "step": 2632 }, { "epoch": 0.37, "learning_rate": 1.4647997778387543e-05, "loss": 0.8623, "step": 2633 }, { "epoch": 0.37, "learning_rate": 1.4644013897253e-05, "loss": 0.8557, "step": 2634 }, { "epoch": 0.37, "learning_rate": 1.4640029076158909e-05, "loss": 0.9146, "step": 2635 }, { "epoch": 0.37, "learning_rate": 1.4636043315911803e-05, "loss": 0.833, "step": 2636 }, { "epoch": 0.37, "learning_rate": 1.4632056617318413e-05, "loss": 0.8728, "step": 2637 }, { "epoch": 0.37, "learning_rate": 1.4628068981185652e-05, "loss": 0.8689, "step": 2638 }, { "epoch": 0.37, "learning_rate": 1.4624080408320633e-05, "loss": 0.8599, "step": 2639 }, { "epoch": 0.37, "learning_rate": 1.4620090899530652e-05, "loss": 0.626, "step": 2640 }, { "epoch": 0.37, "learning_rate": 1.461610045562319e-05, "loss": 0.8687, "step": 2641 }, { "epoch": 0.37, "learning_rate": 1.4612109077405924e-05, "loss": 0.634, "step": 2642 }, { "epoch": 0.37, "learning_rate": 1.4608116765686724e-05, "loss": 0.8867, "step": 2643 }, { "epoch": 0.37, "learning_rate": 1.4604123521273638e-05, "loss": 0.8945, "step": 2644 }, { "epoch": 0.37, "learning_rate": 1.4600129344974909e-05, "loss": 0.8225, "step": 2645 }, { "epoch": 0.37, "learning_rate": 1.459613423759897e-05, "loss": 0.8213, "step": 2646 }, { "epoch": 0.37, "learning_rate": 1.4592138199954437e-05, "loss": 0.8423, "step": 2647 }, { "epoch": 0.37, "learning_rate": 1.4588141232850118e-05, "loss": 0.9878, "step": 2648 }, { "epoch": 0.37, "learning_rate": 1.4584143337095016e-05, "loss": 0.8988, "step": 2649 }, { "epoch": 0.37, "learning_rate": 1.4580144513498305e-05, "loss": 0.9146, "step": 2650 }, { "epoch": 0.37, "learning_rate": 1.4576144762869361e-05, "loss": 0.8433, "step": 2651 }, { "epoch": 0.37, "learning_rate": 1.4572144086017743e-05, "loss": 0.8459, "step": 2652 }, { "epoch": 0.37, "learning_rate": 1.4568142483753198e-05, "loss": 0.864, "step": 2653 }, { "epoch": 0.37, "learning_rate": 1.4564139956885658e-05, "loss": 0.5742, "step": 2654 }, { "epoch": 0.37, "learning_rate": 1.4560136506225245e-05, "loss": 0.7937, "step": 2655 }, { "epoch": 0.37, "learning_rate": 1.4556132132582266e-05, "loss": 0.8928, "step": 2656 }, { "epoch": 0.37, "learning_rate": 1.4552126836767218e-05, "loss": 0.9233, "step": 2657 }, { "epoch": 0.37, "learning_rate": 1.4548120619590783e-05, "loss": 0.8552, "step": 2658 }, { "epoch": 0.37, "learning_rate": 1.4544113481863824e-05, "loss": 0.8867, "step": 2659 }, { "epoch": 0.37, "learning_rate": 1.4540105424397402e-05, "loss": 0.8772, "step": 2660 }, { "epoch": 0.37, "learning_rate": 1.453609644800275e-05, "loss": 0.876, "step": 2661 }, { "epoch": 0.37, "learning_rate": 1.4532086553491302e-05, "loss": 0.8701, "step": 2662 }, { "epoch": 0.37, "learning_rate": 1.4528075741674665e-05, "loss": 0.9114, "step": 2663 }, { "epoch": 0.37, "learning_rate": 1.452406401336464e-05, "loss": 0.8293, "step": 2664 }, { "epoch": 0.37, "learning_rate": 1.4520051369373209e-05, "loss": 0.6365, "step": 2665 }, { "epoch": 0.37, "learning_rate": 1.451603781051254e-05, "loss": 0.8691, "step": 2666 }, { "epoch": 0.37, "learning_rate": 1.4512023337594992e-05, "loss": 0.8196, "step": 2667 }, { "epoch": 0.37, "learning_rate": 1.4508007951433093e-05, "loss": 0.8411, "step": 2668 }, { "epoch": 0.37, "learning_rate": 1.4503991652839578e-05, "loss": 0.8457, "step": 2669 }, { "epoch": 0.37, "learning_rate": 1.4499974442627349e-05, "loss": 0.8892, "step": 2670 }, { "epoch": 0.37, "learning_rate": 1.44959563216095e-05, "loss": 0.8208, "step": 2671 }, { "epoch": 0.37, "learning_rate": 1.4491937290599314e-05, "loss": 0.9224, "step": 2672 }, { "epoch": 0.37, "learning_rate": 1.4487917350410246e-05, "loss": 0.8965, "step": 2673 }, { "epoch": 0.37, "learning_rate": 1.4483896501855941e-05, "loss": 0.8542, "step": 2674 }, { "epoch": 0.37, "learning_rate": 1.4479874745750233e-05, "loss": 0.8835, "step": 2675 }, { "epoch": 0.37, "learning_rate": 1.4475852082907134e-05, "loss": 0.6042, "step": 2676 }, { "epoch": 0.37, "learning_rate": 1.4471828514140836e-05, "loss": 0.8987, "step": 2677 }, { "epoch": 0.37, "learning_rate": 1.4467804040265722e-05, "loss": 0.9077, "step": 2678 }, { "epoch": 0.37, "learning_rate": 1.446377866209636e-05, "loss": 0.9155, "step": 2679 }, { "epoch": 0.37, "learning_rate": 1.445975238044749e-05, "loss": 0.8574, "step": 2680 }, { "epoch": 0.37, "learning_rate": 1.4455725196134043e-05, "loss": 0.8286, "step": 2681 }, { "epoch": 0.37, "learning_rate": 1.445169710997113e-05, "loss": 0.9031, "step": 2682 }, { "epoch": 0.37, "learning_rate": 1.4447668122774046e-05, "loss": 0.8726, "step": 2683 }, { "epoch": 0.37, "learning_rate": 1.4443638235358266e-05, "loss": 0.9004, "step": 2684 }, { "epoch": 0.37, "learning_rate": 1.4439607448539452e-05, "loss": 0.8721, "step": 2685 }, { "epoch": 0.37, "learning_rate": 1.4435575763133446e-05, "loss": 0.5778, "step": 2686 }, { "epoch": 0.37, "learning_rate": 1.4431543179956266e-05, "loss": 0.8555, "step": 2687 }, { "epoch": 0.37, "learning_rate": 1.4427509699824118e-05, "loss": 0.8599, "step": 2688 }, { "epoch": 0.37, "learning_rate": 1.4423475323553389e-05, "loss": 0.9255, "step": 2689 }, { "epoch": 0.37, "learning_rate": 1.4419440051960646e-05, "loss": 0.6082, "step": 2690 }, { "epoch": 0.37, "learning_rate": 1.441540388586264e-05, "loss": 0.832, "step": 2691 }, { "epoch": 0.37, "learning_rate": 1.4411366826076296e-05, "loss": 0.8689, "step": 2692 }, { "epoch": 0.37, "learning_rate": 1.4407328873418727e-05, "loss": 0.8516, "step": 2693 }, { "epoch": 0.37, "learning_rate": 1.4403290028707226e-05, "loss": 0.8916, "step": 2694 }, { "epoch": 0.37, "learning_rate": 1.4399250292759262e-05, "loss": 0.9097, "step": 2695 }, { "epoch": 0.37, "learning_rate": 1.439520966639249e-05, "loss": 0.9033, "step": 2696 }, { "epoch": 0.37, "learning_rate": 1.4391168150424742e-05, "loss": 0.7894, "step": 2697 }, { "epoch": 0.37, "learning_rate": 1.4387125745674027e-05, "loss": 0.8479, "step": 2698 }, { "epoch": 0.37, "learning_rate": 1.438308245295854e-05, "loss": 0.8821, "step": 2699 }, { "epoch": 0.38, "learning_rate": 1.4379038273096653e-05, "loss": 0.8857, "step": 2700 }, { "epoch": 0.38, "learning_rate": 1.437499320690692e-05, "loss": 0.855, "step": 2701 }, { "epoch": 0.38, "learning_rate": 1.4370947255208068e-05, "loss": 0.5621, "step": 2702 }, { "epoch": 0.38, "learning_rate": 1.436690041881901e-05, "loss": 0.8306, "step": 2703 }, { "epoch": 0.38, "learning_rate": 1.4362852698558834e-05, "loss": 0.9004, "step": 2704 }, { "epoch": 0.38, "learning_rate": 1.4358804095246808e-05, "loss": 0.8948, "step": 2705 }, { "epoch": 0.38, "learning_rate": 1.4354754609702384e-05, "loss": 0.8749, "step": 2706 }, { "epoch": 0.38, "learning_rate": 1.435070424274518e-05, "loss": 0.6362, "step": 2707 }, { "epoch": 0.38, "learning_rate": 1.4346652995195003e-05, "loss": 0.8584, "step": 2708 }, { "epoch": 0.38, "learning_rate": 1.4342600867871837e-05, "loss": 0.8501, "step": 2709 }, { "epoch": 0.38, "learning_rate": 1.433854786159584e-05, "loss": 0.8936, "step": 2710 }, { "epoch": 0.38, "learning_rate": 1.4334493977187353e-05, "loss": 0.8635, "step": 2711 }, { "epoch": 0.38, "learning_rate": 1.4330439215466888e-05, "loss": 0.8687, "step": 2712 }, { "epoch": 0.38, "learning_rate": 1.4326383577255141e-05, "loss": 0.8539, "step": 2713 }, { "epoch": 0.38, "learning_rate": 1.4322327063372983e-05, "loss": 0.8414, "step": 2714 }, { "epoch": 0.38, "learning_rate": 1.4318269674641461e-05, "loss": 0.9036, "step": 2715 }, { "epoch": 0.38, "learning_rate": 1.4314211411881803e-05, "loss": 0.6005, "step": 2716 }, { "epoch": 0.38, "learning_rate": 1.4310152275915408e-05, "loss": 0.8357, "step": 2717 }, { "epoch": 0.38, "learning_rate": 1.4306092267563854e-05, "loss": 0.8518, "step": 2718 }, { "epoch": 0.38, "learning_rate": 1.43020313876489e-05, "loss": 0.8828, "step": 2719 }, { "epoch": 0.38, "learning_rate": 1.4297969636992474e-05, "loss": 0.8135, "step": 2720 }, { "epoch": 0.38, "learning_rate": 1.429390701641669e-05, "loss": 0.642, "step": 2721 }, { "epoch": 0.38, "learning_rate": 1.4289843526743826e-05, "loss": 0.8125, "step": 2722 }, { "epoch": 0.38, "learning_rate": 1.4285779168796343e-05, "loss": 0.8787, "step": 2723 }, { "epoch": 0.38, "learning_rate": 1.428171394339688e-05, "loss": 0.8092, "step": 2724 }, { "epoch": 0.38, "learning_rate": 1.4277647851368245e-05, "loss": 0.8523, "step": 2725 }, { "epoch": 0.38, "learning_rate": 1.427358089353343e-05, "loss": 0.8115, "step": 2726 }, { "epoch": 0.38, "learning_rate": 1.4269513070715588e-05, "loss": 0.8806, "step": 2727 }, { "epoch": 0.38, "learning_rate": 1.4265444383738066e-05, "loss": 0.9373, "step": 2728 }, { "epoch": 0.38, "learning_rate": 1.4261374833424368e-05, "loss": 0.887, "step": 2729 }, { "epoch": 0.38, "learning_rate": 1.4257304420598183e-05, "loss": 0.8657, "step": 2730 }, { "epoch": 0.38, "learning_rate": 1.4253233146083378e-05, "loss": 0.6243, "step": 2731 }, { "epoch": 0.38, "learning_rate": 1.4249161010703985e-05, "loss": 0.8503, "step": 2732 }, { "epoch": 0.38, "learning_rate": 1.424508801528421e-05, "loss": 0.8728, "step": 2733 }, { "epoch": 0.38, "learning_rate": 1.4241014160648438e-05, "loss": 0.6327, "step": 2734 }, { "epoch": 0.38, "learning_rate": 1.4236939447621231e-05, "loss": 0.8372, "step": 2735 }, { "epoch": 0.38, "learning_rate": 1.423286387702732e-05, "loss": 0.9319, "step": 2736 }, { "epoch": 0.38, "learning_rate": 1.422878744969161e-05, "loss": 0.8472, "step": 2737 }, { "epoch": 0.38, "learning_rate": 1.4224710166439177e-05, "loss": 0.9131, "step": 2738 }, { "epoch": 0.38, "learning_rate": 1.4220632028095276e-05, "loss": 0.8945, "step": 2739 }, { "epoch": 0.38, "learning_rate": 1.4216553035485327e-05, "loss": 0.6086, "step": 2740 }, { "epoch": 0.38, "learning_rate": 1.4212473189434934e-05, "loss": 0.8423, "step": 2741 }, { "epoch": 0.38, "learning_rate": 1.4208392490769869e-05, "loss": 0.8323, "step": 2742 }, { "epoch": 0.38, "learning_rate": 1.4204310940316067e-05, "loss": 0.9011, "step": 2743 }, { "epoch": 0.38, "learning_rate": 1.4200228538899647e-05, "loss": 0.8826, "step": 2744 }, { "epoch": 0.38, "learning_rate": 1.41961452873469e-05, "loss": 0.8281, "step": 2745 }, { "epoch": 0.38, "learning_rate": 1.4192061186484282e-05, "loss": 0.5832, "step": 2746 }, { "epoch": 0.38, "learning_rate": 1.418797623713843e-05, "loss": 0.8975, "step": 2747 }, { "epoch": 0.38, "learning_rate": 1.4183890440136142e-05, "loss": 0.8267, "step": 2748 }, { "epoch": 0.38, "learning_rate": 1.4179803796304394e-05, "loss": 0.8262, "step": 2749 }, { "epoch": 0.38, "learning_rate": 1.4175716306470335e-05, "loss": 0.8479, "step": 2750 }, { "epoch": 0.38, "learning_rate": 1.4171627971461281e-05, "loss": 0.8569, "step": 2751 }, { "epoch": 0.38, "learning_rate": 1.4167538792104722e-05, "loss": 0.6013, "step": 2752 }, { "epoch": 0.38, "learning_rate": 1.4163448769228316e-05, "loss": 0.8215, "step": 2753 }, { "epoch": 0.38, "learning_rate": 1.4159357903659894e-05, "loss": 0.6233, "step": 2754 }, { "epoch": 0.38, "learning_rate": 1.415526619622746e-05, "loss": 0.8362, "step": 2755 }, { "epoch": 0.38, "learning_rate": 1.415117364775918e-05, "loss": 0.8684, "step": 2756 }, { "epoch": 0.38, "learning_rate": 1.4147080259083402e-05, "loss": 0.8662, "step": 2757 }, { "epoch": 0.38, "learning_rate": 1.414298603102863e-05, "loss": 0.828, "step": 2758 }, { "epoch": 0.38, "learning_rate": 1.4138890964423549e-05, "loss": 0.8574, "step": 2759 }, { "epoch": 0.38, "learning_rate": 1.4134795060097013e-05, "loss": 0.8159, "step": 2760 }, { "epoch": 0.38, "learning_rate": 1.413069831887804e-05, "loss": 0.8735, "step": 2761 }, { "epoch": 0.38, "learning_rate": 1.4126600741595824e-05, "loss": 0.9155, "step": 2762 }, { "epoch": 0.38, "learning_rate": 1.412250232907972e-05, "loss": 0.8816, "step": 2763 }, { "epoch": 0.38, "learning_rate": 1.4118403082159255e-05, "loss": 0.8158, "step": 2764 }, { "epoch": 0.38, "learning_rate": 1.4114303001664133e-05, "loss": 0.8911, "step": 2765 }, { "epoch": 0.38, "learning_rate": 1.4110202088424214e-05, "loss": 0.8296, "step": 2766 }, { "epoch": 0.38, "learning_rate": 1.410610034326954e-05, "loss": 0.8696, "step": 2767 }, { "epoch": 0.38, "learning_rate": 1.4101997767030304e-05, "loss": 0.8721, "step": 2768 }, { "epoch": 0.38, "learning_rate": 1.4097894360536885e-05, "loss": 0.8538, "step": 2769 }, { "epoch": 0.38, "learning_rate": 1.4093790124619819e-05, "loss": 0.8619, "step": 2770 }, { "epoch": 0.38, "learning_rate": 1.4089685060109814e-05, "loss": 0.8616, "step": 2771 }, { "epoch": 0.39, "learning_rate": 1.408557916783775e-05, "loss": 0.8618, "step": 2772 }, { "epoch": 0.39, "learning_rate": 1.4081472448634659e-05, "loss": 0.8073, "step": 2773 }, { "epoch": 0.39, "learning_rate": 1.4077364903331758e-05, "loss": 0.947, "step": 2774 }, { "epoch": 0.39, "learning_rate": 1.407325653276042e-05, "loss": 0.9121, "step": 2775 }, { "epoch": 0.39, "learning_rate": 1.4069147337752193e-05, "loss": 0.8948, "step": 2776 }, { "epoch": 0.39, "learning_rate": 1.4065037319138788e-05, "loss": 0.8887, "step": 2777 }, { "epoch": 0.39, "learning_rate": 1.4060926477752079e-05, "loss": 0.8282, "step": 2778 }, { "epoch": 0.39, "learning_rate": 1.4056814814424114e-05, "loss": 0.8013, "step": 2779 }, { "epoch": 0.39, "learning_rate": 1.4052702329987098e-05, "loss": 0.8408, "step": 2780 }, { "epoch": 0.39, "learning_rate": 1.4048589025273413e-05, "loss": 0.8259, "step": 2781 }, { "epoch": 0.39, "learning_rate": 1.40444749011156e-05, "loss": 0.8367, "step": 2782 }, { "epoch": 0.39, "learning_rate": 1.404035995834637e-05, "loss": 0.8762, "step": 2783 }, { "epoch": 0.39, "learning_rate": 1.4036244197798592e-05, "loss": 0.8757, "step": 2784 }, { "epoch": 0.39, "learning_rate": 1.4032127620305308e-05, "loss": 0.877, "step": 2785 }, { "epoch": 0.39, "learning_rate": 1.4028010226699724e-05, "loss": 0.8948, "step": 2786 }, { "epoch": 0.39, "learning_rate": 1.4023892017815215e-05, "loss": 0.6144, "step": 2787 }, { "epoch": 0.39, "learning_rate": 1.4019772994485308e-05, "loss": 0.926, "step": 2788 }, { "epoch": 0.39, "learning_rate": 1.4015653157543705e-05, "loss": 0.8687, "step": 2789 }, { "epoch": 0.39, "learning_rate": 1.4011532507824276e-05, "loss": 0.8669, "step": 2790 }, { "epoch": 0.39, "learning_rate": 1.4007411046161043e-05, "loss": 0.8218, "step": 2791 }, { "epoch": 0.39, "learning_rate": 1.4003288773388205e-05, "loss": 0.8906, "step": 2792 }, { "epoch": 0.39, "learning_rate": 1.3999165690340125e-05, "loss": 0.917, "step": 2793 }, { "epoch": 0.39, "learning_rate": 1.3995041797851312e-05, "loss": 0.8413, "step": 2794 }, { "epoch": 0.39, "learning_rate": 1.3990917096756458e-05, "loss": 0.8977, "step": 2795 }, { "epoch": 0.39, "learning_rate": 1.3986791587890415e-05, "loss": 0.5299, "step": 2796 }, { "epoch": 0.39, "learning_rate": 1.3982665272088192e-05, "loss": 0.8496, "step": 2797 }, { "epoch": 0.39, "learning_rate": 1.3978538150184968e-05, "loss": 0.9221, "step": 2798 }, { "epoch": 0.39, "learning_rate": 1.397441022301608e-05, "loss": 0.8904, "step": 2799 }, { "epoch": 0.39, "learning_rate": 1.3970281491417032e-05, "loss": 0.8418, "step": 2800 }, { "epoch": 0.39, "learning_rate": 1.396615195622349e-05, "loss": 0.9114, "step": 2801 }, { "epoch": 0.39, "learning_rate": 1.396202161827128e-05, "loss": 0.9094, "step": 2802 }, { "epoch": 0.39, "learning_rate": 1.3957890478396392e-05, "loss": 0.8823, "step": 2803 }, { "epoch": 0.39, "learning_rate": 1.395375853743498e-05, "loss": 0.8464, "step": 2804 }, { "epoch": 0.39, "learning_rate": 1.3949625796223357e-05, "loss": 0.7776, "step": 2805 }, { "epoch": 0.39, "learning_rate": 1.3945492255598001e-05, "loss": 0.8708, "step": 2806 }, { "epoch": 0.39, "learning_rate": 1.3941357916395553e-05, "loss": 0.8652, "step": 2807 }, { "epoch": 0.39, "learning_rate": 1.3937222779452808e-05, "loss": 0.8684, "step": 2808 }, { "epoch": 0.39, "learning_rate": 1.393308684560673e-05, "loss": 0.9146, "step": 2809 }, { "epoch": 0.39, "learning_rate": 1.3928950115694445e-05, "loss": 0.8407, "step": 2810 }, { "epoch": 0.39, "learning_rate": 1.3924812590553231e-05, "loss": 0.5842, "step": 2811 }, { "epoch": 0.39, "learning_rate": 1.3920674271020537e-05, "loss": 0.7957, "step": 2812 }, { "epoch": 0.39, "learning_rate": 1.391653515793397e-05, "loss": 0.8926, "step": 2813 }, { "epoch": 0.39, "learning_rate": 1.3912395252131294e-05, "loss": 0.8501, "step": 2814 }, { "epoch": 0.39, "learning_rate": 1.3908254554450435e-05, "loss": 0.8701, "step": 2815 }, { "epoch": 0.39, "learning_rate": 1.390411306572948e-05, "loss": 0.7871, "step": 2816 }, { "epoch": 0.39, "learning_rate": 1.389997078680668e-05, "loss": 0.6277, "step": 2817 }, { "epoch": 0.39, "learning_rate": 1.389582771852044e-05, "loss": 0.8374, "step": 2818 }, { "epoch": 0.39, "learning_rate": 1.389168386170933e-05, "loss": 0.8196, "step": 2819 }, { "epoch": 0.39, "learning_rate": 1.3887539217212067e-05, "loss": 0.9436, "step": 2820 }, { "epoch": 0.39, "learning_rate": 1.3883393785867547e-05, "loss": 0.864, "step": 2821 }, { "epoch": 0.39, "learning_rate": 1.3879247568514809e-05, "loss": 0.8257, "step": 2822 }, { "epoch": 0.39, "learning_rate": 1.3875100565993065e-05, "loss": 0.8921, "step": 2823 }, { "epoch": 0.39, "learning_rate": 1.387095277914167e-05, "loss": 0.8921, "step": 2824 }, { "epoch": 0.39, "learning_rate": 1.3866804208800147e-05, "loss": 0.9485, "step": 2825 }, { "epoch": 0.39, "learning_rate": 1.3862654855808183e-05, "loss": 0.833, "step": 2826 }, { "epoch": 0.39, "learning_rate": 1.3858504721005607e-05, "loss": 0.916, "step": 2827 }, { "epoch": 0.39, "learning_rate": 1.385435380523243e-05, "loss": 0.8828, "step": 2828 }, { "epoch": 0.39, "learning_rate": 1.3850202109328794e-05, "loss": 0.8447, "step": 2829 }, { "epoch": 0.39, "learning_rate": 1.3846049634135019e-05, "loss": 0.8878, "step": 2830 }, { "epoch": 0.39, "learning_rate": 1.3841896380491573e-05, "loss": 0.5746, "step": 2831 }, { "epoch": 0.39, "learning_rate": 1.3837742349239087e-05, "loss": 0.8225, "step": 2832 }, { "epoch": 0.39, "learning_rate": 1.383358754121835e-05, "loss": 0.8308, "step": 2833 }, { "epoch": 0.39, "learning_rate": 1.3829431957270296e-05, "loss": 0.8542, "step": 2834 }, { "epoch": 0.39, "learning_rate": 1.3825275598236033e-05, "loss": 0.7791, "step": 2835 }, { "epoch": 0.39, "learning_rate": 1.3821118464956812e-05, "loss": 0.8696, "step": 2836 }, { "epoch": 0.39, "learning_rate": 1.3816960558274051e-05, "loss": 0.9038, "step": 2837 }, { "epoch": 0.39, "learning_rate": 1.381280187902932e-05, "loss": 0.8824, "step": 2838 }, { "epoch": 0.39, "learning_rate": 1.3808642428064344e-05, "loss": 0.8877, "step": 2839 }, { "epoch": 0.39, "learning_rate": 1.3804482206221008e-05, "loss": 0.8647, "step": 2840 }, { "epoch": 0.39, "learning_rate": 1.3800321214341348e-05, "loss": 0.8962, "step": 2841 }, { "epoch": 0.39, "learning_rate": 1.3796159453267562e-05, "loss": 0.9019, "step": 2842 }, { "epoch": 0.39, "learning_rate": 1.3791996923842e-05, "loss": 0.8982, "step": 2843 }, { "epoch": 0.4, "learning_rate": 1.3787833626907166e-05, "loss": 0.925, "step": 2844 }, { "epoch": 0.4, "learning_rate": 1.378366956330572e-05, "loss": 0.8943, "step": 2845 }, { "epoch": 0.4, "learning_rate": 1.377950473388048e-05, "loss": 0.9187, "step": 2846 }, { "epoch": 0.4, "learning_rate": 1.3775339139474419e-05, "loss": 0.8833, "step": 2847 }, { "epoch": 0.4, "learning_rate": 1.3771172780930663e-05, "loss": 0.8999, "step": 2848 }, { "epoch": 0.4, "learning_rate": 1.3767005659092492e-05, "loss": 0.8762, "step": 2849 }, { "epoch": 0.4, "learning_rate": 1.3762837774803342e-05, "loss": 0.8618, "step": 2850 }, { "epoch": 0.4, "learning_rate": 1.3758669128906798e-05, "loss": 0.873, "step": 2851 }, { "epoch": 0.4, "learning_rate": 1.3754499722246614e-05, "loss": 0.925, "step": 2852 }, { "epoch": 0.4, "learning_rate": 1.375032955566668e-05, "loss": 0.9404, "step": 2853 }, { "epoch": 0.4, "learning_rate": 1.374615863001105e-05, "loss": 0.8198, "step": 2854 }, { "epoch": 0.4, "learning_rate": 1.374198694612393e-05, "loss": 0.8381, "step": 2855 }, { "epoch": 0.4, "learning_rate": 1.3737814504849677e-05, "loss": 0.9028, "step": 2856 }, { "epoch": 0.4, "learning_rate": 1.3733641307032803e-05, "loss": 0.8064, "step": 2857 }, { "epoch": 0.4, "learning_rate": 1.3729467353517978e-05, "loss": 0.8457, "step": 2858 }, { "epoch": 0.4, "learning_rate": 1.3725292645150017e-05, "loss": 0.8767, "step": 2859 }, { "epoch": 0.4, "learning_rate": 1.3721117182773887e-05, "loss": 0.8665, "step": 2860 }, { "epoch": 0.4, "learning_rate": 1.3716940967234717e-05, "loss": 0.8263, "step": 2861 }, { "epoch": 0.4, "learning_rate": 1.371276399937778e-05, "loss": 0.8787, "step": 2862 }, { "epoch": 0.4, "learning_rate": 1.3708586280048506e-05, "loss": 0.8507, "step": 2863 }, { "epoch": 0.4, "learning_rate": 1.370440781009248e-05, "loss": 0.8677, "step": 2864 }, { "epoch": 0.4, "learning_rate": 1.3700228590355425e-05, "loss": 0.8564, "step": 2865 }, { "epoch": 0.4, "learning_rate": 1.3696048621683229e-05, "loss": 0.9014, "step": 2866 }, { "epoch": 0.4, "learning_rate": 1.3691867904921927e-05, "loss": 0.8784, "step": 2867 }, { "epoch": 0.4, "learning_rate": 1.368768644091771e-05, "loss": 0.8159, "step": 2868 }, { "epoch": 0.4, "learning_rate": 1.3683504230516914e-05, "loss": 0.9175, "step": 2869 }, { "epoch": 0.4, "learning_rate": 1.3679321274566027e-05, "loss": 0.8916, "step": 2870 }, { "epoch": 0.4, "learning_rate": 1.367513757391169e-05, "loss": 0.8699, "step": 2871 }, { "epoch": 0.4, "learning_rate": 1.3670953129400693e-05, "loss": 0.6316, "step": 2872 }, { "epoch": 0.4, "learning_rate": 1.366676794187998e-05, "loss": 0.7961, "step": 2873 }, { "epoch": 0.4, "learning_rate": 1.3662582012196644e-05, "loss": 0.8633, "step": 2874 }, { "epoch": 0.4, "learning_rate": 1.3658395341197923e-05, "loss": 0.8184, "step": 2875 }, { "epoch": 0.4, "learning_rate": 1.3654207929731213e-05, "loss": 0.8013, "step": 2876 }, { "epoch": 0.4, "learning_rate": 1.3650019778644053e-05, "loss": 0.8074, "step": 2877 }, { "epoch": 0.4, "learning_rate": 1.3645830888784137e-05, "loss": 0.8325, "step": 2878 }, { "epoch": 0.4, "learning_rate": 1.3641641260999308e-05, "loss": 0.8423, "step": 2879 }, { "epoch": 0.4, "learning_rate": 1.3637450896137549e-05, "loss": 0.938, "step": 2880 }, { "epoch": 0.4, "learning_rate": 1.363325979504701e-05, "loss": 0.8524, "step": 2881 }, { "epoch": 0.4, "learning_rate": 1.3629067958575973e-05, "loss": 0.9016, "step": 2882 }, { "epoch": 0.4, "learning_rate": 1.362487538757288e-05, "loss": 0.8865, "step": 2883 }, { "epoch": 0.4, "learning_rate": 1.3620682082886315e-05, "loss": 0.7971, "step": 2884 }, { "epoch": 0.4, "learning_rate": 1.361648804536501e-05, "loss": 0.8179, "step": 2885 }, { "epoch": 0.4, "learning_rate": 1.3612293275857856e-05, "loss": 0.8374, "step": 2886 }, { "epoch": 0.4, "learning_rate": 1.360809777521388e-05, "loss": 0.8342, "step": 2887 }, { "epoch": 0.4, "learning_rate": 1.3603901544282258e-05, "loss": 0.9294, "step": 2888 }, { "epoch": 0.4, "learning_rate": 1.3599704583912324e-05, "loss": 0.8274, "step": 2889 }, { "epoch": 0.4, "learning_rate": 1.3595506894953545e-05, "loss": 0.8967, "step": 2890 }, { "epoch": 0.4, "learning_rate": 1.3591308478255551e-05, "loss": 0.8911, "step": 2891 }, { "epoch": 0.4, "learning_rate": 1.358710933466811e-05, "loss": 0.8535, "step": 2892 }, { "epoch": 0.4, "learning_rate": 1.3582909465041134e-05, "loss": 0.8652, "step": 2893 }, { "epoch": 0.4, "learning_rate": 1.357870887022469e-05, "loss": 0.8086, "step": 2894 }, { "epoch": 0.4, "learning_rate": 1.357450755106899e-05, "loss": 0.8528, "step": 2895 }, { "epoch": 0.4, "learning_rate": 1.3570305508424388e-05, "loss": 0.8987, "step": 2896 }, { "epoch": 0.4, "learning_rate": 1.356610274314139e-05, "loss": 0.8987, "step": 2897 }, { "epoch": 0.4, "learning_rate": 1.3561899256070644e-05, "loss": 0.8818, "step": 2898 }, { "epoch": 0.4, "learning_rate": 1.3557695048062943e-05, "loss": 0.8384, "step": 2899 }, { "epoch": 0.4, "learning_rate": 1.3553490119969236e-05, "loss": 0.8655, "step": 2900 }, { "epoch": 0.4, "learning_rate": 1.3549284472640607e-05, "loss": 0.8496, "step": 2901 }, { "epoch": 0.4, "learning_rate": 1.3545078106928289e-05, "loss": 0.835, "step": 2902 }, { "epoch": 0.4, "learning_rate": 1.354087102368366e-05, "loss": 0.9143, "step": 2903 }, { "epoch": 0.4, "learning_rate": 1.3536663223758241e-05, "loss": 0.832, "step": 2904 }, { "epoch": 0.4, "learning_rate": 1.3532454708003708e-05, "loss": 0.9238, "step": 2905 }, { "epoch": 0.4, "learning_rate": 1.3528245477271871e-05, "loss": 0.8975, "step": 2906 }, { "epoch": 0.4, "learning_rate": 1.3524035532414685e-05, "loss": 0.9158, "step": 2907 }, { "epoch": 0.4, "learning_rate": 1.3519824874284258e-05, "loss": 0.9065, "step": 2908 }, { "epoch": 0.4, "learning_rate": 1.3515613503732834e-05, "loss": 0.8557, "step": 2909 }, { "epoch": 0.4, "learning_rate": 1.3511401421612806e-05, "loss": 0.7683, "step": 2910 }, { "epoch": 0.4, "learning_rate": 1.3507188628776711e-05, "loss": 0.8655, "step": 2911 }, { "epoch": 0.4, "learning_rate": 1.3502975126077225e-05, "loss": 0.8094, "step": 2912 }, { "epoch": 0.4, "learning_rate": 1.349876091436717e-05, "loss": 0.9324, "step": 2913 }, { "epoch": 0.4, "learning_rate": 1.3494545994499519e-05, "loss": 0.8562, "step": 2914 }, { "epoch": 0.4, "learning_rate": 1.349033036732738e-05, "loss": 0.8669, "step": 2915 }, { "epoch": 0.41, "learning_rate": 1.3486114033704001e-05, "loss": 0.8037, "step": 2916 }, { "epoch": 0.41, "learning_rate": 1.3481896994482782e-05, "loss": 0.8184, "step": 2917 }, { "epoch": 0.41, "learning_rate": 1.3477679250517259e-05, "loss": 0.8843, "step": 2918 }, { "epoch": 0.41, "learning_rate": 1.3473460802661116e-05, "loss": 0.8901, "step": 2919 }, { "epoch": 0.41, "learning_rate": 1.3469241651768182e-05, "loss": 0.8176, "step": 2920 }, { "epoch": 0.41, "learning_rate": 1.3465021798692413e-05, "loss": 0.8518, "step": 2921 }, { "epoch": 0.41, "learning_rate": 1.3460801244287922e-05, "loss": 0.8245, "step": 2922 }, { "epoch": 0.41, "learning_rate": 1.345657998940896e-05, "loss": 0.8381, "step": 2923 }, { "epoch": 0.41, "learning_rate": 1.3452358034909918e-05, "loss": 0.585, "step": 2924 }, { "epoch": 0.41, "learning_rate": 1.3448135381645333e-05, "loss": 0.8601, "step": 2925 }, { "epoch": 0.41, "learning_rate": 1.3443912030469877e-05, "loss": 0.854, "step": 2926 }, { "epoch": 0.41, "learning_rate": 1.3439687982238363e-05, "loss": 0.5997, "step": 2927 }, { "epoch": 0.41, "learning_rate": 1.3435463237805754e-05, "loss": 0.8181, "step": 2928 }, { "epoch": 0.41, "learning_rate": 1.3431237798027149e-05, "loss": 0.8677, "step": 2929 }, { "epoch": 0.41, "learning_rate": 1.3427011663757784e-05, "loss": 0.8276, "step": 2930 }, { "epoch": 0.41, "learning_rate": 1.342278483585304e-05, "loss": 0.8562, "step": 2931 }, { "epoch": 0.41, "learning_rate": 1.3418557315168437e-05, "loss": 0.8992, "step": 2932 }, { "epoch": 0.41, "learning_rate": 1.3414329102559634e-05, "loss": 0.9009, "step": 2933 }, { "epoch": 0.41, "learning_rate": 1.3410100198882432e-05, "loss": 0.8853, "step": 2934 }, { "epoch": 0.41, "learning_rate": 1.3405870604992774e-05, "loss": 0.8955, "step": 2935 }, { "epoch": 0.41, "learning_rate": 1.3401640321746734e-05, "loss": 0.9233, "step": 2936 }, { "epoch": 0.41, "learning_rate": 1.3397409350000539e-05, "loss": 0.8845, "step": 2937 }, { "epoch": 0.41, "learning_rate": 1.3393177690610539e-05, "loss": 0.8889, "step": 2938 }, { "epoch": 0.41, "learning_rate": 1.3388945344433242e-05, "loss": 0.9336, "step": 2939 }, { "epoch": 0.41, "learning_rate": 1.3384712312325278e-05, "loss": 0.9141, "step": 2940 }, { "epoch": 0.41, "learning_rate": 1.3380478595143424e-05, "loss": 0.8369, "step": 2941 }, { "epoch": 0.41, "learning_rate": 1.3376244193744597e-05, "loss": 0.8806, "step": 2942 }, { "epoch": 0.41, "learning_rate": 1.3372009108985849e-05, "loss": 0.8794, "step": 2943 }, { "epoch": 0.41, "learning_rate": 1.3367773341724366e-05, "loss": 0.6089, "step": 2944 }, { "epoch": 0.41, "learning_rate": 1.3363536892817487e-05, "loss": 0.9033, "step": 2945 }, { "epoch": 0.41, "learning_rate": 1.3359299763122673e-05, "loss": 0.8616, "step": 2946 }, { "epoch": 0.41, "learning_rate": 1.335506195349753e-05, "loss": 0.8535, "step": 2947 }, { "epoch": 0.41, "learning_rate": 1.3350823464799803e-05, "loss": 0.9099, "step": 2948 }, { "epoch": 0.41, "learning_rate": 1.3346584297887369e-05, "loss": 0.8997, "step": 2949 }, { "epoch": 0.41, "learning_rate": 1.334234445361825e-05, "loss": 0.895, "step": 2950 }, { "epoch": 0.41, "learning_rate": 1.3338103932850595e-05, "loss": 0.8914, "step": 2951 }, { "epoch": 0.41, "learning_rate": 1.33338627364427e-05, "loss": 0.8235, "step": 2952 }, { "epoch": 0.41, "learning_rate": 1.332962086525299e-05, "loss": 0.8701, "step": 2953 }, { "epoch": 0.41, "learning_rate": 1.3325378320140034e-05, "loss": 0.8491, "step": 2954 }, { "epoch": 0.41, "learning_rate": 1.3321135101962532e-05, "loss": 0.8271, "step": 2955 }, { "epoch": 0.41, "learning_rate": 1.331689121157932e-05, "loss": 0.8406, "step": 2956 }, { "epoch": 0.41, "learning_rate": 1.331264664984937e-05, "loss": 0.8926, "step": 2957 }, { "epoch": 0.41, "learning_rate": 1.3308401417631796e-05, "loss": 0.8855, "step": 2958 }, { "epoch": 0.41, "learning_rate": 1.330415551578584e-05, "loss": 0.8411, "step": 2959 }, { "epoch": 0.41, "learning_rate": 1.3299908945170886e-05, "loss": 0.8308, "step": 2960 }, { "epoch": 0.41, "learning_rate": 1.3295661706646446e-05, "loss": 0.8586, "step": 2961 }, { "epoch": 0.41, "learning_rate": 1.329141380107217e-05, "loss": 0.8401, "step": 2962 }, { "epoch": 0.41, "learning_rate": 1.328716522930785e-05, "loss": 0.866, "step": 2963 }, { "epoch": 0.41, "learning_rate": 1.3282915992213404e-05, "loss": 0.8616, "step": 2964 }, { "epoch": 0.41, "learning_rate": 1.327866609064889e-05, "loss": 0.8586, "step": 2965 }, { "epoch": 0.41, "learning_rate": 1.3274415525474494e-05, "loss": 0.8228, "step": 2966 }, { "epoch": 0.41, "learning_rate": 1.3270164297550543e-05, "loss": 0.8635, "step": 2967 }, { "epoch": 0.41, "learning_rate": 1.3265912407737496e-05, "loss": 0.6039, "step": 2968 }, { "epoch": 0.41, "learning_rate": 1.3261659856895946e-05, "loss": 0.8303, "step": 2969 }, { "epoch": 0.41, "learning_rate": 1.3257406645886616e-05, "loss": 0.9077, "step": 2970 }, { "epoch": 0.41, "learning_rate": 1.3253152775570374e-05, "loss": 0.8778, "step": 2971 }, { "epoch": 0.41, "learning_rate": 1.3248898246808208e-05, "loss": 0.8606, "step": 2972 }, { "epoch": 0.41, "learning_rate": 1.3244643060461242e-05, "loss": 0.8167, "step": 2973 }, { "epoch": 0.41, "learning_rate": 1.3240387217390742e-05, "loss": 0.823, "step": 2974 }, { "epoch": 0.41, "learning_rate": 1.3236130718458095e-05, "loss": 0.8687, "step": 2975 }, { "epoch": 0.41, "learning_rate": 1.3231873564524836e-05, "loss": 0.8887, "step": 2976 }, { "epoch": 0.41, "learning_rate": 1.3227615756452612e-05, "loss": 0.8501, "step": 2977 }, { "epoch": 0.41, "learning_rate": 1.3223357295103218e-05, "loss": 0.8723, "step": 2978 }, { "epoch": 0.41, "learning_rate": 1.3219098181338578e-05, "loss": 0.9185, "step": 2979 }, { "epoch": 0.41, "learning_rate": 1.3214838416020745e-05, "loss": 0.9255, "step": 2980 }, { "epoch": 0.41, "learning_rate": 1.3210578000011911e-05, "loss": 0.9172, "step": 2981 }, { "epoch": 0.41, "learning_rate": 1.3206316934174389e-05, "loss": 0.9116, "step": 2982 }, { "epoch": 0.41, "learning_rate": 1.3202055219370626e-05, "loss": 0.8977, "step": 2983 }, { "epoch": 0.41, "learning_rate": 1.319779285646321e-05, "loss": 0.8562, "step": 2984 }, { "epoch": 0.41, "learning_rate": 1.3193529846314852e-05, "loss": 0.8213, "step": 2985 }, { "epoch": 0.41, "learning_rate": 1.3189266189788394e-05, "loss": 0.8525, "step": 2986 }, { "epoch": 0.41, "learning_rate": 1.3185001887746812e-05, "loss": 0.8884, "step": 2987 }, { "epoch": 0.42, "learning_rate": 1.3180736941053207e-05, "loss": 0.8613, "step": 2988 }, { "epoch": 0.42, "learning_rate": 1.3176471350570817e-05, "loss": 0.8955, "step": 2989 }, { "epoch": 0.42, "learning_rate": 1.3172205117163008e-05, "loss": 0.8672, "step": 2990 }, { "epoch": 0.42, "learning_rate": 1.3167938241693281e-05, "loss": 0.9133, "step": 2991 }, { "epoch": 0.42, "learning_rate": 1.3163670725025251e-05, "loss": 0.8035, "step": 2992 }, { "epoch": 0.42, "learning_rate": 1.3159402568022678e-05, "loss": 0.9128, "step": 2993 }, { "epoch": 0.42, "learning_rate": 1.3155133771549453e-05, "loss": 0.8677, "step": 2994 }, { "epoch": 0.42, "learning_rate": 1.3150864336469584e-05, "loss": 0.6154, "step": 2995 }, { "epoch": 0.42, "learning_rate": 1.3146594263647218e-05, "loss": 0.8865, "step": 2996 }, { "epoch": 0.42, "learning_rate": 1.3142323553946626e-05, "loss": 0.8384, "step": 2997 }, { "epoch": 0.42, "learning_rate": 1.313805220823221e-05, "loss": 0.6221, "step": 2998 }, { "epoch": 0.42, "learning_rate": 1.3133780227368502e-05, "loss": 0.8694, "step": 2999 }, { "epoch": 0.42, "learning_rate": 1.312950761222016e-05, "loss": 0.8555, "step": 3000 }, { "epoch": 0.42, "learning_rate": 1.3125234363651975e-05, "loss": 0.6244, "step": 3001 }, { "epoch": 0.42, "learning_rate": 1.3120960482528857e-05, "loss": 0.8887, "step": 3002 }, { "epoch": 0.42, "learning_rate": 1.3116685969715852e-05, "loss": 0.8269, "step": 3003 }, { "epoch": 0.42, "learning_rate": 1.3112410826078134e-05, "loss": 0.8721, "step": 3004 }, { "epoch": 0.42, "learning_rate": 1.3108135052481e-05, "loss": 0.8271, "step": 3005 }, { "epoch": 0.42, "learning_rate": 1.310385864978988e-05, "loss": 0.8496, "step": 3006 }, { "epoch": 0.42, "learning_rate": 1.3099581618870322e-05, "loss": 0.824, "step": 3007 }, { "epoch": 0.42, "learning_rate": 1.3095303960588015e-05, "loss": 0.8855, "step": 3008 }, { "epoch": 0.42, "learning_rate": 1.309102567580876e-05, "loss": 0.8855, "step": 3009 }, { "epoch": 0.42, "learning_rate": 1.3086746765398494e-05, "loss": 0.8721, "step": 3010 }, { "epoch": 0.42, "learning_rate": 1.3082467230223286e-05, "loss": 0.9194, "step": 3011 }, { "epoch": 0.42, "learning_rate": 1.3078187071149313e-05, "loss": 0.5814, "step": 3012 }, { "epoch": 0.42, "learning_rate": 1.3073906289042897e-05, "loss": 0.8923, "step": 3013 }, { "epoch": 0.42, "learning_rate": 1.3069624884770476e-05, "loss": 0.821, "step": 3014 }, { "epoch": 0.42, "learning_rate": 1.3065342859198615e-05, "loss": 0.8892, "step": 3015 }, { "epoch": 0.42, "learning_rate": 1.3061060213194012e-05, "loss": 0.8108, "step": 3016 }, { "epoch": 0.42, "learning_rate": 1.3056776947623478e-05, "loss": 0.8171, "step": 3017 }, { "epoch": 0.42, "learning_rate": 1.3052493063353956e-05, "loss": 0.8149, "step": 3018 }, { "epoch": 0.42, "learning_rate": 1.3048208561252522e-05, "loss": 0.9233, "step": 3019 }, { "epoch": 0.42, "learning_rate": 1.3043923442186364e-05, "loss": 0.8738, "step": 3020 }, { "epoch": 0.42, "learning_rate": 1.3039637707022803e-05, "loss": 0.5991, "step": 3021 }, { "epoch": 0.42, "learning_rate": 1.3035351356629278e-05, "loss": 0.9084, "step": 3022 }, { "epoch": 0.42, "learning_rate": 1.303106439187336e-05, "loss": 0.8203, "step": 3023 }, { "epoch": 0.42, "learning_rate": 1.3026776813622739e-05, "loss": 0.8225, "step": 3024 }, { "epoch": 0.42, "learning_rate": 1.3022488622745233e-05, "loss": 0.8639, "step": 3025 }, { "epoch": 0.42, "learning_rate": 1.3018199820108783e-05, "loss": 0.8982, "step": 3026 }, { "epoch": 0.42, "learning_rate": 1.301391040658145e-05, "loss": 0.8779, "step": 3027 }, { "epoch": 0.42, "learning_rate": 1.3009620383031422e-05, "loss": 0.8049, "step": 3028 }, { "epoch": 0.42, "learning_rate": 1.3005329750327011e-05, "loss": 0.8867, "step": 3029 }, { "epoch": 0.42, "learning_rate": 1.300103850933665e-05, "loss": 0.8462, "step": 3030 }, { "epoch": 0.42, "learning_rate": 1.2996746660928899e-05, "loss": 0.8716, "step": 3031 }, { "epoch": 0.42, "learning_rate": 1.299245420597244e-05, "loss": 0.9131, "step": 3032 }, { "epoch": 0.42, "learning_rate": 1.2988161145336068e-05, "loss": 0.8257, "step": 3033 }, { "epoch": 0.42, "learning_rate": 1.2983867479888716e-05, "loss": 0.8066, "step": 3034 }, { "epoch": 0.42, "learning_rate": 1.2979573210499432e-05, "loss": 0.8367, "step": 3035 }, { "epoch": 0.42, "learning_rate": 1.2975278338037382e-05, "loss": 0.8269, "step": 3036 }, { "epoch": 0.42, "learning_rate": 1.2970982863371866e-05, "loss": 0.8396, "step": 3037 }, { "epoch": 0.42, "learning_rate": 1.2966686787372289e-05, "loss": 0.8142, "step": 3038 }, { "epoch": 0.42, "learning_rate": 1.2962390110908191e-05, "loss": 0.853, "step": 3039 }, { "epoch": 0.42, "learning_rate": 1.2958092834849232e-05, "loss": 0.8313, "step": 3040 }, { "epoch": 0.42, "learning_rate": 1.2953794960065188e-05, "loss": 0.811, "step": 3041 }, { "epoch": 0.42, "learning_rate": 1.2949496487425963e-05, "loss": 0.832, "step": 3042 }, { "epoch": 0.42, "learning_rate": 1.2945197417801574e-05, "loss": 0.8801, "step": 3043 }, { "epoch": 0.42, "learning_rate": 1.2940897752062163e-05, "loss": 0.8623, "step": 3044 }, { "epoch": 0.42, "learning_rate": 1.2936597491077996e-05, "loss": 0.9065, "step": 3045 }, { "epoch": 0.42, "learning_rate": 1.2932296635719452e-05, "loss": 0.8884, "step": 3046 }, { "epoch": 0.42, "learning_rate": 1.292799518685704e-05, "loss": 0.8469, "step": 3047 }, { "epoch": 0.42, "learning_rate": 1.2923693145361378e-05, "loss": 0.8828, "step": 3048 }, { "epoch": 0.42, "learning_rate": 1.291939051210321e-05, "loss": 0.8633, "step": 3049 }, { "epoch": 0.42, "learning_rate": 1.2915087287953405e-05, "loss": 0.8213, "step": 3050 }, { "epoch": 0.42, "learning_rate": 1.291078347378294e-05, "loss": 0.78, "step": 3051 }, { "epoch": 0.42, "learning_rate": 1.2906479070462923e-05, "loss": 0.8821, "step": 3052 }, { "epoch": 0.42, "learning_rate": 1.2902174078864568e-05, "loss": 0.9233, "step": 3053 }, { "epoch": 0.42, "learning_rate": 1.2897868499859221e-05, "loss": 0.8225, "step": 3054 }, { "epoch": 0.42, "learning_rate": 1.2893562334318337e-05, "loss": 0.6041, "step": 3055 }, { "epoch": 0.42, "learning_rate": 1.28892555831135e-05, "loss": 0.876, "step": 3056 }, { "epoch": 0.42, "learning_rate": 1.2884948247116405e-05, "loss": 0.9099, "step": 3057 }, { "epoch": 0.42, "learning_rate": 1.2880640327198864e-05, "loss": 0.7765, "step": 3058 }, { "epoch": 0.42, "learning_rate": 1.2876331824232813e-05, "loss": 0.5793, "step": 3059 }, { "epoch": 0.43, "learning_rate": 1.2872022739090302e-05, "loss": 0.8384, "step": 3060 }, { "epoch": 0.43, "learning_rate": 1.2867713072643502e-05, "loss": 0.8306, "step": 3061 }, { "epoch": 0.43, "learning_rate": 1.2863402825764699e-05, "loss": 0.8301, "step": 3062 }, { "epoch": 0.43, "learning_rate": 1.2859091999326299e-05, "loss": 0.8352, "step": 3063 }, { "epoch": 0.43, "learning_rate": 1.2854780594200817e-05, "loss": 0.7836, "step": 3064 }, { "epoch": 0.43, "learning_rate": 1.28504686112609e-05, "loss": 0.8076, "step": 3065 }, { "epoch": 0.43, "learning_rate": 1.2846156051379298e-05, "loss": 0.9109, "step": 3066 }, { "epoch": 0.43, "learning_rate": 1.2841842915428889e-05, "loss": 0.7915, "step": 3067 }, { "epoch": 0.43, "learning_rate": 1.2837529204282656e-05, "loss": 0.8669, "step": 3068 }, { "epoch": 0.43, "learning_rate": 1.2833214918813705e-05, "loss": 0.8708, "step": 3069 }, { "epoch": 0.43, "learning_rate": 1.2828900059895263e-05, "loss": 0.9072, "step": 3070 }, { "epoch": 0.43, "learning_rate": 1.2824584628400662e-05, "loss": 0.8284, "step": 3071 }, { "epoch": 0.43, "learning_rate": 1.2820268625203362e-05, "loss": 0.8542, "step": 3072 }, { "epoch": 0.43, "learning_rate": 1.2815952051176927e-05, "loss": 0.8894, "step": 3073 }, { "epoch": 0.43, "learning_rate": 1.2811634907195045e-05, "loss": 0.8623, "step": 3074 }, { "epoch": 0.43, "learning_rate": 1.2807317194131512e-05, "loss": 0.8672, "step": 3075 }, { "epoch": 0.43, "learning_rate": 1.2802998912860247e-05, "loss": 0.8672, "step": 3076 }, { "epoch": 0.43, "learning_rate": 1.2798680064255283e-05, "loss": 0.8552, "step": 3077 }, { "epoch": 0.43, "learning_rate": 1.279436064919076e-05, "loss": 0.8582, "step": 3078 }, { "epoch": 0.43, "learning_rate": 1.2790040668540939e-05, "loss": 0.8372, "step": 3079 }, { "epoch": 0.43, "learning_rate": 1.2785720123180197e-05, "loss": 0.611, "step": 3080 }, { "epoch": 0.43, "learning_rate": 1.2781399013983023e-05, "loss": 0.8582, "step": 3081 }, { "epoch": 0.43, "learning_rate": 1.2777077341824017e-05, "loss": 0.8523, "step": 3082 }, { "epoch": 0.43, "learning_rate": 1.2772755107577897e-05, "loss": 0.8511, "step": 3083 }, { "epoch": 0.43, "learning_rate": 1.2768432312119492e-05, "loss": 0.8481, "step": 3084 }, { "epoch": 0.43, "learning_rate": 1.2764108956323749e-05, "loss": 0.8491, "step": 3085 }, { "epoch": 0.43, "learning_rate": 1.2759785041065724e-05, "loss": 0.8499, "step": 3086 }, { "epoch": 0.43, "learning_rate": 1.275546056722059e-05, "loss": 0.8823, "step": 3087 }, { "epoch": 0.43, "learning_rate": 1.2751135535663629e-05, "loss": 0.6246, "step": 3088 }, { "epoch": 0.43, "learning_rate": 1.2746809947270236e-05, "loss": 0.8696, "step": 3089 }, { "epoch": 0.43, "learning_rate": 1.2742483802915921e-05, "loss": 0.5935, "step": 3090 }, { "epoch": 0.43, "learning_rate": 1.273815710347631e-05, "loss": 0.8293, "step": 3091 }, { "epoch": 0.43, "learning_rate": 1.2733829849827135e-05, "loss": 0.9028, "step": 3092 }, { "epoch": 0.43, "learning_rate": 1.2729502042844242e-05, "loss": 0.8577, "step": 3093 }, { "epoch": 0.43, "learning_rate": 1.272517368340359e-05, "loss": 0.9094, "step": 3094 }, { "epoch": 0.43, "learning_rate": 1.2720844772381247e-05, "loss": 0.8977, "step": 3095 }, { "epoch": 0.43, "learning_rate": 1.2716515310653396e-05, "loss": 0.8538, "step": 3096 }, { "epoch": 0.43, "learning_rate": 1.2712185299096333e-05, "loss": 0.8625, "step": 3097 }, { "epoch": 0.43, "learning_rate": 1.2707854738586462e-05, "loss": 0.8296, "step": 3098 }, { "epoch": 0.43, "learning_rate": 1.2703523630000298e-05, "loss": 0.8435, "step": 3099 }, { "epoch": 0.43, "learning_rate": 1.2699191974214467e-05, "loss": 0.6453, "step": 3100 }, { "epoch": 0.43, "learning_rate": 1.2694859772105708e-05, "loss": 0.8389, "step": 3101 }, { "epoch": 0.43, "learning_rate": 1.2690527024550868e-05, "loss": 0.8428, "step": 3102 }, { "epoch": 0.43, "learning_rate": 1.2686193732426906e-05, "loss": 0.9094, "step": 3103 }, { "epoch": 0.43, "learning_rate": 1.2681859896610891e-05, "loss": 0.843, "step": 3104 }, { "epoch": 0.43, "learning_rate": 1.2677525517979999e-05, "loss": 0.8442, "step": 3105 }, { "epoch": 0.43, "learning_rate": 1.2673190597411521e-05, "loss": 0.6266, "step": 3106 }, { "epoch": 0.43, "learning_rate": 1.2668855135782861e-05, "loss": 0.9106, "step": 3107 }, { "epoch": 0.43, "learning_rate": 1.2664519133971514e-05, "loss": 0.8586, "step": 3108 }, { "epoch": 0.43, "learning_rate": 1.2660182592855108e-05, "loss": 0.8398, "step": 3109 }, { "epoch": 0.43, "learning_rate": 1.2655845513311364e-05, "loss": 0.8418, "step": 3110 }, { "epoch": 0.43, "learning_rate": 1.2651507896218118e-05, "loss": 0.8301, "step": 3111 }, { "epoch": 0.43, "learning_rate": 1.264716974245332e-05, "loss": 0.6047, "step": 3112 }, { "epoch": 0.43, "learning_rate": 1.2642831052895012e-05, "loss": 0.812, "step": 3113 }, { "epoch": 0.43, "learning_rate": 1.2638491828421365e-05, "loss": 0.8254, "step": 3114 }, { "epoch": 0.43, "learning_rate": 1.263415206991064e-05, "loss": 0.8647, "step": 3115 }, { "epoch": 0.43, "learning_rate": 1.2629811778241225e-05, "loss": 0.5882, "step": 3116 }, { "epoch": 0.43, "learning_rate": 1.2625470954291594e-05, "loss": 0.8823, "step": 3117 }, { "epoch": 0.43, "learning_rate": 1.2621129598940347e-05, "loss": 0.3209, "step": 3118 }, { "epoch": 0.43, "learning_rate": 1.2616787713066183e-05, "loss": 0.844, "step": 3119 }, { "epoch": 0.43, "learning_rate": 1.261244529754791e-05, "loss": 0.8257, "step": 3120 }, { "epoch": 0.43, "learning_rate": 1.2608102353264446e-05, "loss": 0.8708, "step": 3121 }, { "epoch": 0.43, "learning_rate": 1.260375888109481e-05, "loss": 0.7837, "step": 3122 }, { "epoch": 0.43, "learning_rate": 1.2599414881918131e-05, "loss": 0.8843, "step": 3123 }, { "epoch": 0.43, "learning_rate": 1.2595070356613646e-05, "loss": 0.8032, "step": 3124 }, { "epoch": 0.43, "learning_rate": 1.2590725306060698e-05, "loss": 0.6315, "step": 3125 }, { "epoch": 0.43, "learning_rate": 1.2586379731138736e-05, "loss": 0.8145, "step": 3126 }, { "epoch": 0.43, "learning_rate": 1.2582033632727312e-05, "loss": 0.9102, "step": 3127 }, { "epoch": 0.43, "learning_rate": 1.257768701170609e-05, "loss": 0.8801, "step": 3128 }, { "epoch": 0.43, "learning_rate": 1.2573339868954833e-05, "loss": 0.822, "step": 3129 }, { "epoch": 0.43, "learning_rate": 1.2568992205353418e-05, "loss": 0.9404, "step": 3130 }, { "epoch": 0.43, "learning_rate": 1.2564644021781818e-05, "loss": 0.844, "step": 3131 }, { "epoch": 0.44, "learning_rate": 1.2560295319120117e-05, "loss": 0.8032, "step": 3132 }, { "epoch": 0.44, "learning_rate": 1.2555946098248504e-05, "loss": 0.8474, "step": 3133 }, { "epoch": 0.44, "learning_rate": 1.2551596360047271e-05, "loss": 0.8726, "step": 3134 }, { "epoch": 0.44, "learning_rate": 1.2547246105396818e-05, "loss": 0.5712, "step": 3135 }, { "epoch": 0.44, "learning_rate": 1.254289533517764e-05, "loss": 0.8777, "step": 3136 }, { "epoch": 0.44, "learning_rate": 1.253854405027035e-05, "loss": 0.8354, "step": 3137 }, { "epoch": 0.44, "learning_rate": 1.2534192251555657e-05, "loss": 0.8369, "step": 3138 }, { "epoch": 0.44, "learning_rate": 1.2529839939914372e-05, "loss": 0.8992, "step": 3139 }, { "epoch": 0.44, "learning_rate": 1.2525487116227422e-05, "loss": 0.8367, "step": 3140 }, { "epoch": 0.44, "learning_rate": 1.2521133781375818e-05, "loss": 0.8536, "step": 3141 }, { "epoch": 0.44, "learning_rate": 1.2516779936240693e-05, "loss": 0.9028, "step": 3142 }, { "epoch": 0.44, "learning_rate": 1.2512425581703269e-05, "loss": 0.8955, "step": 3143 }, { "epoch": 0.44, "learning_rate": 1.250807071864489e-05, "loss": 0.8276, "step": 3144 }, { "epoch": 0.44, "learning_rate": 1.2503715347946977e-05, "loss": 0.8105, "step": 3145 }, { "epoch": 0.44, "learning_rate": 1.2499359470491073e-05, "loss": 0.8313, "step": 3146 }, { "epoch": 0.44, "learning_rate": 1.249500308715882e-05, "loss": 0.8467, "step": 3147 }, { "epoch": 0.44, "learning_rate": 1.2490646198831954e-05, "loss": 0.8555, "step": 3148 }, { "epoch": 0.44, "learning_rate": 1.2486288806392333e-05, "loss": 0.9097, "step": 3149 }, { "epoch": 0.44, "learning_rate": 1.2481930910721888e-05, "loss": 0.8281, "step": 3150 }, { "epoch": 0.44, "learning_rate": 1.2477572512702677e-05, "loss": 0.8306, "step": 3151 }, { "epoch": 0.44, "learning_rate": 1.2473213613216848e-05, "loss": 0.8586, "step": 3152 }, { "epoch": 0.44, "learning_rate": 1.246885421314665e-05, "loss": 0.843, "step": 3153 }, { "epoch": 0.44, "learning_rate": 1.2464494313374443e-05, "loss": 0.8621, "step": 3154 }, { "epoch": 0.44, "learning_rate": 1.2460133914782672e-05, "loss": 0.8948, "step": 3155 }, { "epoch": 0.44, "learning_rate": 1.24557730182539e-05, "loss": 0.5921, "step": 3156 }, { "epoch": 0.44, "learning_rate": 1.2451411624670779e-05, "loss": 0.8499, "step": 3157 }, { "epoch": 0.44, "learning_rate": 1.2447049734916065e-05, "loss": 0.8525, "step": 3158 }, { "epoch": 0.44, "learning_rate": 1.2442687349872617e-05, "loss": 0.8713, "step": 3159 }, { "epoch": 0.44, "learning_rate": 1.2438324470423393e-05, "loss": 0.8376, "step": 3160 }, { "epoch": 0.44, "learning_rate": 1.2433961097451445e-05, "loss": 0.8687, "step": 3161 }, { "epoch": 0.44, "learning_rate": 1.2429597231839937e-05, "loss": 0.8193, "step": 3162 }, { "epoch": 0.44, "learning_rate": 1.2425232874472122e-05, "loss": 0.8557, "step": 3163 }, { "epoch": 0.44, "learning_rate": 1.2420868026231356e-05, "loss": 0.8721, "step": 3164 }, { "epoch": 0.44, "learning_rate": 1.2416502688001098e-05, "loss": 0.9243, "step": 3165 }, { "epoch": 0.44, "learning_rate": 1.2412136860664898e-05, "loss": 0.8943, "step": 3166 }, { "epoch": 0.44, "learning_rate": 1.2407770545106413e-05, "loss": 0.8384, "step": 3167 }, { "epoch": 0.44, "learning_rate": 1.2403403742209395e-05, "loss": 0.9001, "step": 3168 }, { "epoch": 0.44, "learning_rate": 1.23990364528577e-05, "loss": 0.876, "step": 3169 }, { "epoch": 0.44, "learning_rate": 1.2394668677935268e-05, "loss": 0.8748, "step": 3170 }, { "epoch": 0.44, "learning_rate": 1.2390300418326156e-05, "loss": 0.8257, "step": 3171 }, { "epoch": 0.44, "learning_rate": 1.2385931674914507e-05, "loss": 0.8469, "step": 3172 }, { "epoch": 0.44, "learning_rate": 1.2381562448584562e-05, "loss": 0.811, "step": 3173 }, { "epoch": 0.44, "learning_rate": 1.2377192740220672e-05, "loss": 0.8728, "step": 3174 }, { "epoch": 0.44, "learning_rate": 1.2372822550707264e-05, "loss": 0.8972, "step": 3175 }, { "epoch": 0.44, "learning_rate": 1.2368451880928884e-05, "loss": 0.776, "step": 3176 }, { "epoch": 0.44, "learning_rate": 1.2364080731770163e-05, "loss": 0.8931, "step": 3177 }, { "epoch": 0.44, "learning_rate": 1.235970910411583e-05, "loss": 0.8616, "step": 3178 }, { "epoch": 0.44, "learning_rate": 1.2355336998850722e-05, "loss": 0.6262, "step": 3179 }, { "epoch": 0.44, "learning_rate": 1.2350964416859753e-05, "loss": 0.8376, "step": 3180 }, { "epoch": 0.44, "learning_rate": 1.2346591359027945e-05, "loss": 0.8806, "step": 3181 }, { "epoch": 0.44, "learning_rate": 1.2342217826240423e-05, "loss": 0.7727, "step": 3182 }, { "epoch": 0.44, "learning_rate": 1.2337843819382394e-05, "loss": 0.8809, "step": 3183 }, { "epoch": 0.44, "learning_rate": 1.2333469339339171e-05, "loss": 0.8667, "step": 3184 }, { "epoch": 0.44, "learning_rate": 1.2329094386996154e-05, "loss": 0.8567, "step": 3185 }, { "epoch": 0.44, "learning_rate": 1.232471896323885e-05, "loss": 0.8362, "step": 3186 }, { "epoch": 0.44, "learning_rate": 1.2320343068952851e-05, "loss": 0.8354, "step": 3187 }, { "epoch": 0.44, "learning_rate": 1.2315966705023853e-05, "loss": 0.8335, "step": 3188 }, { "epoch": 0.44, "learning_rate": 1.2311589872337639e-05, "loss": 0.8713, "step": 3189 }, { "epoch": 0.44, "learning_rate": 1.230721257178009e-05, "loss": 0.8176, "step": 3190 }, { "epoch": 0.44, "learning_rate": 1.2302834804237182e-05, "loss": 0.8521, "step": 3191 }, { "epoch": 0.44, "learning_rate": 1.229845657059499e-05, "loss": 0.9036, "step": 3192 }, { "epoch": 0.44, "learning_rate": 1.2294077871739674e-05, "loss": 0.8676, "step": 3193 }, { "epoch": 0.44, "learning_rate": 1.2289698708557499e-05, "loss": 0.8875, "step": 3194 }, { "epoch": 0.44, "learning_rate": 1.228531908193481e-05, "loss": 0.8679, "step": 3195 }, { "epoch": 0.44, "learning_rate": 1.2280938992758058e-05, "loss": 0.8909, "step": 3196 }, { "epoch": 0.44, "learning_rate": 1.2276558441913786e-05, "loss": 0.9231, "step": 3197 }, { "epoch": 0.44, "learning_rate": 1.2272177430288624e-05, "loss": 0.8752, "step": 3198 }, { "epoch": 0.44, "learning_rate": 1.2267795958769305e-05, "loss": 0.8408, "step": 3199 }, { "epoch": 0.44, "learning_rate": 1.226341402824264e-05, "loss": 0.8779, "step": 3200 }, { "epoch": 0.44, "learning_rate": 1.2259031639595551e-05, "loss": 0.8357, "step": 3201 }, { "epoch": 0.44, "learning_rate": 1.2254648793715038e-05, "loss": 0.8438, "step": 3202 }, { "epoch": 0.44, "learning_rate": 1.2250265491488202e-05, "loss": 0.8643, "step": 3203 }, { "epoch": 0.45, "learning_rate": 1.2245881733802239e-05, "loss": 0.8877, "step": 3204 }, { "epoch": 0.45, "learning_rate": 1.2241497521544423e-05, "loss": 0.8616, "step": 3205 }, { "epoch": 0.45, "learning_rate": 1.2237112855602134e-05, "loss": 0.816, "step": 3206 }, { "epoch": 0.45, "learning_rate": 1.2232727736862837e-05, "loss": 0.8479, "step": 3207 }, { "epoch": 0.45, "learning_rate": 1.2228342166214091e-05, "loss": 0.6113, "step": 3208 }, { "epoch": 0.45, "learning_rate": 1.2223956144543546e-05, "loss": 0.7839, "step": 3209 }, { "epoch": 0.45, "learning_rate": 1.221956967273895e-05, "loss": 0.886, "step": 3210 }, { "epoch": 0.45, "learning_rate": 1.2215182751688124e-05, "loss": 0.8389, "step": 3211 }, { "epoch": 0.45, "learning_rate": 1.2210795382278998e-05, "loss": 0.8499, "step": 3212 }, { "epoch": 0.45, "learning_rate": 1.2206407565399583e-05, "loss": 0.8296, "step": 3213 }, { "epoch": 0.45, "learning_rate": 1.2202019301937985e-05, "loss": 0.9346, "step": 3214 }, { "epoch": 0.45, "learning_rate": 1.2197630592782403e-05, "loss": 0.9407, "step": 3215 }, { "epoch": 0.45, "learning_rate": 1.2193241438821118e-05, "loss": 0.8501, "step": 3216 }, { "epoch": 0.45, "learning_rate": 1.2188851840942505e-05, "loss": 0.6227, "step": 3217 }, { "epoch": 0.45, "learning_rate": 1.2184461800035028e-05, "loss": 0.894, "step": 3218 }, { "epoch": 0.45, "learning_rate": 1.2180071316987245e-05, "loss": 0.5959, "step": 3219 }, { "epoch": 0.45, "learning_rate": 1.2175680392687803e-05, "loss": 0.9314, "step": 3220 }, { "epoch": 0.45, "learning_rate": 1.2171289028025428e-05, "loss": 0.9294, "step": 3221 }, { "epoch": 0.45, "learning_rate": 1.2166897223888947e-05, "loss": 0.9067, "step": 3222 }, { "epoch": 0.45, "learning_rate": 1.216250498116727e-05, "loss": 0.8684, "step": 3223 }, { "epoch": 0.45, "learning_rate": 1.2158112300749401e-05, "loss": 0.8457, "step": 3224 }, { "epoch": 0.45, "learning_rate": 1.2153719183524429e-05, "loss": 0.8325, "step": 3225 }, { "epoch": 0.45, "learning_rate": 1.2149325630381526e-05, "loss": 0.8768, "step": 3226 }, { "epoch": 0.45, "learning_rate": 1.214493164220996e-05, "loss": 0.8721, "step": 3227 }, { "epoch": 0.45, "learning_rate": 1.2140537219899087e-05, "loss": 0.8591, "step": 3228 }, { "epoch": 0.45, "learning_rate": 1.2136142364338348e-05, "loss": 0.812, "step": 3229 }, { "epoch": 0.45, "learning_rate": 1.2131747076417272e-05, "loss": 0.8599, "step": 3230 }, { "epoch": 0.45, "learning_rate": 1.2127351357025474e-05, "loss": 0.8718, "step": 3231 }, { "epoch": 0.45, "learning_rate": 1.212295520705266e-05, "loss": 0.8394, "step": 3232 }, { "epoch": 0.45, "learning_rate": 1.2118558627388622e-05, "loss": 0.7729, "step": 3233 }, { "epoch": 0.45, "learning_rate": 1.2114161618923234e-05, "loss": 0.8552, "step": 3234 }, { "epoch": 0.45, "learning_rate": 1.2109764182546468e-05, "loss": 0.5902, "step": 3235 }, { "epoch": 0.45, "learning_rate": 1.2105366319148368e-05, "loss": 0.8711, "step": 3236 }, { "epoch": 0.45, "learning_rate": 1.2100968029619078e-05, "loss": 0.8643, "step": 3237 }, { "epoch": 0.45, "learning_rate": 1.209656931484882e-05, "loss": 0.8311, "step": 3238 }, { "epoch": 0.45, "learning_rate": 1.2092170175727907e-05, "loss": 0.8569, "step": 3239 }, { "epoch": 0.45, "learning_rate": 1.208777061314673e-05, "loss": 0.8931, "step": 3240 }, { "epoch": 0.45, "learning_rate": 1.2083370627995777e-05, "loss": 0.887, "step": 3241 }, { "epoch": 0.45, "learning_rate": 1.2078970221165609e-05, "loss": 0.788, "step": 3242 }, { "epoch": 0.45, "learning_rate": 1.2074569393546884e-05, "loss": 0.8103, "step": 3243 }, { "epoch": 0.45, "learning_rate": 1.2070168146030336e-05, "loss": 0.8174, "step": 3244 }, { "epoch": 0.45, "learning_rate": 1.2065766479506796e-05, "loss": 0.8899, "step": 3245 }, { "epoch": 0.45, "learning_rate": 1.2061364394867164e-05, "loss": 0.8674, "step": 3246 }, { "epoch": 0.45, "learning_rate": 1.2056961893002435e-05, "loss": 0.813, "step": 3247 }, { "epoch": 0.45, "learning_rate": 1.2052558974803684e-05, "loss": 0.8586, "step": 3248 }, { "epoch": 0.45, "learning_rate": 1.2048155641162075e-05, "loss": 0.8635, "step": 3249 }, { "epoch": 0.45, "learning_rate": 1.2043751892968856e-05, "loss": 0.835, "step": 3250 }, { "epoch": 0.45, "learning_rate": 1.2039347731115347e-05, "loss": 0.7728, "step": 3251 }, { "epoch": 0.45, "learning_rate": 1.2034943156492969e-05, "loss": 0.843, "step": 3252 }, { "epoch": 0.45, "learning_rate": 1.2030538169993216e-05, "loss": 0.8354, "step": 3253 }, { "epoch": 0.45, "learning_rate": 1.2026132772507669e-05, "loss": 0.8267, "step": 3254 }, { "epoch": 0.45, "learning_rate": 1.2021726964927989e-05, "loss": 0.8125, "step": 3255 }, { "epoch": 0.45, "learning_rate": 1.2017320748145922e-05, "loss": 0.8933, "step": 3256 }, { "epoch": 0.45, "learning_rate": 1.2012914123053296e-05, "loss": 0.8, "step": 3257 }, { "epoch": 0.45, "learning_rate": 1.2008507090542028e-05, "loss": 0.8538, "step": 3258 }, { "epoch": 0.45, "learning_rate": 1.2004099651504104e-05, "loss": 0.9219, "step": 3259 }, { "epoch": 0.45, "learning_rate": 1.1999691806831608e-05, "loss": 0.8904, "step": 3260 }, { "epoch": 0.45, "learning_rate": 1.1995283557416694e-05, "loss": 0.8845, "step": 3261 }, { "epoch": 0.45, "learning_rate": 1.1990874904151602e-05, "loss": 0.8931, "step": 3262 }, { "epoch": 0.45, "learning_rate": 1.1986465847928655e-05, "loss": 0.9055, "step": 3263 }, { "epoch": 0.45, "learning_rate": 1.1982056389640255e-05, "loss": 0.9104, "step": 3264 }, { "epoch": 0.45, "learning_rate": 1.197764653017889e-05, "loss": 0.8447, "step": 3265 }, { "epoch": 0.45, "learning_rate": 1.1973236270437125e-05, "loss": 0.8784, "step": 3266 }, { "epoch": 0.45, "learning_rate": 1.1968825611307606e-05, "loss": 0.7961, "step": 3267 }, { "epoch": 0.45, "learning_rate": 1.196441455368306e-05, "loss": 0.8618, "step": 3268 }, { "epoch": 0.45, "learning_rate": 1.1960003098456302e-05, "loss": 0.8628, "step": 3269 }, { "epoch": 0.45, "learning_rate": 1.1955591246520213e-05, "loss": 0.8909, "step": 3270 }, { "epoch": 0.45, "learning_rate": 1.1951178998767768e-05, "loss": 0.5999, "step": 3271 }, { "epoch": 0.45, "learning_rate": 1.1946766356092012e-05, "loss": 0.8596, "step": 3272 }, { "epoch": 0.45, "learning_rate": 1.1942353319386078e-05, "loss": 0.826, "step": 3273 }, { "epoch": 0.45, "learning_rate": 1.193793988954317e-05, "loss": 0.8496, "step": 3274 }, { "epoch": 0.45, "learning_rate": 1.1933526067456587e-05, "loss": 0.8843, "step": 3275 }, { "epoch": 0.46, "learning_rate": 1.1929111854019687e-05, "loss": 0.8506, "step": 3276 }, { "epoch": 0.46, "learning_rate": 1.1924697250125925e-05, "loss": 0.8579, "step": 3277 }, { "epoch": 0.46, "learning_rate": 1.192028225666882e-05, "loss": 0.8296, "step": 3278 }, { "epoch": 0.46, "learning_rate": 1.1915866874541983e-05, "loss": 0.8743, "step": 3279 }, { "epoch": 0.46, "learning_rate": 1.1911451104639096e-05, "loss": 0.8611, "step": 3280 }, { "epoch": 0.46, "learning_rate": 1.1907034947853921e-05, "loss": 0.8669, "step": 3281 }, { "epoch": 0.46, "learning_rate": 1.19026184050803e-05, "loss": 0.8955, "step": 3282 }, { "epoch": 0.46, "learning_rate": 1.189820147721215e-05, "loss": 0.8748, "step": 3283 }, { "epoch": 0.46, "learning_rate": 1.1893784165143467e-05, "loss": 0.8665, "step": 3284 }, { "epoch": 0.46, "learning_rate": 1.1889366469768329e-05, "loss": 0.8689, "step": 3285 }, { "epoch": 0.46, "learning_rate": 1.1884948391980888e-05, "loss": 0.8345, "step": 3286 }, { "epoch": 0.46, "learning_rate": 1.1880529932675371e-05, "loss": 0.8621, "step": 3287 }, { "epoch": 0.46, "learning_rate": 1.1876111092746086e-05, "loss": 0.8962, "step": 3288 }, { "epoch": 0.46, "learning_rate": 1.1871691873087414e-05, "loss": 0.8691, "step": 3289 }, { "epoch": 0.46, "learning_rate": 1.186727227459382e-05, "loss": 0.9001, "step": 3290 }, { "epoch": 0.46, "learning_rate": 1.1862852298159841e-05, "loss": 0.8508, "step": 3291 }, { "epoch": 0.46, "learning_rate": 1.185843194468009e-05, "loss": 0.8706, "step": 3292 }, { "epoch": 0.46, "learning_rate": 1.1854011215049253e-05, "loss": 0.905, "step": 3293 }, { "epoch": 0.46, "learning_rate": 1.1849590110162102e-05, "loss": 0.8228, "step": 3294 }, { "epoch": 0.46, "learning_rate": 1.1845168630913476e-05, "loss": 0.8398, "step": 3295 }, { "epoch": 0.46, "learning_rate": 1.1840746778198296e-05, "loss": 0.8672, "step": 3296 }, { "epoch": 0.46, "learning_rate": 1.183632455291155e-05, "loss": 0.8772, "step": 3297 }, { "epoch": 0.46, "learning_rate": 1.1831901955948315e-05, "loss": 0.8206, "step": 3298 }, { "epoch": 0.46, "learning_rate": 1.1827478988203729e-05, "loss": 0.7762, "step": 3299 }, { "epoch": 0.46, "learning_rate": 1.1823055650573012e-05, "loss": 0.8906, "step": 3300 }, { "epoch": 0.46, "learning_rate": 1.1818631943951462e-05, "loss": 0.9004, "step": 3301 }, { "epoch": 0.46, "learning_rate": 1.1814207869234442e-05, "loss": 0.7468, "step": 3302 }, { "epoch": 0.46, "learning_rate": 1.18097834273174e-05, "loss": 0.8899, "step": 3303 }, { "epoch": 0.46, "learning_rate": 1.180535861909585e-05, "loss": 0.8726, "step": 3304 }, { "epoch": 0.46, "learning_rate": 1.1800933445465387e-05, "loss": 0.8782, "step": 3305 }, { "epoch": 0.46, "learning_rate": 1.179650790732168e-05, "loss": 0.9067, "step": 3306 }, { "epoch": 0.46, "learning_rate": 1.179208200556046e-05, "loss": 0.8201, "step": 3307 }, { "epoch": 0.46, "learning_rate": 1.1787655741077546e-05, "loss": 0.7762, "step": 3308 }, { "epoch": 0.46, "learning_rate": 1.1783229114768821e-05, "loss": 0.8901, "step": 3309 }, { "epoch": 0.46, "learning_rate": 1.1778802127530246e-05, "loss": 0.7695, "step": 3310 }, { "epoch": 0.46, "learning_rate": 1.1774374780257858e-05, "loss": 0.8335, "step": 3311 }, { "epoch": 0.46, "learning_rate": 1.1769947073847759e-05, "loss": 0.8577, "step": 3312 }, { "epoch": 0.46, "learning_rate": 1.1765519009196125e-05, "loss": 0.8159, "step": 3313 }, { "epoch": 0.46, "learning_rate": 1.1761090587199208e-05, "loss": 0.8411, "step": 3314 }, { "epoch": 0.46, "learning_rate": 1.1756661808753335e-05, "loss": 0.9392, "step": 3315 }, { "epoch": 0.46, "learning_rate": 1.1752232674754902e-05, "loss": 0.842, "step": 3316 }, { "epoch": 0.46, "learning_rate": 1.174780318610037e-05, "loss": 0.7979, "step": 3317 }, { "epoch": 0.46, "learning_rate": 1.1743373343686281e-05, "loss": 0.7952, "step": 3318 }, { "epoch": 0.46, "learning_rate": 1.1738943148409247e-05, "loss": 0.8668, "step": 3319 }, { "epoch": 0.46, "learning_rate": 1.1734512601165951e-05, "loss": 0.8633, "step": 3320 }, { "epoch": 0.46, "learning_rate": 1.1730081702853145e-05, "loss": 0.9041, "step": 3321 }, { "epoch": 0.46, "learning_rate": 1.1725650454367652e-05, "loss": 0.5839, "step": 3322 }, { "epoch": 0.46, "learning_rate": 1.1721218856606367e-05, "loss": 0.7502, "step": 3323 }, { "epoch": 0.46, "learning_rate": 1.171678691046626e-05, "loss": 0.8389, "step": 3324 }, { "epoch": 0.46, "learning_rate": 1.1712354616844364e-05, "loss": 0.8643, "step": 3325 }, { "epoch": 0.46, "learning_rate": 1.1707921976637786e-05, "loss": 0.8733, "step": 3326 }, { "epoch": 0.46, "learning_rate": 1.1703488990743708e-05, "loss": 0.8723, "step": 3327 }, { "epoch": 0.46, "learning_rate": 1.169905566005937e-05, "loss": 0.7988, "step": 3328 }, { "epoch": 0.46, "learning_rate": 1.1694621985482092e-05, "loss": 0.9036, "step": 3329 }, { "epoch": 0.46, "learning_rate": 1.1690187967909261e-05, "loss": 0.8821, "step": 3330 }, { "epoch": 0.46, "learning_rate": 1.168575360823833e-05, "loss": 0.8445, "step": 3331 }, { "epoch": 0.46, "learning_rate": 1.168131890736683e-05, "loss": 0.8569, "step": 3332 }, { "epoch": 0.46, "learning_rate": 1.1676883866192345e-05, "loss": 0.6881, "step": 3333 }, { "epoch": 0.46, "learning_rate": 1.1672448485612549e-05, "loss": 0.9507, "step": 3334 }, { "epoch": 0.46, "learning_rate": 1.1668012766525165e-05, "loss": 0.8507, "step": 3335 }, { "epoch": 0.46, "learning_rate": 1.1663576709828002e-05, "loss": 0.5873, "step": 3336 }, { "epoch": 0.46, "learning_rate": 1.165914031641892e-05, "loss": 0.6454, "step": 3337 }, { "epoch": 0.46, "learning_rate": 1.1654703587195857e-05, "loss": 0.8153, "step": 3338 }, { "epoch": 0.46, "learning_rate": 1.165026652305682e-05, "loss": 0.8743, "step": 3339 }, { "epoch": 0.46, "learning_rate": 1.1645829124899886e-05, "loss": 0.8005, "step": 3340 }, { "epoch": 0.46, "learning_rate": 1.1641391393623187e-05, "loss": 0.8779, "step": 3341 }, { "epoch": 0.46, "learning_rate": 1.1636953330124934e-05, "loss": 0.781, "step": 3342 }, { "epoch": 0.46, "learning_rate": 1.16325149353034e-05, "loss": 0.8547, "step": 3343 }, { "epoch": 0.46, "learning_rate": 1.162807621005693e-05, "loss": 0.855, "step": 3344 }, { "epoch": 0.46, "learning_rate": 1.1623637155283929e-05, "loss": 0.8137, "step": 3345 }, { "epoch": 0.46, "learning_rate": 1.1619197771882875e-05, "loss": 0.8477, "step": 3346 }, { "epoch": 0.46, "learning_rate": 1.161475806075231e-05, "loss": 0.6361, "step": 3347 }, { "epoch": 0.47, "learning_rate": 1.1610318022790837e-05, "loss": 0.8533, "step": 3348 }, { "epoch": 0.47, "learning_rate": 1.1605877658897135e-05, "loss": 0.8733, "step": 3349 }, { "epoch": 0.47, "learning_rate": 1.1601436969969948e-05, "loss": 0.8572, "step": 3350 }, { "epoch": 0.47, "learning_rate": 1.1596995956908075e-05, "loss": 0.8909, "step": 3351 }, { "epoch": 0.47, "learning_rate": 1.159255462061039e-05, "loss": 0.8657, "step": 3352 }, { "epoch": 0.47, "learning_rate": 1.1588112961975831e-05, "loss": 0.8174, "step": 3353 }, { "epoch": 0.47, "learning_rate": 1.1583670981903402e-05, "loss": 0.8492, "step": 3354 }, { "epoch": 0.47, "learning_rate": 1.1579228681292165e-05, "loss": 0.8442, "step": 3355 }, { "epoch": 0.47, "learning_rate": 1.1574786061041256e-05, "loss": 0.8958, "step": 3356 }, { "epoch": 0.47, "learning_rate": 1.1570343122049875e-05, "loss": 0.8494, "step": 3357 }, { "epoch": 0.47, "learning_rate": 1.1565899865217275e-05, "loss": 0.8135, "step": 3358 }, { "epoch": 0.47, "learning_rate": 1.1561456291442789e-05, "loss": 0.8479, "step": 3359 }, { "epoch": 0.47, "learning_rate": 1.155701240162581e-05, "loss": 0.8799, "step": 3360 }, { "epoch": 0.47, "learning_rate": 1.1552568196665781e-05, "loss": 0.8376, "step": 3361 }, { "epoch": 0.47, "learning_rate": 1.1548123677462227e-05, "loss": 0.9011, "step": 3362 }, { "epoch": 0.47, "learning_rate": 1.1543678844914727e-05, "loss": 0.6071, "step": 3363 }, { "epoch": 0.47, "learning_rate": 1.153923369992293e-05, "loss": 0.8584, "step": 3364 }, { "epoch": 0.47, "learning_rate": 1.1534788243386539e-05, "loss": 0.9395, "step": 3365 }, { "epoch": 0.47, "learning_rate": 1.1530342476205325e-05, "loss": 0.8337, "step": 3366 }, { "epoch": 0.47, "learning_rate": 1.1525896399279124e-05, "loss": 0.8884, "step": 3367 }, { "epoch": 0.47, "learning_rate": 1.1521450013507834e-05, "loss": 0.8342, "step": 3368 }, { "epoch": 0.47, "learning_rate": 1.1517003319791414e-05, "loss": 0.8599, "step": 3369 }, { "epoch": 0.47, "learning_rate": 1.1512556319029881e-05, "loss": 0.9011, "step": 3370 }, { "epoch": 0.47, "learning_rate": 1.1508109012123324e-05, "loss": 0.844, "step": 3371 }, { "epoch": 0.47, "learning_rate": 1.1503661399971883e-05, "loss": 0.8472, "step": 3372 }, { "epoch": 0.47, "learning_rate": 1.1499213483475773e-05, "loss": 0.8312, "step": 3373 }, { "epoch": 0.47, "learning_rate": 1.1494765263535257e-05, "loss": 0.8564, "step": 3374 }, { "epoch": 0.47, "learning_rate": 1.1490316741050665e-05, "loss": 0.8838, "step": 3375 }, { "epoch": 0.47, "learning_rate": 1.148586791692239e-05, "loss": 0.791, "step": 3376 }, { "epoch": 0.47, "learning_rate": 1.1481418792050887e-05, "loss": 0.8416, "step": 3377 }, { "epoch": 0.47, "learning_rate": 1.147696936733667e-05, "loss": 0.8064, "step": 3378 }, { "epoch": 0.47, "learning_rate": 1.1472519643680309e-05, "loss": 0.865, "step": 3379 }, { "epoch": 0.47, "learning_rate": 1.146806962198244e-05, "loss": 0.5973, "step": 3380 }, { "epoch": 0.47, "learning_rate": 1.1463619303143758e-05, "loss": 0.7849, "step": 3381 }, { "epoch": 0.47, "learning_rate": 1.145916868806502e-05, "loss": 0.9001, "step": 3382 }, { "epoch": 0.47, "learning_rate": 1.1454717777647044e-05, "loss": 0.8171, "step": 3383 }, { "epoch": 0.47, "learning_rate": 1.1450266572790696e-05, "loss": 0.8243, "step": 3384 }, { "epoch": 0.47, "learning_rate": 1.1445815074396917e-05, "loss": 0.8804, "step": 3385 }, { "epoch": 0.47, "learning_rate": 1.14413632833667e-05, "loss": 0.9185, "step": 3386 }, { "epoch": 0.47, "learning_rate": 1.1436911200601097e-05, "loss": 0.8713, "step": 3387 }, { "epoch": 0.47, "learning_rate": 1.1432458827001222e-05, "loss": 0.8674, "step": 3388 }, { "epoch": 0.47, "learning_rate": 1.1428006163468246e-05, "loss": 0.8782, "step": 3389 }, { "epoch": 0.47, "learning_rate": 1.1423553210903396e-05, "loss": 0.8408, "step": 3390 }, { "epoch": 0.47, "learning_rate": 1.1419099970207963e-05, "loss": 0.821, "step": 3391 }, { "epoch": 0.47, "learning_rate": 1.141464644228329e-05, "loss": 0.8716, "step": 3392 }, { "epoch": 0.47, "learning_rate": 1.141019262803079e-05, "loss": 0.8621, "step": 3393 }, { "epoch": 0.47, "learning_rate": 1.1405738528351918e-05, "loss": 0.8291, "step": 3394 }, { "epoch": 0.47, "learning_rate": 1.1401284144148194e-05, "loss": 0.844, "step": 3395 }, { "epoch": 0.47, "learning_rate": 1.13968294763212e-05, "loss": 0.8652, "step": 3396 }, { "epoch": 0.47, "learning_rate": 1.1392374525772571e-05, "loss": 0.8269, "step": 3397 }, { "epoch": 0.47, "learning_rate": 1.1387919293404002e-05, "loss": 0.8589, "step": 3398 }, { "epoch": 0.47, "learning_rate": 1.1383463780117235e-05, "loss": 0.8445, "step": 3399 }, { "epoch": 0.47, "learning_rate": 1.1379007986814081e-05, "loss": 0.8418, "step": 3400 }, { "epoch": 0.47, "learning_rate": 1.1374551914396404e-05, "loss": 0.845, "step": 3401 }, { "epoch": 0.47, "learning_rate": 1.1370095563766123e-05, "loss": 0.5872, "step": 3402 }, { "epoch": 0.47, "learning_rate": 1.1365638935825216e-05, "loss": 0.8262, "step": 3403 }, { "epoch": 0.47, "learning_rate": 1.1361182031475712e-05, "loss": 0.7805, "step": 3404 }, { "epoch": 0.47, "learning_rate": 1.13567248516197e-05, "loss": 0.7981, "step": 3405 }, { "epoch": 0.47, "learning_rate": 1.1352267397159325e-05, "loss": 0.8708, "step": 3406 }, { "epoch": 0.47, "learning_rate": 1.1347809668996786e-05, "loss": 0.8113, "step": 3407 }, { "epoch": 0.47, "learning_rate": 1.134335166803434e-05, "loss": 0.8625, "step": 3408 }, { "epoch": 0.47, "learning_rate": 1.133889339517429e-05, "loss": 0.835, "step": 3409 }, { "epoch": 0.47, "learning_rate": 1.1334434851319008e-05, "loss": 0.918, "step": 3410 }, { "epoch": 0.47, "learning_rate": 1.1329976037370912e-05, "loss": 0.8794, "step": 3411 }, { "epoch": 0.47, "learning_rate": 1.1325516954232476e-05, "loss": 0.8679, "step": 3412 }, { "epoch": 0.47, "learning_rate": 1.1321057602806231e-05, "loss": 0.9006, "step": 3413 }, { "epoch": 0.47, "learning_rate": 1.1316597983994759e-05, "loss": 0.6045, "step": 3414 }, { "epoch": 0.47, "learning_rate": 1.1312138098700696e-05, "loss": 0.8369, "step": 3415 }, { "epoch": 0.47, "learning_rate": 1.1307677947826736e-05, "loss": 0.9939, "step": 3416 }, { "epoch": 0.47, "learning_rate": 1.1303217532275623e-05, "loss": 0.6672, "step": 3417 }, { "epoch": 0.47, "learning_rate": 1.1298756852950157e-05, "loss": 0.9175, "step": 3418 }, { "epoch": 0.47, "learning_rate": 1.1294295910753189e-05, "loss": 0.8381, "step": 3419 }, { "epoch": 0.48, "learning_rate": 1.1289834706587623e-05, "loss": 0.8489, "step": 3420 }, { "epoch": 0.48, "learning_rate": 1.128537324135642e-05, "loss": 0.8455, "step": 3421 }, { "epoch": 0.48, "learning_rate": 1.1280911515962592e-05, "loss": 0.8223, "step": 3422 }, { "epoch": 0.48, "learning_rate": 1.1276449531309202e-05, "loss": 0.8625, "step": 3423 }, { "epoch": 0.48, "learning_rate": 1.1271987288299362e-05, "loss": 0.8391, "step": 3424 }, { "epoch": 0.48, "learning_rate": 1.1267524787836246e-05, "loss": 0.8838, "step": 3425 }, { "epoch": 0.48, "learning_rate": 1.1263062030823073e-05, "loss": 0.8777, "step": 3426 }, { "epoch": 0.48, "learning_rate": 1.1258599018163117e-05, "loss": 0.5883, "step": 3427 }, { "epoch": 0.48, "learning_rate": 1.1254135750759701e-05, "loss": 0.9031, "step": 3428 }, { "epoch": 0.48, "learning_rate": 1.1249672229516201e-05, "loss": 0.8203, "step": 3429 }, { "epoch": 0.48, "learning_rate": 1.1245208455336044e-05, "loss": 0.9292, "step": 3430 }, { "epoch": 0.48, "learning_rate": 1.124074442912271e-05, "loss": 0.8711, "step": 3431 }, { "epoch": 0.48, "learning_rate": 1.1236280151779729e-05, "loss": 0.8179, "step": 3432 }, { "epoch": 0.48, "learning_rate": 1.123181562421068e-05, "loss": 0.8274, "step": 3433 }, { "epoch": 0.48, "learning_rate": 1.1227350847319194e-05, "loss": 0.8701, "step": 3434 }, { "epoch": 0.48, "learning_rate": 1.1222885822008952e-05, "loss": 0.8403, "step": 3435 }, { "epoch": 0.48, "learning_rate": 1.1218420549183688e-05, "loss": 0.865, "step": 3436 }, { "epoch": 0.48, "learning_rate": 1.1213955029747184e-05, "loss": 0.5825, "step": 3437 }, { "epoch": 0.48, "learning_rate": 1.120948926460327e-05, "loss": 0.8406, "step": 3438 }, { "epoch": 0.48, "learning_rate": 1.1205023254655829e-05, "loss": 0.8206, "step": 3439 }, { "epoch": 0.48, "learning_rate": 1.120055700080879e-05, "loss": 0.8369, "step": 3440 }, { "epoch": 0.48, "learning_rate": 1.1196090503966135e-05, "loss": 0.9143, "step": 3441 }, { "epoch": 0.48, "learning_rate": 1.1191623765031894e-05, "loss": 0.8906, "step": 3442 }, { "epoch": 0.48, "learning_rate": 1.1187156784910145e-05, "loss": 0.8811, "step": 3443 }, { "epoch": 0.48, "learning_rate": 1.1182689564505017e-05, "loss": 0.8628, "step": 3444 }, { "epoch": 0.48, "learning_rate": 1.1178222104720682e-05, "loss": 0.822, "step": 3445 }, { "epoch": 0.48, "learning_rate": 1.1173754406461371e-05, "loss": 0.8066, "step": 3446 }, { "epoch": 0.48, "learning_rate": 1.1169286470631348e-05, "loss": 0.8362, "step": 3447 }, { "epoch": 0.48, "learning_rate": 1.1164818298134943e-05, "loss": 0.8984, "step": 3448 }, { "epoch": 0.48, "learning_rate": 1.1160349889876522e-05, "loss": 0.6255, "step": 3449 }, { "epoch": 0.48, "learning_rate": 1.1155881246760499e-05, "loss": 0.8875, "step": 3450 }, { "epoch": 0.48, "learning_rate": 1.1151412369691339e-05, "loss": 0.8203, "step": 3451 }, { "epoch": 0.48, "learning_rate": 1.1146943259573554e-05, "loss": 0.9141, "step": 3452 }, { "epoch": 0.48, "learning_rate": 1.1142473917311705e-05, "loss": 0.5981, "step": 3453 }, { "epoch": 0.48, "learning_rate": 1.1138004343810394e-05, "loss": 0.9014, "step": 3454 }, { "epoch": 0.48, "learning_rate": 1.1133534539974274e-05, "loss": 0.8435, "step": 3455 }, { "epoch": 0.48, "learning_rate": 1.1129064506708045e-05, "loss": 0.8564, "step": 3456 }, { "epoch": 0.48, "learning_rate": 1.1124594244916452e-05, "loss": 0.8669, "step": 3457 }, { "epoch": 0.48, "learning_rate": 1.1120123755504287e-05, "loss": 0.8245, "step": 3458 }, { "epoch": 0.48, "learning_rate": 1.1115653039376389e-05, "loss": 0.9326, "step": 3459 }, { "epoch": 0.48, "learning_rate": 1.1111182097437638e-05, "loss": 0.8247, "step": 3460 }, { "epoch": 0.48, "learning_rate": 1.1106710930592965e-05, "loss": 0.8014, "step": 3461 }, { "epoch": 0.48, "learning_rate": 1.1102239539747348e-05, "loss": 0.7395, "step": 3462 }, { "epoch": 0.48, "learning_rate": 1.1097767925805802e-05, "loss": 0.6292, "step": 3463 }, { "epoch": 0.48, "learning_rate": 1.10932960896734e-05, "loss": 0.8538, "step": 3464 }, { "epoch": 0.48, "learning_rate": 1.1088824032255245e-05, "loss": 0.8872, "step": 3465 }, { "epoch": 0.48, "learning_rate": 1.1084351754456493e-05, "loss": 0.5619, "step": 3466 }, { "epoch": 0.48, "learning_rate": 1.1079879257182347e-05, "loss": 0.8374, "step": 3467 }, { "epoch": 0.48, "learning_rate": 1.1075406541338047e-05, "loss": 0.8799, "step": 3468 }, { "epoch": 0.48, "learning_rate": 1.107093360782889e-05, "loss": 0.8215, "step": 3469 }, { "epoch": 0.48, "learning_rate": 1.1066460457560197e-05, "loss": 0.7969, "step": 3470 }, { "epoch": 0.48, "learning_rate": 1.1061987091437352e-05, "loss": 0.7799, "step": 3471 }, { "epoch": 0.48, "learning_rate": 1.1057513510365771e-05, "loss": 0.8491, "step": 3472 }, { "epoch": 0.48, "learning_rate": 1.1053039715250922e-05, "loss": 0.8301, "step": 3473 }, { "epoch": 0.48, "learning_rate": 1.1048565706998308e-05, "loss": 0.6388, "step": 3474 }, { "epoch": 0.48, "learning_rate": 1.1044091486513482e-05, "loss": 0.8979, "step": 3475 }, { "epoch": 0.48, "learning_rate": 1.1039617054702031e-05, "loss": 0.5972, "step": 3476 }, { "epoch": 0.48, "learning_rate": 1.1035142412469599e-05, "loss": 0.8704, "step": 3477 }, { "epoch": 0.48, "learning_rate": 1.1030667560721858e-05, "loss": 0.9207, "step": 3478 }, { "epoch": 0.48, "learning_rate": 1.1026192500364535e-05, "loss": 0.8201, "step": 3479 }, { "epoch": 0.48, "learning_rate": 1.1021717232303383e-05, "loss": 0.5533, "step": 3480 }, { "epoch": 0.48, "learning_rate": 1.1017241757444214e-05, "loss": 0.8445, "step": 3481 }, { "epoch": 0.48, "learning_rate": 1.1012766076692876e-05, "loss": 0.8218, "step": 3482 }, { "epoch": 0.48, "learning_rate": 1.1008290190955255e-05, "loss": 0.8264, "step": 3483 }, { "epoch": 0.48, "learning_rate": 1.1003814101137282e-05, "loss": 0.5958, "step": 3484 }, { "epoch": 0.48, "learning_rate": 1.0999337808144927e-05, "loss": 0.5822, "step": 3485 }, { "epoch": 0.48, "learning_rate": 1.0994861312884201e-05, "loss": 0.833, "step": 3486 }, { "epoch": 0.48, "learning_rate": 1.099038461626116e-05, "loss": 0.8333, "step": 3487 }, { "epoch": 0.48, "learning_rate": 1.09859077191819e-05, "loss": 0.6637, "step": 3488 }, { "epoch": 0.48, "learning_rate": 1.0981430622552553e-05, "loss": 0.7876, "step": 3489 }, { "epoch": 0.48, "learning_rate": 1.0976953327279292e-05, "loss": 0.9373, "step": 3490 }, { "epoch": 0.48, "learning_rate": 1.0972475834268334e-05, "loss": 0.8145, "step": 3491 }, { "epoch": 0.49, "learning_rate": 1.0967998144425938e-05, "loss": 0.8088, "step": 3492 }, { "epoch": 0.49, "learning_rate": 1.0963520258658393e-05, "loss": 0.8123, "step": 3493 }, { "epoch": 0.49, "learning_rate": 1.0959042177872041e-05, "loss": 0.8386, "step": 3494 }, { "epoch": 0.49, "learning_rate": 1.095456390297325e-05, "loss": 0.8291, "step": 3495 }, { "epoch": 0.49, "learning_rate": 1.0950085434868436e-05, "loss": 0.8315, "step": 3496 }, { "epoch": 0.49, "learning_rate": 1.094560677446405e-05, "loss": 0.6077, "step": 3497 }, { "epoch": 0.49, "learning_rate": 1.0941127922666586e-05, "loss": 0.8271, "step": 3498 }, { "epoch": 0.49, "learning_rate": 1.0936648880382577e-05, "loss": 0.8257, "step": 3499 }, { "epoch": 0.49, "learning_rate": 1.0932169648518584e-05, "loss": 0.8315, "step": 3500 }, { "epoch": 0.49, "learning_rate": 1.0927690227981218e-05, "loss": 0.8145, "step": 3501 }, { "epoch": 0.49, "learning_rate": 1.0923210619677127e-05, "loss": 0.813, "step": 3502 }, { "epoch": 0.49, "learning_rate": 1.0918730824512994e-05, "loss": 0.8408, "step": 3503 }, { "epoch": 0.49, "learning_rate": 1.0914250843395535e-05, "loss": 0.9147, "step": 3504 }, { "epoch": 0.49, "learning_rate": 1.0909770677231517e-05, "loss": 0.8738, "step": 3505 }, { "epoch": 0.49, "learning_rate": 1.0905290326927731e-05, "loss": 0.8784, "step": 3506 }, { "epoch": 0.49, "learning_rate": 1.090080979339101e-05, "loss": 0.8474, "step": 3507 }, { "epoch": 0.49, "learning_rate": 1.0896329077528226e-05, "loss": 0.8154, "step": 3508 }, { "epoch": 0.49, "learning_rate": 1.089184818024629e-05, "loss": 0.8682, "step": 3509 }, { "epoch": 0.49, "learning_rate": 1.0887367102452142e-05, "loss": 0.8508, "step": 3510 }, { "epoch": 0.49, "learning_rate": 1.0882885845052765e-05, "loss": 0.8328, "step": 3511 }, { "epoch": 0.49, "learning_rate": 1.0878404408955174e-05, "loss": 0.9006, "step": 3512 }, { "epoch": 0.49, "learning_rate": 1.0873922795066425e-05, "loss": 0.6073, "step": 3513 }, { "epoch": 0.49, "learning_rate": 1.0869441004293607e-05, "loss": 0.9045, "step": 3514 }, { "epoch": 0.49, "learning_rate": 1.0864959037543846e-05, "loss": 0.8391, "step": 3515 }, { "epoch": 0.49, "learning_rate": 1.0860476895724299e-05, "loss": 0.8298, "step": 3516 }, { "epoch": 0.49, "learning_rate": 1.0855994579742164e-05, "loss": 0.6099, "step": 3517 }, { "epoch": 0.49, "learning_rate": 1.0851512090504675e-05, "loss": 0.619, "step": 3518 }, { "epoch": 0.49, "learning_rate": 1.0847029428919096e-05, "loss": 0.8176, "step": 3519 }, { "epoch": 0.49, "learning_rate": 1.0842546595892731e-05, "loss": 0.8252, "step": 3520 }, { "epoch": 0.49, "learning_rate": 1.0838063592332912e-05, "loss": 0.8564, "step": 3521 }, { "epoch": 0.49, "learning_rate": 1.0833580419147015e-05, "loss": 0.783, "step": 3522 }, { "epoch": 0.49, "learning_rate": 1.0829097077242438e-05, "loss": 0.8562, "step": 3523 }, { "epoch": 0.49, "learning_rate": 1.0824613567526627e-05, "loss": 0.8442, "step": 3524 }, { "epoch": 0.49, "learning_rate": 1.0820129890907054e-05, "loss": 0.8867, "step": 3525 }, { "epoch": 0.49, "learning_rate": 1.0815646048291221e-05, "loss": 0.8264, "step": 3526 }, { "epoch": 0.49, "learning_rate": 1.0811162040586673e-05, "loss": 0.8379, "step": 3527 }, { "epoch": 0.49, "learning_rate": 1.0806677868700983e-05, "loss": 0.8169, "step": 3528 }, { "epoch": 0.49, "learning_rate": 1.0802193533541756e-05, "loss": 0.5979, "step": 3529 }, { "epoch": 0.49, "learning_rate": 1.0797709036016637e-05, "loss": 0.897, "step": 3530 }, { "epoch": 0.49, "learning_rate": 1.0793224377033295e-05, "loss": 0.8699, "step": 3531 }, { "epoch": 0.49, "learning_rate": 1.0788739557499434e-05, "loss": 0.8533, "step": 3532 }, { "epoch": 0.49, "learning_rate": 1.0784254578322799e-05, "loss": 0.8586, "step": 3533 }, { "epoch": 0.49, "learning_rate": 1.0779769440411154e-05, "loss": 0.8538, "step": 3534 }, { "epoch": 0.49, "learning_rate": 1.0775284144672307e-05, "loss": 0.8682, "step": 3535 }, { "epoch": 0.49, "learning_rate": 1.0770798692014086e-05, "loss": 0.8625, "step": 3536 }, { "epoch": 0.49, "learning_rate": 1.0766313083344364e-05, "loss": 0.5916, "step": 3537 }, { "epoch": 0.49, "learning_rate": 1.0761827319571035e-05, "loss": 0.8269, "step": 3538 }, { "epoch": 0.49, "learning_rate": 1.0757341401602029e-05, "loss": 0.8572, "step": 3539 }, { "epoch": 0.49, "learning_rate": 1.075285533034531e-05, "loss": 0.917, "step": 3540 }, { "epoch": 0.49, "learning_rate": 1.0748369106708862e-05, "loss": 0.8174, "step": 3541 }, { "epoch": 0.49, "learning_rate": 1.0743882731600716e-05, "loss": 0.8818, "step": 3542 }, { "epoch": 0.49, "learning_rate": 1.0739396205928919e-05, "loss": 0.8333, "step": 3543 }, { "epoch": 0.49, "learning_rate": 1.0734909530601556e-05, "loss": 0.7886, "step": 3544 }, { "epoch": 0.49, "learning_rate": 1.0730422706526746e-05, "loss": 0.8877, "step": 3545 }, { "epoch": 0.49, "learning_rate": 1.0725935734612625e-05, "loss": 0.9353, "step": 3546 }, { "epoch": 0.49, "learning_rate": 1.072144861576737e-05, "loss": 0.8147, "step": 3547 }, { "epoch": 0.49, "learning_rate": 1.0716961350899186e-05, "loss": 0.853, "step": 3548 }, { "epoch": 0.49, "learning_rate": 1.0712473940916304e-05, "loss": 0.7715, "step": 3549 }, { "epoch": 0.49, "learning_rate": 1.0707986386726992e-05, "loss": 0.8545, "step": 3550 }, { "epoch": 0.49, "learning_rate": 1.0703498689239533e-05, "loss": 0.8752, "step": 3551 }, { "epoch": 0.49, "learning_rate": 1.0699010849362252e-05, "loss": 0.8533, "step": 3552 }, { "epoch": 0.49, "learning_rate": 1.06945228680035e-05, "loss": 0.8765, "step": 3553 }, { "epoch": 0.49, "learning_rate": 1.0690034746071654e-05, "loss": 0.887, "step": 3554 }, { "epoch": 0.49, "learning_rate": 1.0685546484475123e-05, "loss": 0.7732, "step": 3555 }, { "epoch": 0.49, "learning_rate": 1.0681058084122337e-05, "loss": 0.5946, "step": 3556 }, { "epoch": 0.49, "learning_rate": 1.067656954592176e-05, "loss": 0.8584, "step": 3557 }, { "epoch": 0.49, "learning_rate": 1.0672080870781887e-05, "loss": 0.8103, "step": 3558 }, { "epoch": 0.49, "learning_rate": 1.0667592059611232e-05, "loss": 0.8833, "step": 3559 }, { "epoch": 0.49, "learning_rate": 1.0663103113318342e-05, "loss": 0.9214, "step": 3560 }, { "epoch": 0.49, "learning_rate": 1.0658614032811796e-05, "loss": 0.8394, "step": 3561 }, { "epoch": 0.49, "learning_rate": 1.065412481900019e-05, "loss": 0.8467, "step": 3562 }, { "epoch": 0.49, "learning_rate": 1.0649635472792147e-05, "loss": 0.8127, "step": 3563 }, { "epoch": 0.5, "learning_rate": 1.0645145995096328e-05, "loss": 0.8125, "step": 3564 }, { "epoch": 0.5, "learning_rate": 1.0640656386821415e-05, "loss": 0.5983, "step": 3565 }, { "epoch": 0.5, "learning_rate": 1.0636166648876113e-05, "loss": 0.8247, "step": 3566 }, { "epoch": 0.5, "learning_rate": 1.0631676782169154e-05, "loss": 0.8906, "step": 3567 }, { "epoch": 0.5, "learning_rate": 1.0627186787609299e-05, "loss": 0.8562, "step": 3568 }, { "epoch": 0.5, "learning_rate": 1.0622696666105334e-05, "loss": 0.8621, "step": 3569 }, { "epoch": 0.5, "learning_rate": 1.0618206418566073e-05, "loss": 0.8721, "step": 3570 }, { "epoch": 0.5, "learning_rate": 1.0613716045900348e-05, "loss": 0.8821, "step": 3571 }, { "epoch": 0.5, "learning_rate": 1.0609225549017024e-05, "loss": 0.8657, "step": 3572 }, { "epoch": 0.5, "learning_rate": 1.0604734928824986e-05, "loss": 0.6071, "step": 3573 }, { "epoch": 0.5, "learning_rate": 1.060024418623315e-05, "loss": 0.9019, "step": 3574 }, { "epoch": 0.5, "learning_rate": 1.0595753322150453e-05, "loss": 0.7734, "step": 3575 }, { "epoch": 0.5, "learning_rate": 1.0591262337485852e-05, "loss": 0.827, "step": 3576 }, { "epoch": 0.5, "learning_rate": 1.0586771233148337e-05, "loss": 0.8965, "step": 3577 }, { "epoch": 0.5, "learning_rate": 1.0582280010046918e-05, "loss": 0.6146, "step": 3578 }, { "epoch": 0.5, "learning_rate": 1.0577788669090627e-05, "loss": 0.8667, "step": 3579 }, { "epoch": 0.5, "learning_rate": 1.0573297211188525e-05, "loss": 0.8533, "step": 3580 }, { "epoch": 0.5, "learning_rate": 1.0568805637249693e-05, "loss": 0.8037, "step": 3581 }, { "epoch": 0.5, "learning_rate": 1.0564313948183234e-05, "loss": 0.8779, "step": 3582 }, { "epoch": 0.5, "learning_rate": 1.055982214489828e-05, "loss": 0.8586, "step": 3583 }, { "epoch": 0.5, "learning_rate": 1.0555330228303981e-05, "loss": 0.8711, "step": 3584 }, { "epoch": 0.5, "learning_rate": 1.0550838199309512e-05, "loss": 0.8423, "step": 3585 }, { "epoch": 0.5, "learning_rate": 1.0546346058824068e-05, "loss": 0.776, "step": 3586 }, { "epoch": 0.5, "learning_rate": 1.0541853807756874e-05, "loss": 0.8201, "step": 3587 }, { "epoch": 0.5, "learning_rate": 1.0537361447017169e-05, "loss": 0.9026, "step": 3588 }, { "epoch": 0.5, "learning_rate": 1.0532868977514222e-05, "loss": 0.8318, "step": 3589 }, { "epoch": 0.5, "learning_rate": 1.0528376400157312e-05, "loss": 0.8677, "step": 3590 }, { "epoch": 0.5, "learning_rate": 1.0523883715855751e-05, "loss": 0.8403, "step": 3591 }, { "epoch": 0.5, "learning_rate": 1.0519390925518872e-05, "loss": 0.8235, "step": 3592 }, { "epoch": 0.5, "learning_rate": 1.0514898030056025e-05, "loss": 0.853, "step": 3593 }, { "epoch": 0.5, "learning_rate": 1.0510405030376577e-05, "loss": 0.7722, "step": 3594 }, { "epoch": 0.5, "learning_rate": 1.0505911927389932e-05, "loss": 0.9155, "step": 3595 }, { "epoch": 0.5, "learning_rate": 1.0501418722005497e-05, "loss": 0.8735, "step": 3596 }, { "epoch": 0.5, "learning_rate": 1.049692541513271e-05, "loss": 0.811, "step": 3597 }, { "epoch": 0.5, "learning_rate": 1.0492432007681027e-05, "loss": 0.8013, "step": 3598 }, { "epoch": 0.5, "learning_rate": 1.0487938500559926e-05, "loss": 0.8372, "step": 3599 }, { "epoch": 0.5, "learning_rate": 1.0483444894678902e-05, "loss": 0.8408, "step": 3600 }, { "epoch": 0.5, "learning_rate": 1.0478951190947473e-05, "loss": 0.855, "step": 3601 }, { "epoch": 0.5, "learning_rate": 1.0474457390275172e-05, "loss": 0.8347, "step": 3602 }, { "epoch": 0.5, "learning_rate": 1.046996349357156e-05, "loss": 0.8667, "step": 3603 }, { "epoch": 0.5, "learning_rate": 1.0465469501746207e-05, "loss": 0.8528, "step": 3604 }, { "epoch": 0.5, "learning_rate": 1.0460975415708712e-05, "loss": 0.7847, "step": 3605 }, { "epoch": 0.5, "learning_rate": 1.0456481236368688e-05, "loss": 0.8079, "step": 3606 }, { "epoch": 0.5, "learning_rate": 1.0451986964635767e-05, "loss": 0.8953, "step": 3607 }, { "epoch": 0.5, "learning_rate": 1.0447492601419599e-05, "loss": 0.8977, "step": 3608 }, { "epoch": 0.5, "learning_rate": 1.0442998147629856e-05, "loss": 0.8358, "step": 3609 }, { "epoch": 0.5, "learning_rate": 1.0438503604176224e-05, "loss": 0.8459, "step": 3610 }, { "epoch": 0.5, "learning_rate": 1.0434008971968415e-05, "loss": 0.8347, "step": 3611 }, { "epoch": 0.5, "learning_rate": 1.0429514251916146e-05, "loss": 0.8115, "step": 3612 }, { "epoch": 0.5, "learning_rate": 1.0425019444929163e-05, "loss": 0.8596, "step": 3613 }, { "epoch": 0.5, "learning_rate": 1.0420524551917226e-05, "loss": 0.8234, "step": 3614 }, { "epoch": 0.5, "learning_rate": 1.041602957379011e-05, "loss": 0.8767, "step": 3615 }, { "epoch": 0.5, "learning_rate": 1.0411534511457613e-05, "loss": 0.8148, "step": 3616 }, { "epoch": 0.5, "learning_rate": 1.0407039365829541e-05, "loss": 0.8579, "step": 3617 }, { "epoch": 0.5, "learning_rate": 1.0402544137815724e-05, "loss": 0.855, "step": 3618 }, { "epoch": 0.5, "learning_rate": 1.039804882832601e-05, "loss": 0.6259, "step": 3619 }, { "epoch": 0.5, "learning_rate": 1.039355343827026e-05, "loss": 0.8396, "step": 3620 }, { "epoch": 0.5, "learning_rate": 1.0389057968558347e-05, "loss": 0.8296, "step": 3621 }, { "epoch": 0.5, "learning_rate": 1.0384562420100173e-05, "loss": 0.5833, "step": 3622 }, { "epoch": 0.5, "learning_rate": 1.0380066793805639e-05, "loss": 0.8157, "step": 3623 }, { "epoch": 0.5, "learning_rate": 1.0375571090584675e-05, "loss": 0.8467, "step": 3624 }, { "epoch": 0.5, "learning_rate": 1.037107531134722e-05, "loss": 0.8672, "step": 3625 }, { "epoch": 0.5, "learning_rate": 1.0366579457003234e-05, "loss": 0.9104, "step": 3626 }, { "epoch": 0.5, "learning_rate": 1.0362083528462689e-05, "loss": 0.8708, "step": 3627 }, { "epoch": 0.5, "learning_rate": 1.0357587526635569e-05, "loss": 0.8333, "step": 3628 }, { "epoch": 0.5, "learning_rate": 1.035309145243187e-05, "loss": 0.8987, "step": 3629 }, { "epoch": 0.5, "learning_rate": 1.0348595306761622e-05, "loss": 0.8171, "step": 3630 }, { "epoch": 0.5, "learning_rate": 1.0344099090534843e-05, "loss": 0.7947, "step": 3631 }, { "epoch": 0.5, "learning_rate": 1.0339602804661587e-05, "loss": 0.8608, "step": 3632 }, { "epoch": 0.5, "learning_rate": 1.0335106450051907e-05, "loss": 0.8547, "step": 3633 }, { "epoch": 0.5, "learning_rate": 1.0330610027615874e-05, "loss": 0.8579, "step": 3634 }, { "epoch": 0.5, "learning_rate": 1.0326113538263583e-05, "loss": 0.8557, "step": 3635 }, { "epoch": 0.51, "learning_rate": 1.0321616982905128e-05, "loss": 0.7552, "step": 3636 }, { "epoch": 0.51, "learning_rate": 1.0317120362450626e-05, "loss": 0.8169, "step": 3637 }, { "epoch": 0.51, "learning_rate": 1.0312623677810201e-05, "loss": 0.8196, "step": 3638 }, { "epoch": 0.51, "learning_rate": 1.0308126929893993e-05, "loss": 0.8452, "step": 3639 }, { "epoch": 0.51, "learning_rate": 1.0303630119612156e-05, "loss": 0.8708, "step": 3640 }, { "epoch": 0.51, "learning_rate": 1.0299133247874856e-05, "loss": 0.9207, "step": 3641 }, { "epoch": 0.51, "learning_rate": 1.0294636315592269e-05, "loss": 0.8652, "step": 3642 }, { "epoch": 0.51, "learning_rate": 1.0290139323674584e-05, "loss": 0.8369, "step": 3643 }, { "epoch": 0.51, "learning_rate": 1.0285642273032004e-05, "loss": 0.8625, "step": 3644 }, { "epoch": 0.51, "learning_rate": 1.0281145164574741e-05, "loss": 0.8779, "step": 3645 }, { "epoch": 0.51, "learning_rate": 1.0276647999213026e-05, "loss": 0.8484, "step": 3646 }, { "epoch": 0.51, "learning_rate": 1.0272150777857092e-05, "loss": 0.8562, "step": 3647 }, { "epoch": 0.51, "learning_rate": 1.0267653501417187e-05, "loss": 0.8647, "step": 3648 }, { "epoch": 0.51, "learning_rate": 1.0263156170803572e-05, "loss": 0.8586, "step": 3649 }, { "epoch": 0.51, "learning_rate": 1.0258658786926516e-05, "loss": 0.8306, "step": 3650 }, { "epoch": 0.51, "learning_rate": 1.0254161350696302e-05, "loss": 0.8513, "step": 3651 }, { "epoch": 0.51, "learning_rate": 1.0249663863023223e-05, "loss": 0.8779, "step": 3652 }, { "epoch": 0.51, "learning_rate": 1.0245166324817577e-05, "loss": 0.6229, "step": 3653 }, { "epoch": 0.51, "learning_rate": 1.0240668736989679e-05, "loss": 0.8784, "step": 3654 }, { "epoch": 0.51, "learning_rate": 1.023617110044985e-05, "loss": 0.9148, "step": 3655 }, { "epoch": 0.51, "learning_rate": 1.0231673416108425e-05, "loss": 0.8604, "step": 3656 }, { "epoch": 0.51, "learning_rate": 1.0227175684875748e-05, "loss": 0.8638, "step": 3657 }, { "epoch": 0.51, "learning_rate": 1.0222677907662165e-05, "loss": 0.8621, "step": 3658 }, { "epoch": 0.51, "learning_rate": 1.0218180085378038e-05, "loss": 0.8147, "step": 3659 }, { "epoch": 0.51, "learning_rate": 1.021368221893374e-05, "loss": 0.8738, "step": 3660 }, { "epoch": 0.51, "learning_rate": 1.0209184309239649e-05, "loss": 0.8735, "step": 3661 }, { "epoch": 0.51, "learning_rate": 1.0204686357206153e-05, "loss": 0.843, "step": 3662 }, { "epoch": 0.51, "learning_rate": 1.0200188363743645e-05, "loss": 0.845, "step": 3663 }, { "epoch": 0.51, "learning_rate": 1.0195690329762533e-05, "loss": 0.9121, "step": 3664 }, { "epoch": 0.51, "learning_rate": 1.0191192256173227e-05, "loss": 0.8774, "step": 3665 }, { "epoch": 0.51, "learning_rate": 1.0186694143886153e-05, "loss": 0.894, "step": 3666 }, { "epoch": 0.51, "learning_rate": 1.0182195993811736e-05, "loss": 0.8984, "step": 3667 }, { "epoch": 0.51, "learning_rate": 1.0177697806860413e-05, "loss": 0.8021, "step": 3668 }, { "epoch": 0.51, "learning_rate": 1.0173199583942628e-05, "loss": 0.6044, "step": 3669 }, { "epoch": 0.51, "learning_rate": 1.016870132596883e-05, "loss": 0.8975, "step": 3670 }, { "epoch": 0.51, "learning_rate": 1.016420303384948e-05, "loss": 0.8867, "step": 3671 }, { "epoch": 0.51, "learning_rate": 1.0159704708495043e-05, "loss": 0.8099, "step": 3672 }, { "epoch": 0.51, "learning_rate": 1.0155206350815988e-05, "loss": 0.8442, "step": 3673 }, { "epoch": 0.51, "learning_rate": 1.0150707961722797e-05, "loss": 0.8735, "step": 3674 }, { "epoch": 0.51, "learning_rate": 1.0146209542125953e-05, "loss": 0.7598, "step": 3675 }, { "epoch": 0.51, "learning_rate": 1.0141711092935947e-05, "loss": 0.8508, "step": 3676 }, { "epoch": 0.51, "learning_rate": 1.0137212615063277e-05, "loss": 0.8491, "step": 3677 }, { "epoch": 0.51, "learning_rate": 1.0132714109418443e-05, "loss": 0.8672, "step": 3678 }, { "epoch": 0.51, "learning_rate": 1.0128215576911955e-05, "loss": 0.8337, "step": 3679 }, { "epoch": 0.51, "learning_rate": 1.0123717018454326e-05, "loss": 0.8931, "step": 3680 }, { "epoch": 0.51, "learning_rate": 1.0119218434956076e-05, "loss": 0.8728, "step": 3681 }, { "epoch": 0.51, "learning_rate": 1.011471982732773e-05, "loss": 0.8257, "step": 3682 }, { "epoch": 0.51, "learning_rate": 1.0110221196479817e-05, "loss": 0.8208, "step": 3683 }, { "epoch": 0.51, "learning_rate": 1.0105722543322866e-05, "loss": 0.9094, "step": 3684 }, { "epoch": 0.51, "learning_rate": 1.0101223868767422e-05, "loss": 0.8552, "step": 3685 }, { "epoch": 0.51, "learning_rate": 1.0096725173724023e-05, "loss": 0.8689, "step": 3686 }, { "epoch": 0.51, "learning_rate": 1.0092226459103215e-05, "loss": 0.7747, "step": 3687 }, { "epoch": 0.51, "learning_rate": 1.0087727725815555e-05, "loss": 0.8738, "step": 3688 }, { "epoch": 0.51, "learning_rate": 1.0083228974771589e-05, "loss": 0.79, "step": 3689 }, { "epoch": 0.51, "learning_rate": 1.007873020688188e-05, "loss": 0.843, "step": 3690 }, { "epoch": 0.51, "learning_rate": 1.0074231423056988e-05, "loss": 0.7632, "step": 3691 }, { "epoch": 0.51, "learning_rate": 1.0069732624207478e-05, "loss": 0.8105, "step": 3692 }, { "epoch": 0.51, "learning_rate": 1.006523381124392e-05, "loss": 0.7502, "step": 3693 }, { "epoch": 0.51, "learning_rate": 1.006073498507688e-05, "loss": 0.5671, "step": 3694 }, { "epoch": 0.51, "learning_rate": 1.0056236146616931e-05, "loss": 0.7693, "step": 3695 }, { "epoch": 0.51, "learning_rate": 1.0051737296774654e-05, "loss": 0.8757, "step": 3696 }, { "epoch": 0.51, "learning_rate": 1.0047238436460624e-05, "loss": 0.8181, "step": 3697 }, { "epoch": 0.51, "learning_rate": 1.0042739566585422e-05, "loss": 0.8577, "step": 3698 }, { "epoch": 0.51, "learning_rate": 1.0038240688059628e-05, "loss": 0.8818, "step": 3699 }, { "epoch": 0.51, "learning_rate": 1.0033741801793826e-05, "loss": 0.8013, "step": 3700 }, { "epoch": 0.51, "learning_rate": 1.0029242908698605e-05, "loss": 0.853, "step": 3701 }, { "epoch": 0.51, "learning_rate": 1.0024744009684546e-05, "loss": 0.8826, "step": 3702 }, { "epoch": 0.51, "learning_rate": 1.0020245105662243e-05, "loss": 0.8572, "step": 3703 }, { "epoch": 0.51, "learning_rate": 1.001574619754228e-05, "loss": 0.569, "step": 3704 }, { "epoch": 0.51, "learning_rate": 1.001124728623525e-05, "loss": 0.8892, "step": 3705 }, { "epoch": 0.51, "learning_rate": 1.000674837265174e-05, "loss": 0.8213, "step": 3706 }, { "epoch": 0.51, "learning_rate": 1.0002249457702347e-05, "loss": 0.8445, "step": 3707 }, { "epoch": 0.52, "learning_rate": 9.997750542297655e-06, "loss": 0.7964, "step": 3708 }, { "epoch": 0.52, "learning_rate": 9.993251627348261e-06, "loss": 0.8875, "step": 3709 }, { "epoch": 0.52, "learning_rate": 9.988752713764751e-06, "loss": 0.8462, "step": 3710 }, { "epoch": 0.52, "learning_rate": 9.984253802457723e-06, "loss": 0.7964, "step": 3711 }, { "epoch": 0.52, "learning_rate": 9.979754894337762e-06, "loss": 0.821, "step": 3712 }, { "epoch": 0.52, "learning_rate": 9.975255990315456e-06, "loss": 0.7952, "step": 3713 }, { "epoch": 0.52, "learning_rate": 9.9707570913014e-06, "loss": 0.8616, "step": 3714 }, { "epoch": 0.52, "learning_rate": 9.966258198206175e-06, "loss": 0.897, "step": 3715 }, { "epoch": 0.52, "learning_rate": 9.961759311940376e-06, "loss": 0.824, "step": 3716 }, { "epoch": 0.52, "learning_rate": 9.957260433414583e-06, "loss": 0.8457, "step": 3717 }, { "epoch": 0.52, "learning_rate": 9.952761563539377e-06, "loss": 0.918, "step": 3718 }, { "epoch": 0.52, "learning_rate": 9.948262703225349e-06, "loss": 0.8872, "step": 3719 }, { "epoch": 0.52, "learning_rate": 9.943763853383069e-06, "loss": 0.8774, "step": 3720 }, { "epoch": 0.52, "learning_rate": 9.939265014923124e-06, "loss": 0.8533, "step": 3721 }, { "epoch": 0.52, "learning_rate": 9.934766188756085e-06, "loss": 0.849, "step": 3722 }, { "epoch": 0.52, "learning_rate": 9.930267375792523e-06, "loss": 0.8545, "step": 3723 }, { "epoch": 0.52, "learning_rate": 9.925768576943016e-06, "loss": 0.6259, "step": 3724 }, { "epoch": 0.52, "learning_rate": 9.92126979311812e-06, "loss": 0.8208, "step": 3725 }, { "epoch": 0.52, "learning_rate": 9.916771025228412e-06, "loss": 0.9082, "step": 3726 }, { "epoch": 0.52, "learning_rate": 9.912272274184452e-06, "loss": 0.8474, "step": 3727 }, { "epoch": 0.52, "learning_rate": 9.907773540896786e-06, "loss": 0.9102, "step": 3728 }, { "epoch": 0.52, "learning_rate": 9.90327482627598e-06, "loss": 0.8496, "step": 3729 }, { "epoch": 0.52, "learning_rate": 9.89877613123258e-06, "loss": 0.8767, "step": 3730 }, { "epoch": 0.52, "learning_rate": 9.894277456677136e-06, "loss": 0.8298, "step": 3731 }, { "epoch": 0.52, "learning_rate": 9.889778803520188e-06, "loss": 0.8503, "step": 3732 }, { "epoch": 0.52, "learning_rate": 9.885280172672271e-06, "loss": 0.5726, "step": 3733 }, { "epoch": 0.52, "learning_rate": 9.880781565043926e-06, "loss": 0.7764, "step": 3734 }, { "epoch": 0.52, "learning_rate": 9.876282981545675e-06, "loss": 0.8389, "step": 3735 }, { "epoch": 0.52, "learning_rate": 9.871784423088048e-06, "loss": 0.573, "step": 3736 }, { "epoch": 0.52, "learning_rate": 9.867285890581562e-06, "loss": 0.814, "step": 3737 }, { "epoch": 0.52, "learning_rate": 9.862787384936726e-06, "loss": 0.8694, "step": 3738 }, { "epoch": 0.52, "learning_rate": 9.858288907064057e-06, "loss": 0.589, "step": 3739 }, { "epoch": 0.52, "learning_rate": 9.853790457874049e-06, "loss": 0.8315, "step": 3740 }, { "epoch": 0.52, "learning_rate": 9.849292038277204e-06, "loss": 0.928, "step": 3741 }, { "epoch": 0.52, "learning_rate": 9.844793649184017e-06, "loss": 0.8164, "step": 3742 }, { "epoch": 0.52, "learning_rate": 9.84029529150496e-06, "loss": 0.8284, "step": 3743 }, { "epoch": 0.52, "learning_rate": 9.835796966150524e-06, "loss": 0.8528, "step": 3744 }, { "epoch": 0.52, "learning_rate": 9.831298674031172e-06, "loss": 0.8298, "step": 3745 }, { "epoch": 0.52, "learning_rate": 9.826800416057377e-06, "loss": 0.8379, "step": 3746 }, { "epoch": 0.52, "learning_rate": 9.822302193139592e-06, "loss": 0.8087, "step": 3747 }, { "epoch": 0.52, "learning_rate": 9.817804006188266e-06, "loss": 0.8254, "step": 3748 }, { "epoch": 0.52, "learning_rate": 9.813305856113849e-06, "loss": 0.8599, "step": 3749 }, { "epoch": 0.52, "learning_rate": 9.808807743826771e-06, "loss": 0.8044, "step": 3750 }, { "epoch": 0.52, "learning_rate": 9.804309670237469e-06, "loss": 0.825, "step": 3751 }, { "epoch": 0.52, "learning_rate": 9.79981163625636e-06, "loss": 0.9436, "step": 3752 }, { "epoch": 0.52, "learning_rate": 9.79531364279385e-06, "loss": 0.8228, "step": 3753 }, { "epoch": 0.52, "learning_rate": 9.790815690760355e-06, "loss": 0.8491, "step": 3754 }, { "epoch": 0.52, "learning_rate": 9.78631778106626e-06, "loss": 0.8352, "step": 3755 }, { "epoch": 0.52, "learning_rate": 9.781819914621964e-06, "loss": 0.8972, "step": 3756 }, { "epoch": 0.52, "learning_rate": 9.77732209233784e-06, "loss": 0.8452, "step": 3757 }, { "epoch": 0.52, "learning_rate": 9.772824315124256e-06, "loss": 0.8428, "step": 3758 }, { "epoch": 0.52, "learning_rate": 9.768326583891578e-06, "loss": 0.9006, "step": 3759 }, { "epoch": 0.52, "learning_rate": 9.76382889955015e-06, "loss": 0.8879, "step": 3760 }, { "epoch": 0.52, "learning_rate": 9.759331263010325e-06, "loss": 0.7612, "step": 3761 }, { "epoch": 0.52, "learning_rate": 9.75483367518243e-06, "loss": 0.8658, "step": 3762 }, { "epoch": 0.52, "learning_rate": 9.75033613697678e-06, "loss": 0.8643, "step": 3763 }, { "epoch": 0.52, "learning_rate": 9.7458386493037e-06, "loss": 0.8574, "step": 3764 }, { "epoch": 0.52, "learning_rate": 9.741341213073484e-06, "loss": 0.8269, "step": 3765 }, { "epoch": 0.52, "learning_rate": 9.736843829196431e-06, "loss": 0.5964, "step": 3766 }, { "epoch": 0.52, "learning_rate": 9.732346498582816e-06, "loss": 0.8909, "step": 3767 }, { "epoch": 0.52, "learning_rate": 9.72784922214291e-06, "loss": 0.8506, "step": 3768 }, { "epoch": 0.52, "learning_rate": 9.723352000786976e-06, "loss": 0.8098, "step": 3769 }, { "epoch": 0.52, "learning_rate": 9.718854835425257e-06, "loss": 0.8494, "step": 3770 }, { "epoch": 0.52, "learning_rate": 9.714357726968e-06, "loss": 0.3783, "step": 3771 }, { "epoch": 0.52, "learning_rate": 9.70986067632542e-06, "loss": 0.8748, "step": 3772 }, { "epoch": 0.52, "learning_rate": 9.705363684407733e-06, "loss": 0.8245, "step": 3773 }, { "epoch": 0.52, "learning_rate": 9.700866752125148e-06, "loss": 0.8442, "step": 3774 }, { "epoch": 0.52, "learning_rate": 9.696369880387845e-06, "loss": 0.8818, "step": 3775 }, { "epoch": 0.52, "learning_rate": 9.691873070106009e-06, "loss": 0.8594, "step": 3776 }, { "epoch": 0.52, "learning_rate": 9.687376322189804e-06, "loss": 0.5712, "step": 3777 }, { "epoch": 0.52, "learning_rate": 9.682879637549376e-06, "loss": 0.8442, "step": 3778 }, { "epoch": 0.52, "learning_rate": 9.678383017094875e-06, "loss": 0.8855, "step": 3779 }, { "epoch": 0.53, "learning_rate": 9.673886461736419e-06, "loss": 0.863, "step": 3780 }, { "epoch": 0.53, "learning_rate": 9.669389972384127e-06, "loss": 0.8887, "step": 3781 }, { "epoch": 0.53, "learning_rate": 9.6648935499481e-06, "loss": 0.8503, "step": 3782 }, { "epoch": 0.53, "learning_rate": 9.660397195338417e-06, "loss": 0.8821, "step": 3783 }, { "epoch": 0.53, "learning_rate": 9.65590090946516e-06, "loss": 0.8093, "step": 3784 }, { "epoch": 0.53, "learning_rate": 9.65140469323838e-06, "loss": 0.8704, "step": 3785 }, { "epoch": 0.53, "learning_rate": 9.646908547568131e-06, "loss": 0.802, "step": 3786 }, { "epoch": 0.53, "learning_rate": 9.642412473364438e-06, "loss": 0.8281, "step": 3787 }, { "epoch": 0.53, "learning_rate": 9.637916471537313e-06, "loss": 0.8027, "step": 3788 }, { "epoch": 0.53, "learning_rate": 9.633420542996767e-06, "loss": 0.8179, "step": 3789 }, { "epoch": 0.53, "learning_rate": 9.628924688652783e-06, "loss": 0.8657, "step": 3790 }, { "epoch": 0.53, "learning_rate": 9.624428909415328e-06, "loss": 0.5921, "step": 3791 }, { "epoch": 0.53, "learning_rate": 9.619933206194366e-06, "loss": 0.8647, "step": 3792 }, { "epoch": 0.53, "learning_rate": 9.61543757989983e-06, "loss": 0.8208, "step": 3793 }, { "epoch": 0.53, "learning_rate": 9.610942031441656e-06, "loss": 0.8066, "step": 3794 }, { "epoch": 0.53, "learning_rate": 9.606446561729744e-06, "loss": 0.8416, "step": 3795 }, { "epoch": 0.53, "learning_rate": 9.601951171673991e-06, "loss": 0.8572, "step": 3796 }, { "epoch": 0.53, "learning_rate": 9.59745586218428e-06, "loss": 0.8643, "step": 3797 }, { "epoch": 0.53, "learning_rate": 9.592960634170462e-06, "loss": 0.8926, "step": 3798 }, { "epoch": 0.53, "learning_rate": 9.588465488542394e-06, "loss": 0.8604, "step": 3799 }, { "epoch": 0.53, "learning_rate": 9.583970426209894e-06, "loss": 0.8645, "step": 3800 }, { "epoch": 0.53, "learning_rate": 9.579475448082777e-06, "loss": 0.8214, "step": 3801 }, { "epoch": 0.53, "learning_rate": 9.574980555070842e-06, "loss": 0.7393, "step": 3802 }, { "epoch": 0.53, "learning_rate": 9.570485748083856e-06, "loss": 0.6033, "step": 3803 }, { "epoch": 0.53, "learning_rate": 9.56599102803159e-06, "loss": 0.8635, "step": 3804 }, { "epoch": 0.53, "learning_rate": 9.561496395823777e-06, "loss": 0.8091, "step": 3805 }, { "epoch": 0.53, "learning_rate": 9.557001852370147e-06, "loss": 0.9446, "step": 3806 }, { "epoch": 0.53, "learning_rate": 9.552507398580404e-06, "loss": 0.8882, "step": 3807 }, { "epoch": 0.53, "learning_rate": 9.548013035364235e-06, "loss": 0.8147, "step": 3808 }, { "epoch": 0.53, "learning_rate": 9.543518763631315e-06, "loss": 0.8679, "step": 3809 }, { "epoch": 0.53, "learning_rate": 9.53902458429129e-06, "loss": 0.8508, "step": 3810 }, { "epoch": 0.53, "learning_rate": 9.534530498253794e-06, "loss": 0.8638, "step": 3811 }, { "epoch": 0.53, "learning_rate": 9.530036506428445e-06, "loss": 0.8589, "step": 3812 }, { "epoch": 0.53, "learning_rate": 9.525542609724831e-06, "loss": 0.8323, "step": 3813 }, { "epoch": 0.53, "learning_rate": 9.52104880905253e-06, "loss": 0.8513, "step": 3814 }, { "epoch": 0.53, "learning_rate": 9.5165551053211e-06, "loss": 0.8467, "step": 3815 }, { "epoch": 0.53, "learning_rate": 9.512061499440075e-06, "loss": 0.757, "step": 3816 }, { "epoch": 0.53, "learning_rate": 9.507567992318976e-06, "loss": 0.8259, "step": 3817 }, { "epoch": 0.53, "learning_rate": 9.503074584867293e-06, "loss": 0.8796, "step": 3818 }, { "epoch": 0.53, "learning_rate": 9.498581277994506e-06, "loss": 0.5935, "step": 3819 }, { "epoch": 0.53, "learning_rate": 9.494088072610071e-06, "loss": 0.8711, "step": 3820 }, { "epoch": 0.53, "learning_rate": 9.489594969623424e-06, "loss": 0.7998, "step": 3821 }, { "epoch": 0.53, "learning_rate": 9.48510196994398e-06, "loss": 0.8372, "step": 3822 }, { "epoch": 0.53, "learning_rate": 9.48060907448113e-06, "loss": 0.8381, "step": 3823 }, { "epoch": 0.53, "learning_rate": 9.47611628414425e-06, "loss": 0.9277, "step": 3824 }, { "epoch": 0.53, "learning_rate": 9.471623599842691e-06, "loss": 0.854, "step": 3825 }, { "epoch": 0.53, "learning_rate": 9.467131022485781e-06, "loss": 0.8623, "step": 3826 }, { "epoch": 0.53, "learning_rate": 9.462638552982831e-06, "loss": 0.8289, "step": 3827 }, { "epoch": 0.53, "learning_rate": 9.458146192243129e-06, "loss": 0.7719, "step": 3828 }, { "epoch": 0.53, "learning_rate": 9.453653941175933e-06, "loss": 0.7957, "step": 3829 }, { "epoch": 0.53, "learning_rate": 9.449161800690492e-06, "loss": 0.8604, "step": 3830 }, { "epoch": 0.53, "learning_rate": 9.44466977169602e-06, "loss": 0.7848, "step": 3831 }, { "epoch": 0.53, "learning_rate": 9.440177855101722e-06, "loss": 0.7932, "step": 3832 }, { "epoch": 0.53, "learning_rate": 9.43568605181677e-06, "loss": 0.8589, "step": 3833 }, { "epoch": 0.53, "learning_rate": 9.43119436275031e-06, "loss": 0.5986, "step": 3834 }, { "epoch": 0.53, "learning_rate": 9.426702788811476e-06, "loss": 0.8782, "step": 3835 }, { "epoch": 0.53, "learning_rate": 9.422211330909377e-06, "loss": 0.8076, "step": 3836 }, { "epoch": 0.53, "learning_rate": 9.417719989953084e-06, "loss": 0.7079, "step": 3837 }, { "epoch": 0.53, "learning_rate": 9.413228766851665e-06, "loss": 0.7495, "step": 3838 }, { "epoch": 0.53, "learning_rate": 9.40873766251415e-06, "loss": 0.8711, "step": 3839 }, { "epoch": 0.53, "learning_rate": 9.40424667784955e-06, "loss": 0.8425, "step": 3840 }, { "epoch": 0.53, "learning_rate": 9.399755813766853e-06, "loss": 0.5692, "step": 3841 }, { "epoch": 0.53, "learning_rate": 9.395265071175014e-06, "loss": 0.8103, "step": 3842 }, { "epoch": 0.53, "learning_rate": 9.39077445098298e-06, "loss": 0.5867, "step": 3843 }, { "epoch": 0.53, "learning_rate": 9.386283954099654e-06, "loss": 0.5901, "step": 3844 }, { "epoch": 0.53, "learning_rate": 9.38179358143393e-06, "loss": 0.8689, "step": 3845 }, { "epoch": 0.53, "learning_rate": 9.377303333894668e-06, "loss": 0.8657, "step": 3846 }, { "epoch": 0.53, "learning_rate": 9.372813212390701e-06, "loss": 0.8021, "step": 3847 }, { "epoch": 0.53, "learning_rate": 9.368323217830849e-06, "loss": 0.8372, "step": 3848 }, { "epoch": 0.53, "learning_rate": 9.36383335112389e-06, "loss": 0.8718, "step": 3849 }, { "epoch": 0.53, "learning_rate": 9.359343613178585e-06, "loss": 0.9155, "step": 3850 }, { "epoch": 0.53, "learning_rate": 9.354854004903674e-06, "loss": 0.5573, "step": 3851 }, { "epoch": 0.54, "learning_rate": 9.350364527207853e-06, "loss": 0.8494, "step": 3852 }, { "epoch": 0.54, "learning_rate": 9.345875180999816e-06, "loss": 0.855, "step": 3853 }, { "epoch": 0.54, "learning_rate": 9.341385967188205e-06, "loss": 0.8398, "step": 3854 }, { "epoch": 0.54, "learning_rate": 9.336896886681656e-06, "loss": 0.7417, "step": 3855 }, { "epoch": 0.54, "learning_rate": 9.332407940388771e-06, "loss": 0.8416, "step": 3856 }, { "epoch": 0.54, "learning_rate": 9.327919129218115e-06, "loss": 0.8555, "step": 3857 }, { "epoch": 0.54, "learning_rate": 9.323430454078242e-06, "loss": 0.8909, "step": 3858 }, { "epoch": 0.54, "learning_rate": 9.318941915877666e-06, "loss": 0.8499, "step": 3859 }, { "epoch": 0.54, "learning_rate": 9.314453515524879e-06, "loss": 0.8429, "step": 3860 }, { "epoch": 0.54, "learning_rate": 9.309965253928348e-06, "loss": 0.8866, "step": 3861 }, { "epoch": 0.54, "learning_rate": 9.3054771319965e-06, "loss": 0.843, "step": 3862 }, { "epoch": 0.54, "learning_rate": 9.30098915063775e-06, "loss": 0.875, "step": 3863 }, { "epoch": 0.54, "learning_rate": 9.296501310760472e-06, "loss": 0.9177, "step": 3864 }, { "epoch": 0.54, "learning_rate": 9.292013613273012e-06, "loss": 0.7764, "step": 3865 }, { "epoch": 0.54, "learning_rate": 9.287526059083697e-06, "loss": 0.8486, "step": 3866 }, { "epoch": 0.54, "learning_rate": 9.283038649100815e-06, "loss": 0.8157, "step": 3867 }, { "epoch": 0.54, "learning_rate": 9.278551384232633e-06, "loss": 0.8772, "step": 3868 }, { "epoch": 0.54, "learning_rate": 9.27406426538738e-06, "loss": 0.8171, "step": 3869 }, { "epoch": 0.54, "learning_rate": 9.269577293473257e-06, "loss": 0.7998, "step": 3870 }, { "epoch": 0.54, "learning_rate": 9.265090469398446e-06, "loss": 0.8394, "step": 3871 }, { "epoch": 0.54, "learning_rate": 9.260603794071081e-06, "loss": 0.8354, "step": 3872 }, { "epoch": 0.54, "learning_rate": 9.256117268399287e-06, "loss": 0.5799, "step": 3873 }, { "epoch": 0.54, "learning_rate": 9.251630893291141e-06, "loss": 0.7693, "step": 3874 }, { "epoch": 0.54, "learning_rate": 9.247144669654692e-06, "loss": 0.8286, "step": 3875 }, { "epoch": 0.54, "learning_rate": 9.242658598397975e-06, "loss": 0.8892, "step": 3876 }, { "epoch": 0.54, "learning_rate": 9.238172680428967e-06, "loss": 0.7743, "step": 3877 }, { "epoch": 0.54, "learning_rate": 9.23368691665564e-06, "loss": 0.8091, "step": 3878 }, { "epoch": 0.54, "learning_rate": 9.229201307985917e-06, "loss": 0.8813, "step": 3879 }, { "epoch": 0.54, "learning_rate": 9.224715855327696e-06, "loss": 0.8352, "step": 3880 }, { "epoch": 0.54, "learning_rate": 9.22023055958885e-06, "loss": 0.8057, "step": 3881 }, { "epoch": 0.54, "learning_rate": 9.215745421677203e-06, "loss": 0.7891, "step": 3882 }, { "epoch": 0.54, "learning_rate": 9.211260442500567e-06, "loss": 0.8633, "step": 3883 }, { "epoch": 0.54, "learning_rate": 9.20677562296671e-06, "loss": 0.8011, "step": 3884 }, { "epoch": 0.54, "learning_rate": 9.202290963983365e-06, "loss": 0.7893, "step": 3885 }, { "epoch": 0.54, "learning_rate": 9.197806466458247e-06, "loss": 0.814, "step": 3886 }, { "epoch": 0.54, "learning_rate": 9.193322131299018e-06, "loss": 0.8911, "step": 3887 }, { "epoch": 0.54, "learning_rate": 9.18883795941333e-06, "loss": 0.8381, "step": 3888 }, { "epoch": 0.54, "learning_rate": 9.184353951708784e-06, "loss": 0.7485, "step": 3889 }, { "epoch": 0.54, "learning_rate": 9.179870109092949e-06, "loss": 0.6167, "step": 3890 }, { "epoch": 0.54, "learning_rate": 9.175386432473375e-06, "loss": 0.8464, "step": 3891 }, { "epoch": 0.54, "learning_rate": 9.170902922757562e-06, "loss": 0.5687, "step": 3892 }, { "epoch": 0.54, "learning_rate": 9.166419580852989e-06, "loss": 0.8418, "step": 3893 }, { "epoch": 0.54, "learning_rate": 9.161936407667091e-06, "loss": 0.8704, "step": 3894 }, { "epoch": 0.54, "learning_rate": 9.15745340410727e-06, "loss": 0.855, "step": 3895 }, { "epoch": 0.54, "learning_rate": 9.152970571080907e-06, "loss": 0.865, "step": 3896 }, { "epoch": 0.54, "learning_rate": 9.148487909495327e-06, "loss": 0.8076, "step": 3897 }, { "epoch": 0.54, "learning_rate": 9.144005420257837e-06, "loss": 0.8345, "step": 3898 }, { "epoch": 0.54, "learning_rate": 9.139523104275706e-06, "loss": 0.8979, "step": 3899 }, { "epoch": 0.54, "learning_rate": 9.135040962456158e-06, "loss": 0.7646, "step": 3900 }, { "epoch": 0.54, "learning_rate": 9.130558995706397e-06, "loss": 0.822, "step": 3901 }, { "epoch": 0.54, "learning_rate": 9.126077204933575e-06, "loss": 0.8306, "step": 3902 }, { "epoch": 0.54, "learning_rate": 9.121595591044829e-06, "loss": 0.9116, "step": 3903 }, { "epoch": 0.54, "learning_rate": 9.11711415494724e-06, "loss": 0.8684, "step": 3904 }, { "epoch": 0.54, "learning_rate": 9.11263289754786e-06, "loss": 0.7996, "step": 3905 }, { "epoch": 0.54, "learning_rate": 9.108151819753714e-06, "loss": 0.8906, "step": 3906 }, { "epoch": 0.54, "learning_rate": 9.103670922471775e-06, "loss": 0.8643, "step": 3907 }, { "epoch": 0.54, "learning_rate": 9.099190206608993e-06, "loss": 0.8342, "step": 3908 }, { "epoch": 0.54, "learning_rate": 9.094709673072276e-06, "loss": 0.8694, "step": 3909 }, { "epoch": 0.54, "learning_rate": 9.090229322768485e-06, "loss": 0.8427, "step": 3910 }, { "epoch": 0.54, "learning_rate": 9.085749156604468e-06, "loss": 0.8457, "step": 3911 }, { "epoch": 0.54, "learning_rate": 9.081269175487008e-06, "loss": 0.803, "step": 3912 }, { "epoch": 0.54, "learning_rate": 9.076789380322876e-06, "loss": 0.801, "step": 3913 }, { "epoch": 0.54, "learning_rate": 9.072309772018785e-06, "loss": 0.8826, "step": 3914 }, { "epoch": 0.54, "learning_rate": 9.067830351481419e-06, "loss": 0.8569, "step": 3915 }, { "epoch": 0.54, "learning_rate": 9.06335111961743e-06, "loss": 0.7666, "step": 3916 }, { "epoch": 0.54, "learning_rate": 9.058872077333414e-06, "loss": 0.8745, "step": 3917 }, { "epoch": 0.54, "learning_rate": 9.054393225535953e-06, "loss": 0.6184, "step": 3918 }, { "epoch": 0.54, "learning_rate": 9.04991456513157e-06, "loss": 0.8635, "step": 3919 }, { "epoch": 0.54, "learning_rate": 9.045436097026753e-06, "loss": 0.8342, "step": 3920 }, { "epoch": 0.54, "learning_rate": 9.040957822127964e-06, "loss": 0.8245, "step": 3921 }, { "epoch": 0.54, "learning_rate": 9.036479741341606e-06, "loss": 0.825, "step": 3922 }, { "epoch": 0.54, "learning_rate": 9.032001855574065e-06, "loss": 0.8618, "step": 3923 }, { "epoch": 0.55, "learning_rate": 9.02752416573167e-06, "loss": 0.6018, "step": 3924 }, { "epoch": 0.55, "learning_rate": 9.023046672720711e-06, "loss": 0.8499, "step": 3925 }, { "epoch": 0.55, "learning_rate": 9.018569377447453e-06, "loss": 0.8108, "step": 3926 }, { "epoch": 0.55, "learning_rate": 9.014092280818102e-06, "loss": 0.8992, "step": 3927 }, { "epoch": 0.55, "learning_rate": 9.009615383738843e-06, "loss": 0.8381, "step": 3928 }, { "epoch": 0.55, "learning_rate": 9.005138687115804e-06, "loss": 0.8782, "step": 3929 }, { "epoch": 0.55, "learning_rate": 9.000662191855076e-06, "loss": 0.8928, "step": 3930 }, { "epoch": 0.55, "learning_rate": 8.996185898862723e-06, "loss": 0.8079, "step": 3931 }, { "epoch": 0.55, "learning_rate": 8.991709809044746e-06, "loss": 0.8506, "step": 3932 }, { "epoch": 0.55, "learning_rate": 8.987233923307125e-06, "loss": 0.8423, "step": 3933 }, { "epoch": 0.55, "learning_rate": 8.982758242555789e-06, "loss": 0.822, "step": 3934 }, { "epoch": 0.55, "learning_rate": 8.978282767696618e-06, "loss": 0.8518, "step": 3935 }, { "epoch": 0.55, "learning_rate": 8.973807499635472e-06, "loss": 0.8174, "step": 3936 }, { "epoch": 0.55, "learning_rate": 8.969332439278142e-06, "loss": 0.8269, "step": 3937 }, { "epoch": 0.55, "learning_rate": 8.964857587530404e-06, "loss": 0.7959, "step": 3938 }, { "epoch": 0.55, "learning_rate": 8.960382945297974e-06, "loss": 0.6003, "step": 3939 }, { "epoch": 0.55, "learning_rate": 8.955908513486521e-06, "loss": 0.8687, "step": 3940 }, { "epoch": 0.55, "learning_rate": 8.951434293001695e-06, "loss": 0.9095, "step": 3941 }, { "epoch": 0.55, "learning_rate": 8.946960284749078e-06, "loss": 0.8047, "step": 3942 }, { "epoch": 0.55, "learning_rate": 8.942486489634232e-06, "loss": 0.8044, "step": 3943 }, { "epoch": 0.55, "learning_rate": 8.938012908562653e-06, "loss": 0.7876, "step": 3944 }, { "epoch": 0.55, "learning_rate": 8.933539542439805e-06, "loss": 0.824, "step": 3945 }, { "epoch": 0.55, "learning_rate": 8.929066392171116e-06, "loss": 0.8936, "step": 3946 }, { "epoch": 0.55, "learning_rate": 8.924593458661953e-06, "loss": 0.844, "step": 3947 }, { "epoch": 0.55, "learning_rate": 8.920120742817657e-06, "loss": 0.8694, "step": 3948 }, { "epoch": 0.55, "learning_rate": 8.915648245543507e-06, "loss": 0.813, "step": 3949 }, { "epoch": 0.55, "learning_rate": 8.911175967744758e-06, "loss": 0.866, "step": 3950 }, { "epoch": 0.55, "learning_rate": 8.906703910326606e-06, "loss": 0.8655, "step": 3951 }, { "epoch": 0.55, "learning_rate": 8.902232074194198e-06, "loss": 0.8276, "step": 3952 }, { "epoch": 0.55, "learning_rate": 8.897760460252655e-06, "loss": 0.8452, "step": 3953 }, { "epoch": 0.55, "learning_rate": 8.893289069407033e-06, "loss": 0.8711, "step": 3954 }, { "epoch": 0.55, "learning_rate": 8.888817902562364e-06, "loss": 0.811, "step": 3955 }, { "epoch": 0.55, "learning_rate": 8.884346960623616e-06, "loss": 0.816, "step": 3956 }, { "epoch": 0.55, "learning_rate": 8.879876244495713e-06, "loss": 0.8508, "step": 3957 }, { "epoch": 0.55, "learning_rate": 8.875405755083552e-06, "loss": 0.8262, "step": 3958 }, { "epoch": 0.55, "learning_rate": 8.870935493291955e-06, "loss": 0.8076, "step": 3959 }, { "epoch": 0.55, "learning_rate": 8.866465460025728e-06, "loss": 0.7803, "step": 3960 }, { "epoch": 0.55, "learning_rate": 8.86199565618961e-06, "loss": 0.7961, "step": 3961 }, { "epoch": 0.55, "learning_rate": 8.857526082688297e-06, "loss": 0.8179, "step": 3962 }, { "epoch": 0.55, "learning_rate": 8.853056740426447e-06, "loss": 0.8862, "step": 3963 }, { "epoch": 0.55, "learning_rate": 8.848587630308661e-06, "loss": 0.8748, "step": 3964 }, { "epoch": 0.55, "learning_rate": 8.844118753239503e-06, "loss": 0.5415, "step": 3965 }, { "epoch": 0.55, "learning_rate": 8.839650110123483e-06, "loss": 0.8643, "step": 3966 }, { "epoch": 0.55, "learning_rate": 8.835181701865057e-06, "loss": 0.833, "step": 3967 }, { "epoch": 0.55, "learning_rate": 8.830713529368654e-06, "loss": 0.8372, "step": 3968 }, { "epoch": 0.55, "learning_rate": 8.82624559353863e-06, "loss": 0.7974, "step": 3969 }, { "epoch": 0.55, "learning_rate": 8.82177789527932e-06, "loss": 0.7842, "step": 3970 }, { "epoch": 0.55, "learning_rate": 8.817310435494988e-06, "loss": 0.8479, "step": 3971 }, { "epoch": 0.55, "learning_rate": 8.812843215089857e-06, "loss": 0.8301, "step": 3972 }, { "epoch": 0.55, "learning_rate": 8.80837623496811e-06, "loss": 0.7808, "step": 3973 }, { "epoch": 0.55, "learning_rate": 8.803909496033866e-06, "loss": 0.8835, "step": 3974 }, { "epoch": 0.55, "learning_rate": 8.799442999191214e-06, "loss": 0.8816, "step": 3975 }, { "epoch": 0.55, "learning_rate": 8.794976745344176e-06, "loss": 0.801, "step": 3976 }, { "epoch": 0.55, "learning_rate": 8.790510735396731e-06, "loss": 0.6608, "step": 3977 }, { "epoch": 0.55, "learning_rate": 8.78604497025282e-06, "loss": 0.7629, "step": 3978 }, { "epoch": 0.55, "learning_rate": 8.781579450816312e-06, "loss": 0.8323, "step": 3979 }, { "epoch": 0.55, "learning_rate": 8.77711417799105e-06, "loss": 0.8145, "step": 3980 }, { "epoch": 0.55, "learning_rate": 8.772649152680811e-06, "loss": 0.8508, "step": 3981 }, { "epoch": 0.55, "learning_rate": 8.768184375789323e-06, "loss": 0.8036, "step": 3982 }, { "epoch": 0.55, "learning_rate": 8.763719848220275e-06, "loss": 0.8601, "step": 3983 }, { "epoch": 0.55, "learning_rate": 8.75925557087729e-06, "loss": 0.7341, "step": 3984 }, { "epoch": 0.55, "learning_rate": 8.754791544663959e-06, "loss": 0.8169, "step": 3985 }, { "epoch": 0.55, "learning_rate": 8.750327770483804e-06, "loss": 0.8531, "step": 3986 }, { "epoch": 0.55, "learning_rate": 8.7458642492403e-06, "loss": 0.8445, "step": 3987 }, { "epoch": 0.55, "learning_rate": 8.741400981836888e-06, "loss": 0.8668, "step": 3988 }, { "epoch": 0.55, "learning_rate": 8.736937969176927e-06, "loss": 0.8164, "step": 3989 }, { "epoch": 0.55, "learning_rate": 8.732475212163757e-06, "loss": 0.7631, "step": 3990 }, { "epoch": 0.55, "learning_rate": 8.728012711700643e-06, "loss": 0.9087, "step": 3991 }, { "epoch": 0.55, "learning_rate": 8.723550468690803e-06, "loss": 0.7717, "step": 3992 }, { "epoch": 0.55, "learning_rate": 8.719088484037413e-06, "loss": 0.5569, "step": 3993 }, { "epoch": 0.55, "learning_rate": 8.714626758643581e-06, "loss": 0.8914, "step": 3994 }, { "epoch": 0.55, "learning_rate": 8.71016529341238e-06, "loss": 0.8394, "step": 3995 }, { "epoch": 0.56, "learning_rate": 8.705704089246816e-06, "loss": 0.7371, "step": 3996 }, { "epoch": 0.56, "learning_rate": 8.701243147049844e-06, "loss": 0.9067, "step": 3997 }, { "epoch": 0.56, "learning_rate": 8.69678246772438e-06, "loss": 0.8813, "step": 3998 }, { "epoch": 0.56, "learning_rate": 8.692322052173265e-06, "loss": 0.845, "step": 3999 }, { "epoch": 0.56, "learning_rate": 8.687861901299306e-06, "loss": 0.8179, "step": 4000 }, { "epoch": 0.56, "learning_rate": 8.683402016005246e-06, "loss": 0.9126, "step": 4001 }, { "epoch": 0.56, "learning_rate": 8.67894239719377e-06, "loss": 0.8596, "step": 4002 }, { "epoch": 0.56, "learning_rate": 8.674483045767526e-06, "loss": 0.8342, "step": 4003 }, { "epoch": 0.56, "learning_rate": 8.670023962629088e-06, "loss": 0.8582, "step": 4004 }, { "epoch": 0.56, "learning_rate": 8.665565148680994e-06, "loss": 0.8479, "step": 4005 }, { "epoch": 0.56, "learning_rate": 8.661106604825715e-06, "loss": 0.8752, "step": 4006 }, { "epoch": 0.56, "learning_rate": 8.656648331965665e-06, "loss": 0.821, "step": 4007 }, { "epoch": 0.56, "learning_rate": 8.652190331003218e-06, "loss": 0.8201, "step": 4008 }, { "epoch": 0.56, "learning_rate": 8.647732602840675e-06, "loss": 0.8525, "step": 4009 }, { "epoch": 0.56, "learning_rate": 8.643275148380302e-06, "loss": 0.5896, "step": 4010 }, { "epoch": 0.56, "learning_rate": 8.638817968524292e-06, "loss": 0.8545, "step": 4011 }, { "epoch": 0.56, "learning_rate": 8.634361064174785e-06, "loss": 0.7389, "step": 4012 }, { "epoch": 0.56, "learning_rate": 8.62990443623388e-06, "loss": 0.9004, "step": 4013 }, { "epoch": 0.56, "learning_rate": 8.625448085603596e-06, "loss": 0.8555, "step": 4014 }, { "epoch": 0.56, "learning_rate": 8.620992013185922e-06, "loss": 0.8542, "step": 4015 }, { "epoch": 0.56, "learning_rate": 8.61653621988277e-06, "loss": 0.8262, "step": 4016 }, { "epoch": 0.56, "learning_rate": 8.612080706596001e-06, "loss": 0.7954, "step": 4017 }, { "epoch": 0.56, "learning_rate": 8.607625474227432e-06, "loss": 0.929, "step": 4018 }, { "epoch": 0.56, "learning_rate": 8.6031705236788e-06, "loss": 0.7871, "step": 4019 }, { "epoch": 0.56, "learning_rate": 8.598715855851808e-06, "loss": 0.8408, "step": 4020 }, { "epoch": 0.56, "learning_rate": 8.594261471648087e-06, "loss": 0.8687, "step": 4021 }, { "epoch": 0.56, "learning_rate": 8.589807371969212e-06, "loss": 0.8088, "step": 4022 }, { "epoch": 0.56, "learning_rate": 8.585353557716712e-06, "loss": 0.8225, "step": 4023 }, { "epoch": 0.56, "learning_rate": 8.58090002979204e-06, "loss": 0.8533, "step": 4024 }, { "epoch": 0.56, "learning_rate": 8.576446789096607e-06, "loss": 0.8611, "step": 4025 }, { "epoch": 0.56, "learning_rate": 8.571993836531761e-06, "loss": 0.8765, "step": 4026 }, { "epoch": 0.56, "learning_rate": 8.56754117299878e-06, "loss": 0.7716, "step": 4027 }, { "epoch": 0.56, "learning_rate": 8.563088799398906e-06, "loss": 0.7943, "step": 4028 }, { "epoch": 0.56, "learning_rate": 8.558636716633304e-06, "loss": 0.8674, "step": 4029 }, { "epoch": 0.56, "learning_rate": 8.554184925603086e-06, "loss": 0.8535, "step": 4030 }, { "epoch": 0.56, "learning_rate": 8.54973342720931e-06, "loss": 0.8484, "step": 4031 }, { "epoch": 0.56, "learning_rate": 8.545282222352959e-06, "loss": 0.8501, "step": 4032 }, { "epoch": 0.56, "learning_rate": 8.540831311934983e-06, "loss": 0.7808, "step": 4033 }, { "epoch": 0.56, "learning_rate": 8.536380696856244e-06, "loss": 0.8694, "step": 4034 }, { "epoch": 0.56, "learning_rate": 8.531930378017563e-06, "loss": 0.8381, "step": 4035 }, { "epoch": 0.56, "learning_rate": 8.527480356319696e-06, "loss": 0.8491, "step": 4036 }, { "epoch": 0.56, "learning_rate": 8.523030632663332e-06, "loss": 0.7864, "step": 4037 }, { "epoch": 0.56, "learning_rate": 8.518581207949114e-06, "loss": 0.8271, "step": 4038 }, { "epoch": 0.56, "learning_rate": 8.514132083077611e-06, "loss": 0.8501, "step": 4039 }, { "epoch": 0.56, "learning_rate": 8.509683258949337e-06, "loss": 0.8389, "step": 4040 }, { "epoch": 0.56, "learning_rate": 8.505234736464748e-06, "loss": 0.7676, "step": 4041 }, { "epoch": 0.56, "learning_rate": 8.500786516524228e-06, "loss": 0.557, "step": 4042 }, { "epoch": 0.56, "learning_rate": 8.496338600028119e-06, "loss": 0.8413, "step": 4043 }, { "epoch": 0.56, "learning_rate": 8.49189098787668e-06, "loss": 0.8882, "step": 4044 }, { "epoch": 0.56, "learning_rate": 8.48744368097012e-06, "loss": 0.907, "step": 4045 }, { "epoch": 0.56, "learning_rate": 8.482996680208591e-06, "loss": 0.8679, "step": 4046 }, { "epoch": 0.56, "learning_rate": 8.478549986492168e-06, "loss": 0.8347, "step": 4047 }, { "epoch": 0.56, "learning_rate": 8.474103600720878e-06, "loss": 0.8752, "step": 4048 }, { "epoch": 0.56, "learning_rate": 8.469657523794678e-06, "loss": 0.8538, "step": 4049 }, { "epoch": 0.56, "learning_rate": 8.465211756613466e-06, "loss": 0.5721, "step": 4050 }, { "epoch": 0.56, "learning_rate": 8.460766300077075e-06, "loss": 0.8093, "step": 4051 }, { "epoch": 0.56, "learning_rate": 8.456321155085276e-06, "loss": 0.9368, "step": 4052 }, { "epoch": 0.56, "learning_rate": 8.451876322537777e-06, "loss": 0.8257, "step": 4053 }, { "epoch": 0.56, "learning_rate": 8.447431803334222e-06, "loss": 0.8499, "step": 4054 }, { "epoch": 0.56, "learning_rate": 8.442987598374194e-06, "loss": 0.8479, "step": 4055 }, { "epoch": 0.56, "learning_rate": 8.438543708557212e-06, "loss": 0.812, "step": 4056 }, { "epoch": 0.56, "learning_rate": 8.434100134782726e-06, "loss": 0.8572, "step": 4057 }, { "epoch": 0.56, "learning_rate": 8.42965687795013e-06, "loss": 0.7751, "step": 4058 }, { "epoch": 0.56, "learning_rate": 8.425213938958745e-06, "loss": 0.8284, "step": 4059 }, { "epoch": 0.56, "learning_rate": 8.420771318707837e-06, "loss": 0.8739, "step": 4060 }, { "epoch": 0.56, "learning_rate": 8.416329018096603e-06, "loss": 0.8252, "step": 4061 }, { "epoch": 0.56, "learning_rate": 8.41188703802417e-06, "loss": 0.8386, "step": 4062 }, { "epoch": 0.56, "learning_rate": 8.407445379389613e-06, "loss": 0.7706, "step": 4063 }, { "epoch": 0.56, "learning_rate": 8.403004043091927e-06, "loss": 0.8718, "step": 4064 }, { "epoch": 0.56, "learning_rate": 8.398563030030054e-06, "loss": 0.8564, "step": 4065 }, { "epoch": 0.56, "learning_rate": 8.394122341102863e-06, "loss": 0.8579, "step": 4066 }, { "epoch": 0.56, "learning_rate": 8.389681977209165e-06, "loss": 0.8328, "step": 4067 }, { "epoch": 0.57, "learning_rate": 8.385241939247694e-06, "loss": 0.8225, "step": 4068 }, { "epoch": 0.57, "learning_rate": 8.380802228117128e-06, "loss": 0.8081, "step": 4069 }, { "epoch": 0.57, "learning_rate": 8.376362844716074e-06, "loss": 0.6183, "step": 4070 }, { "epoch": 0.57, "learning_rate": 8.371923789943072e-06, "loss": 0.7893, "step": 4071 }, { "epoch": 0.57, "learning_rate": 8.367485064696602e-06, "loss": 0.7908, "step": 4072 }, { "epoch": 0.57, "learning_rate": 8.36304666987507e-06, "loss": 0.8284, "step": 4073 }, { "epoch": 0.57, "learning_rate": 8.358608606376814e-06, "loss": 0.8191, "step": 4074 }, { "epoch": 0.57, "learning_rate": 8.354170875100118e-06, "loss": 0.8926, "step": 4075 }, { "epoch": 0.57, "learning_rate": 8.349733476943178e-06, "loss": 0.9172, "step": 4076 }, { "epoch": 0.57, "learning_rate": 8.345296412804145e-06, "loss": 0.7927, "step": 4077 }, { "epoch": 0.57, "learning_rate": 8.340859683581084e-06, "loss": 0.8386, "step": 4078 }, { "epoch": 0.57, "learning_rate": 8.336423290172002e-06, "loss": 0.8076, "step": 4079 }, { "epoch": 0.57, "learning_rate": 8.331987233474837e-06, "loss": 0.8379, "step": 4080 }, { "epoch": 0.57, "learning_rate": 8.327551514387451e-06, "loss": 0.8027, "step": 4081 }, { "epoch": 0.57, "learning_rate": 8.323116133807657e-06, "loss": 0.8, "step": 4082 }, { "epoch": 0.57, "learning_rate": 8.318681092633173e-06, "loss": 0.6039, "step": 4083 }, { "epoch": 0.57, "learning_rate": 8.314246391761671e-06, "loss": 0.8877, "step": 4084 }, { "epoch": 0.57, "learning_rate": 8.309812032090744e-06, "loss": 0.7839, "step": 4085 }, { "epoch": 0.57, "learning_rate": 8.30537801451791e-06, "loss": 0.8696, "step": 4086 }, { "epoch": 0.57, "learning_rate": 8.300944339940633e-06, "loss": 0.5767, "step": 4087 }, { "epoch": 0.57, "learning_rate": 8.296511009256296e-06, "loss": 0.8826, "step": 4088 }, { "epoch": 0.57, "learning_rate": 8.292078023362214e-06, "loss": 0.6187, "step": 4089 }, { "epoch": 0.57, "learning_rate": 8.28764538315564e-06, "loss": 0.8223, "step": 4090 }, { "epoch": 0.57, "learning_rate": 8.283213089533742e-06, "loss": 0.8694, "step": 4091 }, { "epoch": 0.57, "learning_rate": 8.278781143393634e-06, "loss": 0.8774, "step": 4092 }, { "epoch": 0.57, "learning_rate": 8.274349545632353e-06, "loss": 0.8156, "step": 4093 }, { "epoch": 0.57, "learning_rate": 8.269918297146859e-06, "loss": 0.8035, "step": 4094 }, { "epoch": 0.57, "learning_rate": 8.265487398834054e-06, "loss": 0.8301, "step": 4095 }, { "epoch": 0.57, "learning_rate": 8.261056851590753e-06, "loss": 0.8215, "step": 4096 }, { "epoch": 0.57, "learning_rate": 8.256626656313722e-06, "loss": 0.8505, "step": 4097 }, { "epoch": 0.57, "learning_rate": 8.252196813899635e-06, "loss": 0.8701, "step": 4098 }, { "epoch": 0.57, "learning_rate": 8.247767325245103e-06, "loss": 0.7834, "step": 4099 }, { "epoch": 0.57, "learning_rate": 8.243338191246667e-06, "loss": 0.8528, "step": 4100 }, { "epoch": 0.57, "learning_rate": 8.238909412800792e-06, "loss": 0.8242, "step": 4101 }, { "epoch": 0.57, "learning_rate": 8.234480990803879e-06, "loss": 0.8416, "step": 4102 }, { "epoch": 0.57, "learning_rate": 8.230052926152248e-06, "loss": 0.9036, "step": 4103 }, { "epoch": 0.57, "learning_rate": 8.225625219742144e-06, "loss": 0.7949, "step": 4104 }, { "epoch": 0.57, "learning_rate": 8.221197872469757e-06, "loss": 0.6085, "step": 4105 }, { "epoch": 0.57, "learning_rate": 8.21677088523118e-06, "loss": 0.8702, "step": 4106 }, { "epoch": 0.57, "learning_rate": 8.212344258922457e-06, "loss": 0.8384, "step": 4107 }, { "epoch": 0.57, "learning_rate": 8.207917994439545e-06, "loss": 0.8372, "step": 4108 }, { "epoch": 0.57, "learning_rate": 8.203492092678322e-06, "loss": 0.8518, "step": 4109 }, { "epoch": 0.57, "learning_rate": 8.199066554534615e-06, "loss": 0.7715, "step": 4110 }, { "epoch": 0.57, "learning_rate": 8.194641380904148e-06, "loss": 0.873, "step": 4111 }, { "epoch": 0.57, "learning_rate": 8.190216572682603e-06, "loss": 0.8445, "step": 4112 }, { "epoch": 0.57, "learning_rate": 8.185792130765563e-06, "loss": 0.7944, "step": 4113 }, { "epoch": 0.57, "learning_rate": 8.181368056048541e-06, "loss": 0.8274, "step": 4114 }, { "epoch": 0.57, "learning_rate": 8.176944349426991e-06, "loss": 0.6234, "step": 4115 }, { "epoch": 0.57, "learning_rate": 8.172521011796273e-06, "loss": 0.9148, "step": 4116 }, { "epoch": 0.57, "learning_rate": 8.168098044051688e-06, "loss": 0.8372, "step": 4117 }, { "epoch": 0.57, "learning_rate": 8.163675447088453e-06, "loss": 0.8071, "step": 4118 }, { "epoch": 0.57, "learning_rate": 8.159253221801706e-06, "loss": 0.7471, "step": 4119 }, { "epoch": 0.57, "learning_rate": 8.154831369086526e-06, "loss": 0.8625, "step": 4120 }, { "epoch": 0.57, "learning_rate": 8.1504098898379e-06, "loss": 0.88, "step": 4121 }, { "epoch": 0.57, "learning_rate": 8.145988784950748e-06, "loss": 0.8625, "step": 4122 }, { "epoch": 0.57, "learning_rate": 8.141568055319916e-06, "loss": 0.7865, "step": 4123 }, { "epoch": 0.57, "learning_rate": 8.13714770184016e-06, "loss": 0.7673, "step": 4124 }, { "epoch": 0.57, "learning_rate": 8.132727725406182e-06, "loss": 0.757, "step": 4125 }, { "epoch": 0.57, "learning_rate": 8.128308126912585e-06, "loss": 0.8667, "step": 4126 }, { "epoch": 0.57, "learning_rate": 8.123888907253918e-06, "loss": 0.772, "step": 4127 }, { "epoch": 0.57, "learning_rate": 8.119470067324634e-06, "loss": 0.8481, "step": 4128 }, { "epoch": 0.57, "learning_rate": 8.115051608019114e-06, "loss": 0.8608, "step": 4129 }, { "epoch": 0.57, "learning_rate": 8.110633530231673e-06, "loss": 0.8599, "step": 4130 }, { "epoch": 0.57, "learning_rate": 8.106215834856533e-06, "loss": 0.8259, "step": 4131 }, { "epoch": 0.57, "learning_rate": 8.101798522787853e-06, "loss": 0.8577, "step": 4132 }, { "epoch": 0.57, "learning_rate": 8.097381594919706e-06, "loss": 0.8254, "step": 4133 }, { "epoch": 0.57, "learning_rate": 8.092965052146082e-06, "loss": 0.8381, "step": 4134 }, { "epoch": 0.57, "learning_rate": 8.088548895360909e-06, "loss": 0.5988, "step": 4135 }, { "epoch": 0.57, "learning_rate": 8.084133125458019e-06, "loss": 0.8733, "step": 4136 }, { "epoch": 0.57, "learning_rate": 8.079717743331183e-06, "loss": 0.855, "step": 4137 }, { "epoch": 0.57, "learning_rate": 8.075302749874081e-06, "loss": 0.8486, "step": 4138 }, { "epoch": 0.57, "learning_rate": 8.070888145980314e-06, "loss": 0.6088, "step": 4139 }, { "epoch": 0.58, "learning_rate": 8.066473932543418e-06, "loss": 0.8613, "step": 4140 }, { "epoch": 0.58, "learning_rate": 8.06206011045683e-06, "loss": 0.8477, "step": 4141 }, { "epoch": 0.58, "learning_rate": 8.057646680613926e-06, "loss": 0.7646, "step": 4142 }, { "epoch": 0.58, "learning_rate": 8.053233643907993e-06, "loss": 0.8406, "step": 4143 }, { "epoch": 0.58, "learning_rate": 8.048821001232235e-06, "loss": 0.6252, "step": 4144 }, { "epoch": 0.58, "learning_rate": 8.04440875347979e-06, "loss": 0.7507, "step": 4145 }, { "epoch": 0.58, "learning_rate": 8.0399969015437e-06, "loss": 0.8142, "step": 4146 }, { "epoch": 0.58, "learning_rate": 8.03558544631694e-06, "loss": 0.8118, "step": 4147 }, { "epoch": 0.58, "learning_rate": 8.031174388692397e-06, "loss": 0.853, "step": 4148 }, { "epoch": 0.58, "learning_rate": 8.026763729562877e-06, "loss": 0.8354, "step": 4149 }, { "epoch": 0.58, "learning_rate": 8.022353469821113e-06, "loss": 0.8313, "step": 4150 }, { "epoch": 0.58, "learning_rate": 8.017943610359745e-06, "loss": 0.8733, "step": 4151 }, { "epoch": 0.58, "learning_rate": 8.013534152071349e-06, "loss": 0.8512, "step": 4152 }, { "epoch": 0.58, "learning_rate": 8.009125095848403e-06, "loss": 0.8245, "step": 4153 }, { "epoch": 0.58, "learning_rate": 8.00471644258331e-06, "loss": 0.8191, "step": 4154 }, { "epoch": 0.58, "learning_rate": 8.000308193168395e-06, "loss": 0.8535, "step": 4155 }, { "epoch": 0.58, "learning_rate": 7.995900348495896e-06, "loss": 0.8181, "step": 4156 }, { "epoch": 0.58, "learning_rate": 7.991492909457976e-06, "loss": 0.8853, "step": 4157 }, { "epoch": 0.58, "learning_rate": 7.987085876946708e-06, "loss": 0.8215, "step": 4158 }, { "epoch": 0.58, "learning_rate": 7.982679251854081e-06, "loss": 0.8298, "step": 4159 }, { "epoch": 0.58, "learning_rate": 7.978273035072016e-06, "loss": 0.8516, "step": 4160 }, { "epoch": 0.58, "learning_rate": 7.973867227492333e-06, "loss": 0.8486, "step": 4161 }, { "epoch": 0.58, "learning_rate": 7.969461830006788e-06, "loss": 0.8831, "step": 4162 }, { "epoch": 0.58, "learning_rate": 7.965056843507036e-06, "loss": 0.8102, "step": 4163 }, { "epoch": 0.58, "learning_rate": 7.960652268884655e-06, "loss": 0.8311, "step": 4164 }, { "epoch": 0.58, "learning_rate": 7.95624810703115e-06, "loss": 0.8127, "step": 4165 }, { "epoch": 0.58, "learning_rate": 7.951844358837927e-06, "loss": 0.9299, "step": 4166 }, { "epoch": 0.58, "learning_rate": 7.947441025196318e-06, "loss": 0.594, "step": 4167 }, { "epoch": 0.58, "learning_rate": 7.943038106997572e-06, "loss": 0.8433, "step": 4168 }, { "epoch": 0.58, "learning_rate": 7.93863560513284e-06, "loss": 0.8667, "step": 4169 }, { "epoch": 0.58, "learning_rate": 7.93423352049321e-06, "loss": 0.9204, "step": 4170 }, { "epoch": 0.58, "learning_rate": 7.929831853969662e-06, "loss": 0.8953, "step": 4171 }, { "epoch": 0.58, "learning_rate": 7.92543060645312e-06, "loss": 0.8953, "step": 4172 }, { "epoch": 0.58, "learning_rate": 7.921029778834396e-06, "loss": 0.822, "step": 4173 }, { "epoch": 0.58, "learning_rate": 7.916629372004228e-06, "loss": 0.8298, "step": 4174 }, { "epoch": 0.58, "learning_rate": 7.912229386853274e-06, "loss": 0.8477, "step": 4175 }, { "epoch": 0.58, "learning_rate": 7.907829824272095e-06, "loss": 0.8811, "step": 4176 }, { "epoch": 0.58, "learning_rate": 7.903430685151182e-06, "loss": 0.9321, "step": 4177 }, { "epoch": 0.58, "learning_rate": 7.899031970380926e-06, "loss": 0.8652, "step": 4178 }, { "epoch": 0.58, "learning_rate": 7.894633680851633e-06, "loss": 0.8696, "step": 4179 }, { "epoch": 0.58, "learning_rate": 7.890235817453537e-06, "loss": 0.6492, "step": 4180 }, { "epoch": 0.58, "learning_rate": 7.885838381076768e-06, "loss": 0.8718, "step": 4181 }, { "epoch": 0.58, "learning_rate": 7.881441372611382e-06, "loss": 0.8027, "step": 4182 }, { "epoch": 0.58, "learning_rate": 7.87704479294734e-06, "loss": 0.8884, "step": 4183 }, { "epoch": 0.58, "learning_rate": 7.872648642974529e-06, "loss": 0.866, "step": 4184 }, { "epoch": 0.58, "learning_rate": 7.868252923582733e-06, "loss": 0.8733, "step": 4185 }, { "epoch": 0.58, "learning_rate": 7.863857635661654e-06, "loss": 0.8528, "step": 4186 }, { "epoch": 0.58, "learning_rate": 7.859462780100915e-06, "loss": 0.7871, "step": 4187 }, { "epoch": 0.58, "learning_rate": 7.85506835779004e-06, "loss": 0.8862, "step": 4188 }, { "epoch": 0.58, "learning_rate": 7.850674369618478e-06, "loss": 0.8047, "step": 4189 }, { "epoch": 0.58, "learning_rate": 7.846280816475576e-06, "loss": 0.7854, "step": 4190 }, { "epoch": 0.58, "learning_rate": 7.841887699250599e-06, "loss": 0.6254, "step": 4191 }, { "epoch": 0.58, "learning_rate": 7.837495018832731e-06, "loss": 0.8174, "step": 4192 }, { "epoch": 0.58, "learning_rate": 7.833102776111053e-06, "loss": 0.8381, "step": 4193 }, { "epoch": 0.58, "learning_rate": 7.828710971974575e-06, "loss": 0.8757, "step": 4194 }, { "epoch": 0.58, "learning_rate": 7.824319607312202e-06, "loss": 0.8376, "step": 4195 }, { "epoch": 0.58, "learning_rate": 7.819928683012755e-06, "loss": 0.835, "step": 4196 }, { "epoch": 0.58, "learning_rate": 7.815538199964976e-06, "loss": 0.8826, "step": 4197 }, { "epoch": 0.58, "learning_rate": 7.811148159057497e-06, "loss": 0.8315, "step": 4198 }, { "epoch": 0.58, "learning_rate": 7.806758561178885e-06, "loss": 0.8359, "step": 4199 }, { "epoch": 0.58, "learning_rate": 7.802369407217602e-06, "loss": 0.8979, "step": 4200 }, { "epoch": 0.58, "learning_rate": 7.797980698062016e-06, "loss": 0.8174, "step": 4201 }, { "epoch": 0.58, "learning_rate": 7.79359243460042e-06, "loss": 0.8157, "step": 4202 }, { "epoch": 0.58, "learning_rate": 7.789204617721004e-06, "loss": 0.7743, "step": 4203 }, { "epoch": 0.58, "learning_rate": 7.78481724831188e-06, "loss": 0.822, "step": 4204 }, { "epoch": 0.58, "learning_rate": 7.780430327261055e-06, "loss": 0.8738, "step": 4205 }, { "epoch": 0.58, "learning_rate": 7.776043855456453e-06, "loss": 0.8962, "step": 4206 }, { "epoch": 0.58, "learning_rate": 7.771657833785912e-06, "loss": 0.8513, "step": 4207 }, { "epoch": 0.58, "learning_rate": 7.767272263137164e-06, "loss": 0.8359, "step": 4208 }, { "epoch": 0.58, "learning_rate": 7.76288714439787e-06, "loss": 0.8108, "step": 4209 }, { "epoch": 0.58, "learning_rate": 7.758502478455584e-06, "loss": 0.824, "step": 4210 }, { "epoch": 0.58, "learning_rate": 7.754118266197764e-06, "loss": 0.8235, "step": 4211 }, { "epoch": 0.59, "learning_rate": 7.7497345085118e-06, "loss": 0.8423, "step": 4212 }, { "epoch": 0.59, "learning_rate": 7.745351206284962e-06, "loss": 0.8921, "step": 4213 }, { "epoch": 0.59, "learning_rate": 7.740968360404452e-06, "loss": 0.7947, "step": 4214 }, { "epoch": 0.59, "learning_rate": 7.736585971757365e-06, "loss": 0.7834, "step": 4215 }, { "epoch": 0.59, "learning_rate": 7.732204041230699e-06, "loss": 0.8591, "step": 4216 }, { "epoch": 0.59, "learning_rate": 7.727822569711378e-06, "loss": 0.8259, "step": 4217 }, { "epoch": 0.59, "learning_rate": 7.723441558086216e-06, "loss": 0.8508, "step": 4218 }, { "epoch": 0.59, "learning_rate": 7.719061007241944e-06, "loss": 0.8606, "step": 4219 }, { "epoch": 0.59, "learning_rate": 7.714680918065196e-06, "loss": 0.8699, "step": 4220 }, { "epoch": 0.59, "learning_rate": 7.710301291442505e-06, "loss": 0.8862, "step": 4221 }, { "epoch": 0.59, "learning_rate": 7.705922128260328e-06, "loss": 0.7867, "step": 4222 }, { "epoch": 0.59, "learning_rate": 7.701543429405011e-06, "loss": 0.9041, "step": 4223 }, { "epoch": 0.59, "learning_rate": 7.69716519576282e-06, "loss": 0.8005, "step": 4224 }, { "epoch": 0.59, "learning_rate": 7.692787428219915e-06, "loss": 0.7974, "step": 4225 }, { "epoch": 0.59, "learning_rate": 7.688410127662363e-06, "loss": 0.8835, "step": 4226 }, { "epoch": 0.59, "learning_rate": 7.68403329497615e-06, "loss": 0.5547, "step": 4227 }, { "epoch": 0.59, "learning_rate": 7.679656931047148e-06, "loss": 0.8638, "step": 4228 }, { "epoch": 0.59, "learning_rate": 7.675281036761153e-06, "loss": 0.7534, "step": 4229 }, { "epoch": 0.59, "learning_rate": 7.67090561300385e-06, "loss": 0.9158, "step": 4230 }, { "epoch": 0.59, "learning_rate": 7.666530660660832e-06, "loss": 0.8425, "step": 4231 }, { "epoch": 0.59, "learning_rate": 7.66215618061761e-06, "loss": 0.8015, "step": 4232 }, { "epoch": 0.59, "learning_rate": 7.657782173759579e-06, "loss": 0.8369, "step": 4233 }, { "epoch": 0.59, "learning_rate": 7.653408640972056e-06, "loss": 0.8486, "step": 4234 }, { "epoch": 0.59, "learning_rate": 7.649035583140253e-06, "loss": 0.9124, "step": 4235 }, { "epoch": 0.59, "learning_rate": 7.64466300114928e-06, "loss": 0.8669, "step": 4236 }, { "epoch": 0.59, "learning_rate": 7.640290895884171e-06, "loss": 0.8096, "step": 4237 }, { "epoch": 0.59, "learning_rate": 7.635919268229838e-06, "loss": 0.7834, "step": 4238 }, { "epoch": 0.59, "learning_rate": 7.631548119071119e-06, "loss": 0.8484, "step": 4239 }, { "epoch": 0.59, "learning_rate": 7.62717744929274e-06, "loss": 0.8887, "step": 4240 }, { "epoch": 0.59, "learning_rate": 7.622807259779332e-06, "loss": 0.8269, "step": 4241 }, { "epoch": 0.59, "learning_rate": 7.618437551415441e-06, "loss": 0.8853, "step": 4242 }, { "epoch": 0.59, "learning_rate": 7.614068325085495e-06, "loss": 0.8496, "step": 4243 }, { "epoch": 0.59, "learning_rate": 7.609699581673846e-06, "loss": 0.8535, "step": 4244 }, { "epoch": 0.59, "learning_rate": 7.605331322064735e-06, "loss": 0.8335, "step": 4245 }, { "epoch": 0.59, "learning_rate": 7.600963547142304e-06, "loss": 0.8074, "step": 4246 }, { "epoch": 0.59, "learning_rate": 7.5965962577906075e-06, "loss": 0.8665, "step": 4247 }, { "epoch": 0.59, "learning_rate": 7.592229454893588e-06, "loss": 0.886, "step": 4248 }, { "epoch": 0.59, "learning_rate": 7.587863139335106e-06, "loss": 0.8605, "step": 4249 }, { "epoch": 0.59, "learning_rate": 7.583497311998909e-06, "loss": 0.8185, "step": 4250 }, { "epoch": 0.59, "learning_rate": 7.579131973768645e-06, "loss": 0.8542, "step": 4251 }, { "epoch": 0.59, "learning_rate": 7.574767125527882e-06, "loss": 0.8569, "step": 4252 }, { "epoch": 0.59, "learning_rate": 7.570402768160066e-06, "loss": 0.8329, "step": 4253 }, { "epoch": 0.59, "learning_rate": 7.566038902548557e-06, "loss": 0.783, "step": 4254 }, { "epoch": 0.59, "learning_rate": 7.561675529576612e-06, "loss": 0.8105, "step": 4255 }, { "epoch": 0.59, "learning_rate": 7.557312650127384e-06, "loss": 0.842, "step": 4256 }, { "epoch": 0.59, "learning_rate": 7.552950265083938e-06, "loss": 0.8767, "step": 4257 }, { "epoch": 0.59, "learning_rate": 7.548588375329225e-06, "loss": 0.8635, "step": 4258 }, { "epoch": 0.59, "learning_rate": 7.544226981746103e-06, "loss": 0.8645, "step": 4259 }, { "epoch": 0.59, "learning_rate": 7.539866085217331e-06, "loss": 0.8357, "step": 4260 }, { "epoch": 0.59, "learning_rate": 7.535505686625559e-06, "loss": 0.8374, "step": 4261 }, { "epoch": 0.59, "learning_rate": 7.531145786853352e-06, "loss": 0.8572, "step": 4262 }, { "epoch": 0.59, "learning_rate": 7.526786386783156e-06, "loss": 0.8408, "step": 4263 }, { "epoch": 0.59, "learning_rate": 7.522427487297326e-06, "loss": 0.7791, "step": 4264 }, { "epoch": 0.59, "learning_rate": 7.518069089278116e-06, "loss": 0.8145, "step": 4265 }, { "epoch": 0.59, "learning_rate": 7.513711193607672e-06, "loss": 0.5841, "step": 4266 }, { "epoch": 0.59, "learning_rate": 7.509353801168046e-06, "loss": 0.8469, "step": 4267 }, { "epoch": 0.59, "learning_rate": 7.504996912841185e-06, "loss": 0.8394, "step": 4268 }, { "epoch": 0.59, "learning_rate": 7.50064052950893e-06, "loss": 0.8562, "step": 4269 }, { "epoch": 0.59, "learning_rate": 7.49628465205303e-06, "loss": 0.6097, "step": 4270 }, { "epoch": 0.59, "learning_rate": 7.491929281355114e-06, "loss": 0.8396, "step": 4271 }, { "epoch": 0.59, "learning_rate": 7.487574418296733e-06, "loss": 0.8579, "step": 4272 }, { "epoch": 0.59, "learning_rate": 7.483220063759311e-06, "loss": 0.8159, "step": 4273 }, { "epoch": 0.59, "learning_rate": 7.478866218624184e-06, "loss": 0.8585, "step": 4274 }, { "epoch": 0.59, "learning_rate": 7.474512883772583e-06, "loss": 0.6013, "step": 4275 }, { "epoch": 0.59, "learning_rate": 7.4701600600856296e-06, "loss": 0.9055, "step": 4276 }, { "epoch": 0.59, "learning_rate": 7.465807748444347e-06, "loss": 0.8447, "step": 4277 }, { "epoch": 0.59, "learning_rate": 7.461455949729653e-06, "loss": 0.8364, "step": 4278 }, { "epoch": 0.59, "learning_rate": 7.457104664822361e-06, "loss": 0.7937, "step": 4279 }, { "epoch": 0.59, "learning_rate": 7.452753894603187e-06, "loss": 0.7677, "step": 4280 }, { "epoch": 0.59, "learning_rate": 7.448403639952732e-06, "loss": 0.8401, "step": 4281 }, { "epoch": 0.59, "learning_rate": 7.444053901751498e-06, "loss": 0.864, "step": 4282 }, { "epoch": 0.59, "learning_rate": 7.439704680879884e-06, "loss": 0.7926, "step": 4283 }, { "epoch": 0.6, "learning_rate": 7.435355978218184e-06, "loss": 0.8357, "step": 4284 }, { "epoch": 0.6, "learning_rate": 7.431007794646587e-06, "loss": 0.9414, "step": 4285 }, { "epoch": 0.6, "learning_rate": 7.426660131045169e-06, "loss": 0.8406, "step": 4286 }, { "epoch": 0.6, "learning_rate": 7.422312988293914e-06, "loss": 0.8914, "step": 4287 }, { "epoch": 0.6, "learning_rate": 7.417966367272691e-06, "loss": 0.8137, "step": 4288 }, { "epoch": 0.6, "learning_rate": 7.413620268861267e-06, "loss": 0.8516, "step": 4289 }, { "epoch": 0.6, "learning_rate": 7.409274693939305e-06, "loss": 0.8208, "step": 4290 }, { "epoch": 0.6, "learning_rate": 7.404929643386357e-06, "loss": 0.8882, "step": 4291 }, { "epoch": 0.6, "learning_rate": 7.400585118081872e-06, "loss": 0.8188, "step": 4292 }, { "epoch": 0.6, "learning_rate": 7.396241118905193e-06, "loss": 0.7703, "step": 4293 }, { "epoch": 0.6, "learning_rate": 7.391897646735556e-06, "loss": 0.8691, "step": 4294 }, { "epoch": 0.6, "learning_rate": 7.387554702452092e-06, "loss": 0.7719, "step": 4295 }, { "epoch": 0.6, "learning_rate": 7.38321228693382e-06, "loss": 0.7744, "step": 4296 }, { "epoch": 0.6, "learning_rate": 7.378870401059656e-06, "loss": 0.8135, "step": 4297 }, { "epoch": 0.6, "learning_rate": 7.374529045708408e-06, "loss": 0.7793, "step": 4298 }, { "epoch": 0.6, "learning_rate": 7.370188221758779e-06, "loss": 0.8411, "step": 4299 }, { "epoch": 0.6, "learning_rate": 7.36584793008936e-06, "loss": 0.8052, "step": 4300 }, { "epoch": 0.6, "learning_rate": 7.361508171578639e-06, "loss": 0.6004, "step": 4301 }, { "epoch": 0.6, "learning_rate": 7.357168947104989e-06, "loss": 0.7556, "step": 4302 }, { "epoch": 0.6, "learning_rate": 7.352830257546684e-06, "loss": 0.811, "step": 4303 }, { "epoch": 0.6, "learning_rate": 7.348492103781883e-06, "loss": 0.8147, "step": 4304 }, { "epoch": 0.6, "learning_rate": 7.344154486688637e-06, "loss": 0.8311, "step": 4305 }, { "epoch": 0.6, "learning_rate": 7.339817407144896e-06, "loss": 0.8191, "step": 4306 }, { "epoch": 0.6, "learning_rate": 7.335480866028488e-06, "loss": 0.5504, "step": 4307 }, { "epoch": 0.6, "learning_rate": 7.331144864217144e-06, "loss": 0.6084, "step": 4308 }, { "epoch": 0.6, "learning_rate": 7.326809402588482e-06, "loss": 0.7932, "step": 4309 }, { "epoch": 0.6, "learning_rate": 7.322474482020001e-06, "loss": 0.8594, "step": 4310 }, { "epoch": 0.6, "learning_rate": 7.318140103389113e-06, "loss": 0.8376, "step": 4311 }, { "epoch": 0.6, "learning_rate": 7.313806267573097e-06, "loss": 0.8435, "step": 4312 }, { "epoch": 0.6, "learning_rate": 7.309472975449134e-06, "loss": 0.8721, "step": 4313 }, { "epoch": 0.6, "learning_rate": 7.305140227894295e-06, "loss": 0.783, "step": 4314 }, { "epoch": 0.6, "learning_rate": 7.300808025785533e-06, "loss": 0.8132, "step": 4315 }, { "epoch": 0.6, "learning_rate": 7.296476369999704e-06, "loss": 0.855, "step": 4316 }, { "epoch": 0.6, "learning_rate": 7.292145261413539e-06, "loss": 0.6221, "step": 4317 }, { "epoch": 0.6, "learning_rate": 7.287814700903667e-06, "loss": 0.8647, "step": 4318 }, { "epoch": 0.6, "learning_rate": 7.283484689346606e-06, "loss": 0.8882, "step": 4319 }, { "epoch": 0.6, "learning_rate": 7.279155227618755e-06, "loss": 0.8867, "step": 4320 }, { "epoch": 0.6, "learning_rate": 7.274826316596414e-06, "loss": 0.7729, "step": 4321 }, { "epoch": 0.6, "learning_rate": 7.27049795715576e-06, "loss": 0.7493, "step": 4322 }, { "epoch": 0.6, "learning_rate": 7.266170150172866e-06, "loss": 0.9216, "step": 4323 }, { "epoch": 0.6, "learning_rate": 7.261842896523692e-06, "loss": 0.8054, "step": 4324 }, { "epoch": 0.6, "learning_rate": 7.257516197084078e-06, "loss": 0.823, "step": 4325 }, { "epoch": 0.6, "learning_rate": 7.253190052729766e-06, "loss": 0.5807, "step": 4326 }, { "epoch": 0.6, "learning_rate": 7.248864464336376e-06, "loss": 0.8252, "step": 4327 }, { "epoch": 0.6, "learning_rate": 7.2445394327794115e-06, "loss": 0.8459, "step": 4328 }, { "epoch": 0.6, "learning_rate": 7.240214958934277e-06, "loss": 0.8867, "step": 4329 }, { "epoch": 0.6, "learning_rate": 7.235891043676251e-06, "loss": 0.734, "step": 4330 }, { "epoch": 0.6, "learning_rate": 7.23156768788051e-06, "loss": 0.8574, "step": 4331 }, { "epoch": 0.6, "learning_rate": 7.2272448924221085e-06, "loss": 0.5895, "step": 4332 }, { "epoch": 0.6, "learning_rate": 7.222922658175986e-06, "loss": 0.7839, "step": 4333 }, { "epoch": 0.6, "learning_rate": 7.218600986016981e-06, "loss": 0.7886, "step": 4334 }, { "epoch": 0.6, "learning_rate": 7.214279876819803e-06, "loss": 0.8479, "step": 4335 }, { "epoch": 0.6, "learning_rate": 7.209959331459062e-06, "loss": 0.8262, "step": 4336 }, { "epoch": 0.6, "learning_rate": 7.205639350809245e-06, "loss": 0.7842, "step": 4337 }, { "epoch": 0.6, "learning_rate": 7.20131993574472e-06, "loss": 0.7814, "step": 4338 }, { "epoch": 0.6, "learning_rate": 7.197001087139755e-06, "loss": 0.8354, "step": 4339 }, { "epoch": 0.6, "learning_rate": 7.192682805868489e-06, "loss": 0.8245, "step": 4340 }, { "epoch": 0.6, "learning_rate": 7.188365092804959e-06, "loss": 0.8213, "step": 4341 }, { "epoch": 0.6, "learning_rate": 7.184047948823077e-06, "loss": 0.8662, "step": 4342 }, { "epoch": 0.6, "learning_rate": 7.179731374796639e-06, "loss": 0.9185, "step": 4343 }, { "epoch": 0.6, "learning_rate": 7.175415371599339e-06, "loss": 0.8115, "step": 4344 }, { "epoch": 0.6, "learning_rate": 7.171099940104737e-06, "loss": 0.845, "step": 4345 }, { "epoch": 0.6, "learning_rate": 7.166785081186297e-06, "loss": 0.8019, "step": 4346 }, { "epoch": 0.6, "learning_rate": 7.16247079571735e-06, "loss": 0.8386, "step": 4347 }, { "epoch": 0.6, "learning_rate": 7.158157084571115e-06, "loss": 0.7908, "step": 4348 }, { "epoch": 0.6, "learning_rate": 7.153843948620705e-06, "loss": 0.5024, "step": 4349 }, { "epoch": 0.6, "learning_rate": 7.149531388739101e-06, "loss": 0.8511, "step": 4350 }, { "epoch": 0.6, "learning_rate": 7.1452194057991855e-06, "loss": 0.8252, "step": 4351 }, { "epoch": 0.6, "learning_rate": 7.140908000673708e-06, "loss": 0.8474, "step": 4352 }, { "epoch": 0.6, "learning_rate": 7.136597174235302e-06, "loss": 0.8066, "step": 4353 }, { "epoch": 0.6, "learning_rate": 7.132286927356501e-06, "loss": 0.891, "step": 4354 }, { "epoch": 0.6, "learning_rate": 7.127977260909698e-06, "loss": 0.9043, "step": 4355 }, { "epoch": 0.61, "learning_rate": 7.12366817576719e-06, "loss": 0.8645, "step": 4356 }, { "epoch": 0.61, "learning_rate": 7.11935967280114e-06, "loss": 0.5994, "step": 4357 }, { "epoch": 0.61, "learning_rate": 7.115051752883597e-06, "loss": 0.7657, "step": 4358 }, { "epoch": 0.61, "learning_rate": 7.1107444168865035e-06, "loss": 0.8237, "step": 4359 }, { "epoch": 0.61, "learning_rate": 7.1064376656816625e-06, "loss": 0.8286, "step": 4360 }, { "epoch": 0.61, "learning_rate": 7.102131500140783e-06, "loss": 0.7717, "step": 4361 }, { "epoch": 0.61, "learning_rate": 7.0978259211354375e-06, "loss": 0.8906, "step": 4362 }, { "epoch": 0.61, "learning_rate": 7.093520929537081e-06, "loss": 0.8237, "step": 4363 }, { "epoch": 0.61, "learning_rate": 7.089216526217062e-06, "loss": 0.8855, "step": 4364 }, { "epoch": 0.61, "learning_rate": 7.0849127120465945e-06, "loss": 0.6019, "step": 4365 }, { "epoch": 0.61, "learning_rate": 7.08060948789679e-06, "loss": 0.8525, "step": 4366 }, { "epoch": 0.61, "learning_rate": 7.0763068546386256e-06, "loss": 0.8817, "step": 4367 }, { "epoch": 0.61, "learning_rate": 7.072004813142963e-06, "loss": 0.8184, "step": 4368 }, { "epoch": 0.61, "learning_rate": 7.067703364280552e-06, "loss": 0.8071, "step": 4369 }, { "epoch": 0.61, "learning_rate": 7.063402508922006e-06, "loss": 0.8574, "step": 4370 }, { "epoch": 0.61, "learning_rate": 7.059102247937839e-06, "loss": 0.8374, "step": 4371 }, { "epoch": 0.61, "learning_rate": 7.054802582198432e-06, "loss": 0.7839, "step": 4372 }, { "epoch": 0.61, "learning_rate": 7.05050351257404e-06, "loss": 0.8708, "step": 4373 }, { "epoch": 0.61, "learning_rate": 7.046205039934815e-06, "loss": 0.8403, "step": 4374 }, { "epoch": 0.61, "learning_rate": 7.04190716515077e-06, "loss": 0.8276, "step": 4375 }, { "epoch": 0.61, "learning_rate": 7.037609889091812e-06, "loss": 0.8284, "step": 4376 }, { "epoch": 0.61, "learning_rate": 7.033313212627717e-06, "loss": 0.8513, "step": 4377 }, { "epoch": 0.61, "learning_rate": 7.029017136628138e-06, "loss": 0.8701, "step": 4378 }, { "epoch": 0.61, "learning_rate": 7.02472166196262e-06, "loss": 0.7971, "step": 4379 }, { "epoch": 0.61, "learning_rate": 7.020426789500569e-06, "loss": 0.3301, "step": 4380 }, { "epoch": 0.61, "learning_rate": 7.016132520111285e-06, "loss": 0.8374, "step": 4381 }, { "epoch": 0.61, "learning_rate": 7.011838854663935e-06, "loss": 0.8438, "step": 4382 }, { "epoch": 0.61, "learning_rate": 7.0075457940275634e-06, "loss": 0.877, "step": 4383 }, { "epoch": 0.61, "learning_rate": 7.003253339071103e-06, "loss": 0.7522, "step": 4384 }, { "epoch": 0.61, "learning_rate": 6.99896149066335e-06, "loss": 0.8784, "step": 4385 }, { "epoch": 0.61, "learning_rate": 6.994670249672992e-06, "loss": 0.3526, "step": 4386 }, { "epoch": 0.61, "learning_rate": 6.990379616968584e-06, "loss": 0.8635, "step": 4387 }, { "epoch": 0.61, "learning_rate": 6.986089593418553e-06, "loss": 0.8704, "step": 4388 }, { "epoch": 0.61, "learning_rate": 6.981800179891221e-06, "loss": 0.5826, "step": 4389 }, { "epoch": 0.61, "learning_rate": 6.977511377254766e-06, "loss": 0.8257, "step": 4390 }, { "epoch": 0.61, "learning_rate": 6.973223186377263e-06, "loss": 0.5856, "step": 4391 }, { "epoch": 0.61, "learning_rate": 6.968935608126645e-06, "loss": 0.8413, "step": 4392 }, { "epoch": 0.61, "learning_rate": 6.964648643370724e-06, "loss": 0.8337, "step": 4393 }, { "epoch": 0.61, "learning_rate": 6.960362292977201e-06, "loss": 0.802, "step": 4394 }, { "epoch": 0.61, "learning_rate": 6.956076557813636e-06, "loss": 0.8877, "step": 4395 }, { "epoch": 0.61, "learning_rate": 6.951791438747479e-06, "loss": 0.8623, "step": 4396 }, { "epoch": 0.61, "learning_rate": 6.947506936646047e-06, "loss": 0.5736, "step": 4397 }, { "epoch": 0.61, "learning_rate": 6.9432230523765265e-06, "loss": 0.8445, "step": 4398 }, { "epoch": 0.61, "learning_rate": 6.938939786805994e-06, "loss": 0.8447, "step": 4399 }, { "epoch": 0.61, "learning_rate": 6.934657140801386e-06, "loss": 0.865, "step": 4400 }, { "epoch": 0.61, "learning_rate": 6.930375115229528e-06, "loss": 0.8132, "step": 4401 }, { "epoch": 0.61, "learning_rate": 6.926093710957108e-06, "loss": 0.8606, "step": 4402 }, { "epoch": 0.61, "learning_rate": 6.921812928850689e-06, "loss": 0.844, "step": 4403 }, { "epoch": 0.61, "learning_rate": 6.917532769776719e-06, "loss": 0.866, "step": 4404 }, { "epoch": 0.61, "learning_rate": 6.913253234601504e-06, "loss": 0.8479, "step": 4405 }, { "epoch": 0.61, "learning_rate": 6.908974324191243e-06, "loss": 0.9026, "step": 4406 }, { "epoch": 0.61, "learning_rate": 6.904696039411991e-06, "loss": 0.561, "step": 4407 }, { "epoch": 0.61, "learning_rate": 6.900418381129679e-06, "loss": 0.6115, "step": 4408 }, { "epoch": 0.61, "learning_rate": 6.896141350210124e-06, "loss": 0.8655, "step": 4409 }, { "epoch": 0.61, "learning_rate": 6.891864947519e-06, "loss": 0.7992, "step": 4410 }, { "epoch": 0.61, "learning_rate": 6.887589173921868e-06, "loss": 0.9121, "step": 4411 }, { "epoch": 0.61, "learning_rate": 6.883314030284152e-06, "loss": 0.8413, "step": 4412 }, { "epoch": 0.61, "learning_rate": 6.879039517471146e-06, "loss": 0.8247, "step": 4413 }, { "epoch": 0.61, "learning_rate": 6.874765636348031e-06, "loss": 0.8706, "step": 4414 }, { "epoch": 0.61, "learning_rate": 6.870492387779841e-06, "loss": 0.8741, "step": 4415 }, { "epoch": 0.61, "learning_rate": 6.866219772631502e-06, "loss": 0.8362, "step": 4416 }, { "epoch": 0.61, "learning_rate": 6.861947791767795e-06, "loss": 0.8271, "step": 4417 }, { "epoch": 0.61, "learning_rate": 6.857676446053377e-06, "loss": 0.8076, "step": 4418 }, { "epoch": 0.61, "learning_rate": 6.8534057363527875e-06, "loss": 0.866, "step": 4419 }, { "epoch": 0.61, "learning_rate": 6.849135663530418e-06, "loss": 0.5865, "step": 4420 }, { "epoch": 0.61, "learning_rate": 6.844866228450551e-06, "loss": 0.7939, "step": 4421 }, { "epoch": 0.61, "learning_rate": 6.840597431977321e-06, "loss": 0.8599, "step": 4422 }, { "epoch": 0.61, "learning_rate": 6.836329274974751e-06, "loss": 0.7981, "step": 4423 }, { "epoch": 0.61, "learning_rate": 6.832061758306725e-06, "loss": 0.8511, "step": 4424 }, { "epoch": 0.61, "learning_rate": 6.827794882836991e-06, "loss": 0.7198, "step": 4425 }, { "epoch": 0.61, "learning_rate": 6.823528649429185e-06, "loss": 0.8264, "step": 4426 }, { "epoch": 0.61, "learning_rate": 6.8192630589467945e-06, "loss": 0.8337, "step": 4427 }, { "epoch": 0.62, "learning_rate": 6.8149981122531924e-06, "loss": 0.8188, "step": 4428 }, { "epoch": 0.62, "learning_rate": 6.8107338102116095e-06, "loss": 0.7751, "step": 4429 }, { "epoch": 0.62, "learning_rate": 6.806470153685149e-06, "loss": 0.8987, "step": 4430 }, { "epoch": 0.62, "learning_rate": 6.802207143536792e-06, "loss": 0.7898, "step": 4431 }, { "epoch": 0.62, "learning_rate": 6.797944780629374e-06, "loss": 0.8467, "step": 4432 }, { "epoch": 0.62, "learning_rate": 6.793683065825616e-06, "loss": 0.8033, "step": 4433 }, { "epoch": 0.62, "learning_rate": 6.789421999988094e-06, "loss": 0.751, "step": 4434 }, { "epoch": 0.62, "learning_rate": 6.785161583979255e-06, "loss": 0.8555, "step": 4435 }, { "epoch": 0.62, "learning_rate": 6.780901818661425e-06, "loss": 0.8303, "step": 4436 }, { "epoch": 0.62, "learning_rate": 6.776642704896783e-06, "loss": 0.896, "step": 4437 }, { "epoch": 0.62, "learning_rate": 6.772384243547392e-06, "loss": 0.7883, "step": 4438 }, { "epoch": 0.62, "learning_rate": 6.768126435475171e-06, "loss": 0.6289, "step": 4439 }, { "epoch": 0.62, "learning_rate": 6.763869281541905e-06, "loss": 0.8364, "step": 4440 }, { "epoch": 0.62, "learning_rate": 6.759612782609262e-06, "loss": 0.8291, "step": 4441 }, { "epoch": 0.62, "learning_rate": 6.755356939538757e-06, "loss": 0.8914, "step": 4442 }, { "epoch": 0.62, "learning_rate": 6.751101753191796e-06, "loss": 0.8591, "step": 4443 }, { "epoch": 0.62, "learning_rate": 6.746847224429629e-06, "loss": 0.8572, "step": 4444 }, { "epoch": 0.62, "learning_rate": 6.742593354113383e-06, "loss": 0.8074, "step": 4445 }, { "epoch": 0.62, "learning_rate": 6.738340143104057e-06, "loss": 0.8362, "step": 4446 }, { "epoch": 0.62, "learning_rate": 6.7340875922625035e-06, "loss": 0.8137, "step": 4447 }, { "epoch": 0.62, "learning_rate": 6.72983570244946e-06, "loss": 0.7549, "step": 4448 }, { "epoch": 0.62, "learning_rate": 6.725584474525511e-06, "loss": 0.8115, "step": 4449 }, { "epoch": 0.62, "learning_rate": 6.721333909351113e-06, "loss": 0.8452, "step": 4450 }, { "epoch": 0.62, "learning_rate": 6.7170840077865986e-06, "loss": 0.8442, "step": 4451 }, { "epoch": 0.62, "learning_rate": 6.712834770692151e-06, "loss": 0.8481, "step": 4452 }, { "epoch": 0.62, "learning_rate": 6.708586198927832e-06, "loss": 0.8535, "step": 4453 }, { "epoch": 0.62, "learning_rate": 6.70433829335356e-06, "loss": 0.7754, "step": 4454 }, { "epoch": 0.62, "learning_rate": 6.700091054829118e-06, "loss": 0.7552, "step": 4455 }, { "epoch": 0.62, "learning_rate": 6.695844484214163e-06, "loss": 0.8538, "step": 4456 }, { "epoch": 0.62, "learning_rate": 6.691598582368205e-06, "loss": 0.8062, "step": 4457 }, { "epoch": 0.62, "learning_rate": 6.687353350150631e-06, "loss": 0.8655, "step": 4458 }, { "epoch": 0.62, "learning_rate": 6.6831087884206845e-06, "loss": 0.8608, "step": 4459 }, { "epoch": 0.62, "learning_rate": 6.67886489803747e-06, "loss": 0.8279, "step": 4460 }, { "epoch": 0.62, "learning_rate": 6.67462167985997e-06, "loss": 0.811, "step": 4461 }, { "epoch": 0.62, "learning_rate": 6.670379134747009e-06, "loss": 0.5728, "step": 4462 }, { "epoch": 0.62, "learning_rate": 6.6661372635573025e-06, "loss": 0.8047, "step": 4463 }, { "epoch": 0.62, "learning_rate": 6.661896067149409e-06, "loss": 0.7979, "step": 4464 }, { "epoch": 0.62, "learning_rate": 6.657655546381754e-06, "loss": 0.7366, "step": 4465 }, { "epoch": 0.62, "learning_rate": 6.653415702112634e-06, "loss": 0.8247, "step": 4466 }, { "epoch": 0.62, "learning_rate": 6.6491765352001995e-06, "loss": 0.7976, "step": 4467 }, { "epoch": 0.62, "learning_rate": 6.6449380465024725e-06, "loss": 0.8943, "step": 4468 }, { "epoch": 0.62, "learning_rate": 6.640700236877331e-06, "loss": 0.7699, "step": 4469 }, { "epoch": 0.62, "learning_rate": 6.6364631071825144e-06, "loss": 0.8787, "step": 4470 }, { "epoch": 0.62, "learning_rate": 6.632226658275635e-06, "loss": 0.8062, "step": 4471 }, { "epoch": 0.62, "learning_rate": 6.627990891014153e-06, "loss": 0.5301, "step": 4472 }, { "epoch": 0.62, "learning_rate": 6.623755806255405e-06, "loss": 0.8545, "step": 4473 }, { "epoch": 0.62, "learning_rate": 6.619521404856579e-06, "loss": 0.7949, "step": 4474 }, { "epoch": 0.62, "learning_rate": 6.615287687674724e-06, "loss": 0.5674, "step": 4475 }, { "epoch": 0.62, "learning_rate": 6.611054655566762e-06, "loss": 0.8052, "step": 4476 }, { "epoch": 0.62, "learning_rate": 6.60682230938946e-06, "loss": 0.8394, "step": 4477 }, { "epoch": 0.62, "learning_rate": 6.602590649999465e-06, "loss": 0.8406, "step": 4478 }, { "epoch": 0.62, "learning_rate": 6.59835967825327e-06, "loss": 0.8492, "step": 4479 }, { "epoch": 0.62, "learning_rate": 6.5941293950072295e-06, "loss": 0.5591, "step": 4480 }, { "epoch": 0.62, "learning_rate": 6.589899801117572e-06, "loss": 0.8063, "step": 4481 }, { "epoch": 0.62, "learning_rate": 6.585670897440368e-06, "loss": 0.5895, "step": 4482 }, { "epoch": 0.62, "learning_rate": 6.5814426848315674e-06, "loss": 0.8813, "step": 4483 }, { "epoch": 0.62, "learning_rate": 6.577215164146964e-06, "loss": 0.8279, "step": 4484 }, { "epoch": 0.62, "learning_rate": 6.572988336242217e-06, "loss": 0.8391, "step": 4485 }, { "epoch": 0.62, "learning_rate": 6.568762201972854e-06, "loss": 0.8738, "step": 4486 }, { "epoch": 0.62, "learning_rate": 6.564536762194247e-06, "loss": 0.8845, "step": 4487 }, { "epoch": 0.62, "learning_rate": 6.560312017761639e-06, "loss": 0.877, "step": 4488 }, { "epoch": 0.62, "learning_rate": 6.55608796953013e-06, "loss": 0.8306, "step": 4489 }, { "epoch": 0.62, "learning_rate": 6.55186461835467e-06, "loss": 0.8191, "step": 4490 }, { "epoch": 0.62, "learning_rate": 6.547641965090085e-06, "loss": 0.8765, "step": 4491 }, { "epoch": 0.62, "learning_rate": 6.543420010591044e-06, "loss": 0.782, "step": 4492 }, { "epoch": 0.62, "learning_rate": 6.539198755712082e-06, "loss": 0.887, "step": 4493 }, { "epoch": 0.62, "learning_rate": 6.534978201307593e-06, "loss": 0.8245, "step": 4494 }, { "epoch": 0.62, "learning_rate": 6.530758348231822e-06, "loss": 0.8252, "step": 4495 }, { "epoch": 0.62, "learning_rate": 6.526539197338886e-06, "loss": 0.7927, "step": 4496 }, { "epoch": 0.62, "learning_rate": 6.5223207494827436e-06, "loss": 0.8748, "step": 4497 }, { "epoch": 0.62, "learning_rate": 6.518103005517222e-06, "loss": 0.9253, "step": 4498 }, { "epoch": 0.62, "learning_rate": 6.513885966296004e-06, "loss": 0.8096, "step": 4499 }, { "epoch": 0.63, "learning_rate": 6.509669632672624e-06, "loss": 0.8096, "step": 4500 }, { "epoch": 0.63, "learning_rate": 6.5054540055004835e-06, "loss": 0.856, "step": 4501 }, { "epoch": 0.63, "learning_rate": 6.501239085632831e-06, "loss": 0.8163, "step": 4502 }, { "epoch": 0.63, "learning_rate": 6.497024873922778e-06, "loss": 0.7939, "step": 4503 }, { "epoch": 0.63, "learning_rate": 6.492811371223295e-06, "loss": 0.8604, "step": 4504 }, { "epoch": 0.63, "learning_rate": 6.4885985783871954e-06, "loss": 0.832, "step": 4505 }, { "epoch": 0.63, "learning_rate": 6.48438649626717e-06, "loss": 0.8284, "step": 4506 }, { "epoch": 0.63, "learning_rate": 6.480175125715745e-06, "loss": 0.7822, "step": 4507 }, { "epoch": 0.63, "learning_rate": 6.475964467585317e-06, "loss": 0.8118, "step": 4508 }, { "epoch": 0.63, "learning_rate": 6.4717545227281345e-06, "loss": 0.8752, "step": 4509 }, { "epoch": 0.63, "learning_rate": 6.467545291996296e-06, "loss": 0.8296, "step": 4510 }, { "epoch": 0.63, "learning_rate": 6.46333677624176e-06, "loss": 0.8406, "step": 4511 }, { "epoch": 0.63, "learning_rate": 6.459128976316344e-06, "loss": 0.793, "step": 4512 }, { "epoch": 0.63, "learning_rate": 6.4549218930717135e-06, "loss": 0.5536, "step": 4513 }, { "epoch": 0.63, "learning_rate": 6.450715527359397e-06, "loss": 0.5728, "step": 4514 }, { "epoch": 0.63, "learning_rate": 6.446509880030767e-06, "loss": 0.8196, "step": 4515 }, { "epoch": 0.63, "learning_rate": 6.442304951937058e-06, "loss": 0.567, "step": 4516 }, { "epoch": 0.63, "learning_rate": 6.43810074392936e-06, "loss": 0.8582, "step": 4517 }, { "epoch": 0.63, "learning_rate": 6.433897256858614e-06, "loss": 0.7937, "step": 4518 }, { "epoch": 0.63, "learning_rate": 6.4296944915756165e-06, "loss": 0.8455, "step": 4519 }, { "epoch": 0.63, "learning_rate": 6.425492448931015e-06, "loss": 0.8298, "step": 4520 }, { "epoch": 0.63, "learning_rate": 6.421291129775313e-06, "loss": 0.8191, "step": 4521 }, { "epoch": 0.63, "learning_rate": 6.41709053495887e-06, "loss": 0.8379, "step": 4522 }, { "epoch": 0.63, "learning_rate": 6.412890665331894e-06, "loss": 0.8464, "step": 4523 }, { "epoch": 0.63, "learning_rate": 6.408691521744452e-06, "loss": 0.5672, "step": 4524 }, { "epoch": 0.63, "learning_rate": 6.404493105046457e-06, "loss": 0.8136, "step": 4525 }, { "epoch": 0.63, "learning_rate": 6.4002954160876804e-06, "loss": 0.833, "step": 4526 }, { "epoch": 0.63, "learning_rate": 6.396098455717745e-06, "loss": 0.7703, "step": 4527 }, { "epoch": 0.63, "learning_rate": 6.391902224786124e-06, "loss": 0.811, "step": 4528 }, { "epoch": 0.63, "learning_rate": 6.3877067241421475e-06, "loss": 0.8772, "step": 4529 }, { "epoch": 0.63, "learning_rate": 6.383511954634991e-06, "loss": 0.8486, "step": 4530 }, { "epoch": 0.63, "learning_rate": 6.3793179171136885e-06, "loss": 0.8562, "step": 4531 }, { "epoch": 0.63, "learning_rate": 6.375124612427122e-06, "loss": 0.8054, "step": 4532 }, { "epoch": 0.63, "learning_rate": 6.37093204142403e-06, "loss": 0.8706, "step": 4533 }, { "epoch": 0.63, "learning_rate": 6.366740204952993e-06, "loss": 0.8518, "step": 4534 }, { "epoch": 0.63, "learning_rate": 6.362549103862452e-06, "loss": 0.9006, "step": 4535 }, { "epoch": 0.63, "learning_rate": 6.358358739000697e-06, "loss": 0.8149, "step": 4536 }, { "epoch": 0.63, "learning_rate": 6.354169111215864e-06, "loss": 0.8428, "step": 4537 }, { "epoch": 0.63, "learning_rate": 6.349980221355951e-06, "loss": 0.5942, "step": 4538 }, { "epoch": 0.63, "learning_rate": 6.345792070268788e-06, "loss": 0.7812, "step": 4539 }, { "epoch": 0.63, "learning_rate": 6.3416046588020785e-06, "loss": 0.8552, "step": 4540 }, { "epoch": 0.63, "learning_rate": 6.337417987803358e-06, "loss": 0.554, "step": 4541 }, { "epoch": 0.63, "learning_rate": 6.33323205812002e-06, "loss": 0.7893, "step": 4542 }, { "epoch": 0.63, "learning_rate": 6.329046870599309e-06, "loss": 0.606, "step": 4543 }, { "epoch": 0.63, "learning_rate": 6.324862426088312e-06, "loss": 0.5575, "step": 4544 }, { "epoch": 0.63, "learning_rate": 6.320678725433977e-06, "loss": 0.8506, "step": 4545 }, { "epoch": 0.63, "learning_rate": 6.316495769483089e-06, "loss": 0.8516, "step": 4546 }, { "epoch": 0.63, "learning_rate": 6.312313559082291e-06, "loss": 0.7706, "step": 4547 }, { "epoch": 0.63, "learning_rate": 6.308132095078074e-06, "loss": 0.8158, "step": 4548 }, { "epoch": 0.63, "learning_rate": 6.303951378316773e-06, "loss": 0.7983, "step": 4549 }, { "epoch": 0.63, "learning_rate": 6.2997714096445795e-06, "loss": 0.8833, "step": 4550 }, { "epoch": 0.63, "learning_rate": 6.2955921899075245e-06, "loss": 0.567, "step": 4551 }, { "epoch": 0.63, "learning_rate": 6.291413719951493e-06, "loss": 0.8074, "step": 4552 }, { "epoch": 0.63, "learning_rate": 6.287236000622222e-06, "loss": 0.7935, "step": 4553 }, { "epoch": 0.63, "learning_rate": 6.283059032765284e-06, "loss": 0.8479, "step": 4554 }, { "epoch": 0.63, "learning_rate": 6.278882817226115e-06, "loss": 0.8547, "step": 4555 }, { "epoch": 0.63, "learning_rate": 6.2747073548499895e-06, "loss": 0.8298, "step": 4556 }, { "epoch": 0.63, "learning_rate": 6.270532646482024e-06, "loss": 0.8533, "step": 4557 }, { "epoch": 0.63, "learning_rate": 6.2663586929671985e-06, "loss": 0.8352, "step": 4558 }, { "epoch": 0.63, "learning_rate": 6.262185495150323e-06, "loss": 0.8269, "step": 4559 }, { "epoch": 0.63, "learning_rate": 6.258013053876073e-06, "loss": 0.5465, "step": 4560 }, { "epoch": 0.63, "learning_rate": 6.253841369988953e-06, "loss": 0.7983, "step": 4561 }, { "epoch": 0.63, "learning_rate": 6.2496704443333214e-06, "loss": 0.7935, "step": 4562 }, { "epoch": 0.63, "learning_rate": 6.245500277753389e-06, "loss": 0.8088, "step": 4563 }, { "epoch": 0.63, "learning_rate": 6.2413308710932004e-06, "loss": 0.7698, "step": 4564 }, { "epoch": 0.63, "learning_rate": 6.237162225196662e-06, "loss": 0.8225, "step": 4565 }, { "epoch": 0.63, "learning_rate": 6.2329943409075125e-06, "loss": 0.7915, "step": 4566 }, { "epoch": 0.63, "learning_rate": 6.228827219069339e-06, "loss": 0.8467, "step": 4567 }, { "epoch": 0.63, "learning_rate": 6.2246608605255846e-06, "loss": 0.8152, "step": 4568 }, { "epoch": 0.63, "learning_rate": 6.220495266119522e-06, "loss": 0.7842, "step": 4569 }, { "epoch": 0.63, "learning_rate": 6.216330436694284e-06, "loss": 0.5498, "step": 4570 }, { "epoch": 0.63, "learning_rate": 6.21216637309284e-06, "loss": 0.8298, "step": 4571 }, { "epoch": 0.64, "learning_rate": 6.208003076158002e-06, "loss": 0.8149, "step": 4572 }, { "epoch": 0.64, "learning_rate": 6.2038405467324405e-06, "loss": 0.8269, "step": 4573 }, { "epoch": 0.64, "learning_rate": 6.199678785658652e-06, "loss": 0.8687, "step": 4574 }, { "epoch": 0.64, "learning_rate": 6.195517793778995e-06, "loss": 0.863, "step": 4575 }, { "epoch": 0.64, "learning_rate": 6.191357571935659e-06, "loss": 0.8525, "step": 4576 }, { "epoch": 0.64, "learning_rate": 6.187198120970681e-06, "loss": 0.7927, "step": 4577 }, { "epoch": 0.64, "learning_rate": 6.183039441725952e-06, "loss": 0.8123, "step": 4578 }, { "epoch": 0.64, "learning_rate": 6.17888153504319e-06, "loss": 0.8228, "step": 4579 }, { "epoch": 0.64, "learning_rate": 6.1747244017639715e-06, "loss": 0.5226, "step": 4580 }, { "epoch": 0.64, "learning_rate": 6.1705680427297085e-06, "loss": 0.8362, "step": 4581 }, { "epoch": 0.64, "learning_rate": 6.166412458781654e-06, "loss": 0.8306, "step": 4582 }, { "epoch": 0.64, "learning_rate": 6.162257650760914e-06, "loss": 0.8647, "step": 4583 }, { "epoch": 0.64, "learning_rate": 6.1581036195084265e-06, "loss": 0.6057, "step": 4584 }, { "epoch": 0.64, "learning_rate": 6.153950365864984e-06, "loss": 0.825, "step": 4585 }, { "epoch": 0.64, "learning_rate": 6.149797890671211e-06, "loss": 0.8655, "step": 4586 }, { "epoch": 0.64, "learning_rate": 6.145646194767574e-06, "loss": 0.8159, "step": 4587 }, { "epoch": 0.64, "learning_rate": 6.141495278994393e-06, "loss": 0.8782, "step": 4588 }, { "epoch": 0.64, "learning_rate": 6.13734514419182e-06, "loss": 0.8547, "step": 4589 }, { "epoch": 0.64, "learning_rate": 6.133195791199855e-06, "loss": 0.8293, "step": 4590 }, { "epoch": 0.64, "learning_rate": 6.1290472208583365e-06, "loss": 0.8418, "step": 4591 }, { "epoch": 0.64, "learning_rate": 6.124899434006939e-06, "loss": 0.7468, "step": 4592 }, { "epoch": 0.64, "learning_rate": 6.120752431485193e-06, "loss": 0.8425, "step": 4593 }, { "epoch": 0.64, "learning_rate": 6.116606214132455e-06, "loss": 0.8235, "step": 4594 }, { "epoch": 0.64, "learning_rate": 6.112460782787936e-06, "loss": 0.8142, "step": 4595 }, { "epoch": 0.64, "learning_rate": 6.1083161382906775e-06, "loss": 0.8193, "step": 4596 }, { "epoch": 0.64, "learning_rate": 6.104172281479561e-06, "loss": 0.8265, "step": 4597 }, { "epoch": 0.64, "learning_rate": 6.100029213193322e-06, "loss": 0.7805, "step": 4598 }, { "epoch": 0.64, "learning_rate": 6.095886934270519e-06, "loss": 0.8024, "step": 4599 }, { "epoch": 0.64, "learning_rate": 6.091745445549569e-06, "loss": 0.8076, "step": 4600 }, { "epoch": 0.64, "learning_rate": 6.087604747868711e-06, "loss": 0.8518, "step": 4601 }, { "epoch": 0.64, "learning_rate": 6.083464842066032e-06, "loss": 0.8491, "step": 4602 }, { "epoch": 0.64, "learning_rate": 6.0793257289794646e-06, "loss": 0.8877, "step": 4603 }, { "epoch": 0.64, "learning_rate": 6.07518740944677e-06, "loss": 0.8557, "step": 4604 }, { "epoch": 0.64, "learning_rate": 6.071049884305558e-06, "loss": 0.7892, "step": 4605 }, { "epoch": 0.64, "learning_rate": 6.066913154393273e-06, "loss": 0.8245, "step": 4606 }, { "epoch": 0.64, "learning_rate": 6.062777220547193e-06, "loss": 0.7815, "step": 4607 }, { "epoch": 0.64, "learning_rate": 6.058642083604451e-06, "loss": 0.7823, "step": 4608 }, { "epoch": 0.64, "learning_rate": 6.054507744401999e-06, "loss": 0.8447, "step": 4609 }, { "epoch": 0.64, "learning_rate": 6.050374203776646e-06, "loss": 0.8572, "step": 4610 }, { "epoch": 0.64, "learning_rate": 6.046241462565025e-06, "loss": 0.876, "step": 4611 }, { "epoch": 0.64, "learning_rate": 6.0421095216036095e-06, "loss": 0.6132, "step": 4612 }, { "epoch": 0.64, "learning_rate": 6.037978381728724e-06, "loss": 0.8149, "step": 4613 }, { "epoch": 0.64, "learning_rate": 6.033848043776511e-06, "loss": 0.8904, "step": 4614 }, { "epoch": 0.64, "learning_rate": 6.0297185085829694e-06, "loss": 0.8193, "step": 4615 }, { "epoch": 0.64, "learning_rate": 6.025589776983923e-06, "loss": 0.8235, "step": 4616 }, { "epoch": 0.64, "learning_rate": 6.021461849815034e-06, "loss": 0.7849, "step": 4617 }, { "epoch": 0.64, "learning_rate": 6.01733472791181e-06, "loss": 0.8027, "step": 4618 }, { "epoch": 0.64, "learning_rate": 6.013208412109586e-06, "loss": 0.8928, "step": 4619 }, { "epoch": 0.64, "learning_rate": 6.009082903243544e-06, "loss": 0.866, "step": 4620 }, { "epoch": 0.64, "learning_rate": 6.004958202148694e-06, "loss": 0.8098, "step": 4621 }, { "epoch": 0.64, "learning_rate": 6.000834309659879e-06, "loss": 0.8447, "step": 4622 }, { "epoch": 0.64, "learning_rate": 5.996711226611795e-06, "loss": 0.5431, "step": 4623 }, { "epoch": 0.64, "learning_rate": 5.992588953838957e-06, "loss": 0.5829, "step": 4624 }, { "epoch": 0.64, "learning_rate": 5.988467492175728e-06, "loss": 0.8318, "step": 4625 }, { "epoch": 0.64, "learning_rate": 5.984346842456299e-06, "loss": 0.8342, "step": 4626 }, { "epoch": 0.64, "learning_rate": 5.980227005514696e-06, "loss": 0.9048, "step": 4627 }, { "epoch": 0.64, "learning_rate": 5.97610798218479e-06, "loss": 0.5509, "step": 4628 }, { "epoch": 0.64, "learning_rate": 5.9719897733002755e-06, "loss": 0.8547, "step": 4629 }, { "epoch": 0.64, "learning_rate": 5.967872379694695e-06, "loss": 0.5658, "step": 4630 }, { "epoch": 0.64, "learning_rate": 5.963755802201414e-06, "loss": 0.8206, "step": 4631 }, { "epoch": 0.64, "learning_rate": 5.959640041653634e-06, "loss": 0.7805, "step": 4632 }, { "epoch": 0.64, "learning_rate": 5.9555250988844025e-06, "loss": 0.5685, "step": 4633 }, { "epoch": 0.64, "learning_rate": 5.951410974726588e-06, "loss": 0.8882, "step": 4634 }, { "epoch": 0.64, "learning_rate": 5.9472976700129046e-06, "loss": 0.793, "step": 4635 }, { "epoch": 0.64, "learning_rate": 5.943185185575893e-06, "loss": 0.6229, "step": 4636 }, { "epoch": 0.64, "learning_rate": 5.939073522247923e-06, "loss": 0.7538, "step": 4637 }, { "epoch": 0.64, "learning_rate": 5.934962680861216e-06, "loss": 0.855, "step": 4638 }, { "epoch": 0.64, "learning_rate": 5.930852662247808e-06, "loss": 0.7671, "step": 4639 }, { "epoch": 0.64, "learning_rate": 5.926743467239582e-06, "loss": 0.9229, "step": 4640 }, { "epoch": 0.64, "learning_rate": 5.922635096668248e-06, "loss": 0.8396, "step": 4641 }, { "epoch": 0.64, "learning_rate": 5.918527551365344e-06, "loss": 0.8291, "step": 4642 }, { "epoch": 0.64, "learning_rate": 5.914420832162256e-06, "loss": 0.8118, "step": 4643 }, { "epoch": 0.65, "learning_rate": 5.910314939890185e-06, "loss": 0.8989, "step": 4644 }, { "epoch": 0.65, "learning_rate": 5.906209875380182e-06, "loss": 0.8625, "step": 4645 }, { "epoch": 0.65, "learning_rate": 5.902105639463119e-06, "loss": 0.7745, "step": 4646 }, { "epoch": 0.65, "learning_rate": 5.8980022329696975e-06, "loss": 0.7616, "step": 4647 }, { "epoch": 0.65, "learning_rate": 5.893899656730465e-06, "loss": 0.7679, "step": 4648 }, { "epoch": 0.65, "learning_rate": 5.8897979115757855e-06, "loss": 0.7986, "step": 4649 }, { "epoch": 0.65, "learning_rate": 5.88569699833587e-06, "loss": 0.8418, "step": 4650 }, { "epoch": 0.65, "learning_rate": 5.881596917840748e-06, "loss": 0.8579, "step": 4651 }, { "epoch": 0.65, "learning_rate": 5.877497670920284e-06, "loss": 0.7947, "step": 4652 }, { "epoch": 0.65, "learning_rate": 5.873399258404181e-06, "loss": 0.865, "step": 4653 }, { "epoch": 0.65, "learning_rate": 5.86930168112196e-06, "loss": 0.8025, "step": 4654 }, { "epoch": 0.65, "learning_rate": 5.86520493990299e-06, "loss": 0.8127, "step": 4655 }, { "epoch": 0.65, "learning_rate": 5.861109035576451e-06, "loss": 0.8506, "step": 4656 }, { "epoch": 0.65, "learning_rate": 5.857013968971375e-06, "loss": 0.8217, "step": 4657 }, { "epoch": 0.65, "learning_rate": 5.852919740916605e-06, "loss": 0.8435, "step": 4658 }, { "epoch": 0.65, "learning_rate": 5.848826352240822e-06, "loss": 0.8031, "step": 4659 }, { "epoch": 0.65, "learning_rate": 5.844733803772544e-06, "loss": 0.833, "step": 4660 }, { "epoch": 0.65, "learning_rate": 5.840642096340106e-06, "loss": 0.8116, "step": 4661 }, { "epoch": 0.65, "learning_rate": 5.836551230771687e-06, "loss": 0.8862, "step": 4662 }, { "epoch": 0.65, "learning_rate": 5.83246120789528e-06, "loss": 0.8298, "step": 4663 }, { "epoch": 0.65, "learning_rate": 5.828372028538723e-06, "loss": 0.583, "step": 4664 }, { "epoch": 0.65, "learning_rate": 5.8242836935296695e-06, "loss": 0.7998, "step": 4665 }, { "epoch": 0.65, "learning_rate": 5.8201962036956085e-06, "loss": 0.8723, "step": 4666 }, { "epoch": 0.65, "learning_rate": 5.816109559863863e-06, "loss": 0.5532, "step": 4667 }, { "epoch": 0.65, "learning_rate": 5.8120237628615714e-06, "loss": 0.8335, "step": 4668 }, { "epoch": 0.65, "learning_rate": 5.80793881351572e-06, "loss": 0.8149, "step": 4669 }, { "epoch": 0.65, "learning_rate": 5.803854712653105e-06, "loss": 0.8584, "step": 4670 }, { "epoch": 0.65, "learning_rate": 5.799771461100354e-06, "loss": 0.7917, "step": 4671 }, { "epoch": 0.65, "learning_rate": 5.795689059683938e-06, "loss": 0.7583, "step": 4672 }, { "epoch": 0.65, "learning_rate": 5.791607509230139e-06, "loss": 0.8386, "step": 4673 }, { "epoch": 0.65, "learning_rate": 5.787526810565067e-06, "loss": 0.8284, "step": 4674 }, { "epoch": 0.65, "learning_rate": 5.783446964514676e-06, "loss": 0.8635, "step": 4675 }, { "epoch": 0.65, "learning_rate": 5.779367971904728e-06, "loss": 0.8237, "step": 4676 }, { "epoch": 0.65, "learning_rate": 5.7752898335608276e-06, "loss": 0.8655, "step": 4677 }, { "epoch": 0.65, "learning_rate": 5.771212550308396e-06, "loss": 0.8048, "step": 4678 }, { "epoch": 0.65, "learning_rate": 5.767136122972683e-06, "loss": 0.8926, "step": 4679 }, { "epoch": 0.65, "learning_rate": 5.763060552378773e-06, "loss": 0.8425, "step": 4680 }, { "epoch": 0.65, "learning_rate": 5.758985839351564e-06, "loss": 0.8462, "step": 4681 }, { "epoch": 0.65, "learning_rate": 5.754911984715796e-06, "loss": 0.8501, "step": 4682 }, { "epoch": 0.65, "learning_rate": 5.7508389892960236e-06, "loss": 0.807, "step": 4683 }, { "epoch": 0.65, "learning_rate": 5.746766853916626e-06, "loss": 0.8501, "step": 4684 }, { "epoch": 0.65, "learning_rate": 5.74269557940182e-06, "loss": 0.7708, "step": 4685 }, { "epoch": 0.65, "learning_rate": 5.7386251665756356e-06, "loss": 0.823, "step": 4686 }, { "epoch": 0.65, "learning_rate": 5.73455561626194e-06, "loss": 0.748, "step": 4687 }, { "epoch": 0.65, "learning_rate": 5.7304869292844175e-06, "loss": 0.8389, "step": 4688 }, { "epoch": 0.65, "learning_rate": 5.726419106466577e-06, "loss": 0.8274, "step": 4689 }, { "epoch": 0.65, "learning_rate": 5.7223521486317605e-06, "loss": 0.6373, "step": 4690 }, { "epoch": 0.65, "learning_rate": 5.718286056603124e-06, "loss": 0.9143, "step": 4691 }, { "epoch": 0.65, "learning_rate": 5.714220831203661e-06, "loss": 0.8213, "step": 4692 }, { "epoch": 0.65, "learning_rate": 5.710156473256181e-06, "loss": 0.875, "step": 4693 }, { "epoch": 0.65, "learning_rate": 5.706092983583316e-06, "loss": 0.8416, "step": 4694 }, { "epoch": 0.65, "learning_rate": 5.70203036300753e-06, "loss": 0.7971, "step": 4695 }, { "epoch": 0.65, "learning_rate": 5.697968612351103e-06, "loss": 0.6248, "step": 4696 }, { "epoch": 0.65, "learning_rate": 5.69390773243615e-06, "loss": 0.7869, "step": 4697 }, { "epoch": 0.65, "learning_rate": 5.689847724084599e-06, "loss": 0.8228, "step": 4698 }, { "epoch": 0.65, "learning_rate": 5.685788588118202e-06, "loss": 0.7983, "step": 4699 }, { "epoch": 0.65, "learning_rate": 5.681730325358543e-06, "loss": 0.5885, "step": 4700 }, { "epoch": 0.65, "learning_rate": 5.67767293662702e-06, "loss": 0.8472, "step": 4701 }, { "epoch": 0.65, "learning_rate": 5.673616422744863e-06, "loss": 0.8032, "step": 4702 }, { "epoch": 0.65, "learning_rate": 5.669560784533119e-06, "loss": 0.8875, "step": 4703 }, { "epoch": 0.65, "learning_rate": 5.665506022812652e-06, "loss": 0.7781, "step": 4704 }, { "epoch": 0.65, "learning_rate": 5.661452138404166e-06, "loss": 0.8772, "step": 4705 }, { "epoch": 0.65, "learning_rate": 5.657399132128167e-06, "loss": 0.8169, "step": 4706 }, { "epoch": 0.65, "learning_rate": 5.653347004805002e-06, "loss": 0.7668, "step": 4707 }, { "epoch": 0.65, "learning_rate": 5.649295757254828e-06, "loss": 0.7731, "step": 4708 }, { "epoch": 0.65, "learning_rate": 5.645245390297622e-06, "loss": 0.8191, "step": 4709 }, { "epoch": 0.65, "learning_rate": 5.641195904753196e-06, "loss": 0.8257, "step": 4710 }, { "epoch": 0.65, "learning_rate": 5.63714730144117e-06, "loss": 0.8174, "step": 4711 }, { "epoch": 0.65, "learning_rate": 5.633099581180995e-06, "loss": 0.7883, "step": 4712 }, { "epoch": 0.65, "learning_rate": 5.629052744791938e-06, "loss": 0.8457, "step": 4713 }, { "epoch": 0.65, "learning_rate": 5.625006793093084e-06, "loss": 0.797, "step": 4714 }, { "epoch": 0.65, "learning_rate": 5.620961726903351e-06, "loss": 0.7668, "step": 4715 }, { "epoch": 0.66, "learning_rate": 5.616917547041463e-06, "loss": 0.8486, "step": 4716 }, { "epoch": 0.66, "learning_rate": 5.612874254325978e-06, "loss": 0.8105, "step": 4717 }, { "epoch": 0.66, "learning_rate": 5.608831849575266e-06, "loss": 0.8062, "step": 4718 }, { "epoch": 0.66, "learning_rate": 5.604790333607514e-06, "loss": 0.7874, "step": 4719 }, { "epoch": 0.66, "learning_rate": 5.6007497072407424e-06, "loss": 0.8943, "step": 4720 }, { "epoch": 0.66, "learning_rate": 5.596709971292778e-06, "loss": 0.5868, "step": 4721 }, { "epoch": 0.66, "learning_rate": 5.5926711265812775e-06, "loss": 0.8105, "step": 4722 }, { "epoch": 0.66, "learning_rate": 5.58863317392371e-06, "loss": 0.8218, "step": 4723 }, { "epoch": 0.66, "learning_rate": 5.584596114137365e-06, "loss": 0.7548, "step": 4724 }, { "epoch": 0.66, "learning_rate": 5.5805599480393595e-06, "loss": 0.8254, "step": 4725 }, { "epoch": 0.66, "learning_rate": 5.576524676446614e-06, "loss": 0.8191, "step": 4726 }, { "epoch": 0.66, "learning_rate": 5.572490300175888e-06, "loss": 0.8462, "step": 4727 }, { "epoch": 0.66, "learning_rate": 5.568456820043741e-06, "loss": 0.8455, "step": 4728 }, { "epoch": 0.66, "learning_rate": 5.5644242368665595e-06, "loss": 0.8708, "step": 4729 }, { "epoch": 0.66, "learning_rate": 5.560392551460552e-06, "loss": 0.7784, "step": 4730 }, { "epoch": 0.66, "learning_rate": 5.5563617646417355e-06, "loss": 0.8158, "step": 4731 }, { "epoch": 0.66, "learning_rate": 5.552331877225959e-06, "loss": 0.8115, "step": 4732 }, { "epoch": 0.66, "learning_rate": 5.548302890028877e-06, "loss": 0.886, "step": 4733 }, { "epoch": 0.66, "learning_rate": 5.544274803865962e-06, "loss": 0.8276, "step": 4734 }, { "epoch": 0.66, "learning_rate": 5.540247619552517e-06, "loss": 0.7888, "step": 4735 }, { "epoch": 0.66, "learning_rate": 5.536221337903643e-06, "loss": 0.8357, "step": 4736 }, { "epoch": 0.66, "learning_rate": 5.5321959597342814e-06, "loss": 0.8267, "step": 4737 }, { "epoch": 0.66, "learning_rate": 5.528171485859171e-06, "loss": 0.7463, "step": 4738 }, { "epoch": 0.66, "learning_rate": 5.524147917092872e-06, "loss": 0.772, "step": 4739 }, { "epoch": 0.66, "learning_rate": 5.520125254249773e-06, "loss": 0.803, "step": 4740 }, { "epoch": 0.66, "learning_rate": 5.516103498144062e-06, "loss": 0.8196, "step": 4741 }, { "epoch": 0.66, "learning_rate": 5.5120826495897604e-06, "loss": 0.8306, "step": 4742 }, { "epoch": 0.66, "learning_rate": 5.508062709400692e-06, "loss": 0.8289, "step": 4743 }, { "epoch": 0.66, "learning_rate": 5.504043678390501e-06, "loss": 0.8496, "step": 4744 }, { "epoch": 0.66, "learning_rate": 5.500025557372656e-06, "loss": 0.8406, "step": 4745 }, { "epoch": 0.66, "learning_rate": 5.496008347160425e-06, "loss": 0.8635, "step": 4746 }, { "epoch": 0.66, "learning_rate": 5.491992048566911e-06, "loss": 0.8184, "step": 4747 }, { "epoch": 0.66, "learning_rate": 5.4879766624050165e-06, "loss": 0.6069, "step": 4748 }, { "epoch": 0.66, "learning_rate": 5.483962189487463e-06, "loss": 0.8203, "step": 4749 }, { "epoch": 0.66, "learning_rate": 5.479948630626795e-06, "loss": 0.7448, "step": 4750 }, { "epoch": 0.66, "learning_rate": 5.475935986635361e-06, "loss": 0.8313, "step": 4751 }, { "epoch": 0.66, "learning_rate": 5.471924258325338e-06, "loss": 0.8132, "step": 4752 }, { "epoch": 0.66, "learning_rate": 5.467913446508704e-06, "loss": 0.8435, "step": 4753 }, { "epoch": 0.66, "learning_rate": 5.463903551997252e-06, "loss": 0.7839, "step": 4754 }, { "epoch": 0.66, "learning_rate": 5.459894575602604e-06, "loss": 0.7742, "step": 4755 }, { "epoch": 0.66, "learning_rate": 5.455886518136178e-06, "loss": 0.8083, "step": 4756 }, { "epoch": 0.66, "learning_rate": 5.4518793804092215e-06, "loss": 0.8335, "step": 4757 }, { "epoch": 0.66, "learning_rate": 5.447873163232786e-06, "loss": 0.7271, "step": 4758 }, { "epoch": 0.66, "learning_rate": 5.443867867417737e-06, "loss": 0.8567, "step": 4759 }, { "epoch": 0.66, "learning_rate": 5.43986349377476e-06, "loss": 0.834, "step": 4760 }, { "epoch": 0.66, "learning_rate": 5.435860043114345e-06, "loss": 0.832, "step": 4761 }, { "epoch": 0.66, "learning_rate": 5.431857516246806e-06, "loss": 0.8125, "step": 4762 }, { "epoch": 0.66, "learning_rate": 5.4278559139822615e-06, "loss": 0.5735, "step": 4763 }, { "epoch": 0.66, "learning_rate": 5.423855237130642e-06, "loss": 0.8147, "step": 4764 }, { "epoch": 0.66, "learning_rate": 5.419855486501699e-06, "loss": 0.748, "step": 4765 }, { "epoch": 0.66, "learning_rate": 5.415856662904986e-06, "loss": 0.8524, "step": 4766 }, { "epoch": 0.66, "learning_rate": 5.411858767149882e-06, "loss": 0.8752, "step": 4767 }, { "epoch": 0.66, "learning_rate": 5.4078618000455685e-06, "loss": 0.8367, "step": 4768 }, { "epoch": 0.66, "learning_rate": 5.403865762401033e-06, "loss": 0.8596, "step": 4769 }, { "epoch": 0.66, "learning_rate": 5.399870655025095e-06, "loss": 0.8409, "step": 4770 }, { "epoch": 0.66, "learning_rate": 5.395876478726364e-06, "loss": 0.8655, "step": 4771 }, { "epoch": 0.66, "learning_rate": 5.39188323431328e-06, "loss": 0.8162, "step": 4772 }, { "epoch": 0.66, "learning_rate": 5.387890922594075e-06, "loss": 0.8354, "step": 4773 }, { "epoch": 0.66, "learning_rate": 5.383899544376814e-06, "loss": 0.8308, "step": 4774 }, { "epoch": 0.66, "learning_rate": 5.379909100469354e-06, "loss": 0.7766, "step": 4775 }, { "epoch": 0.66, "learning_rate": 5.375919591679368e-06, "loss": 0.8015, "step": 4776 }, { "epoch": 0.66, "learning_rate": 5.371931018814349e-06, "loss": 0.7853, "step": 4777 }, { "epoch": 0.66, "learning_rate": 5.367943382681589e-06, "loss": 0.8845, "step": 4778 }, { "epoch": 0.66, "learning_rate": 5.3639566840882e-06, "loss": 0.769, "step": 4779 }, { "epoch": 0.66, "learning_rate": 5.359970923841096e-06, "loss": 0.8206, "step": 4780 }, { "epoch": 0.66, "learning_rate": 5.355986102747e-06, "loss": 0.8052, "step": 4781 }, { "epoch": 0.66, "learning_rate": 5.352002221612459e-06, "loss": 0.8425, "step": 4782 }, { "epoch": 0.66, "learning_rate": 5.34801928124381e-06, "loss": 0.6016, "step": 4783 }, { "epoch": 0.66, "learning_rate": 5.344037282447221e-06, "loss": 0.8008, "step": 4784 }, { "epoch": 0.66, "learning_rate": 5.340056226028649e-06, "loss": 0.8115, "step": 4785 }, { "epoch": 0.66, "learning_rate": 5.336076112793871e-06, "loss": 0.7837, "step": 4786 }, { "epoch": 0.66, "learning_rate": 5.332096943548475e-06, "loss": 0.8911, "step": 4787 }, { "epoch": 0.67, "learning_rate": 5.328118719097849e-06, "loss": 0.8967, "step": 4788 }, { "epoch": 0.67, "learning_rate": 5.3241414402472014e-06, "loss": 0.7512, "step": 4789 }, { "epoch": 0.67, "learning_rate": 5.3201651078015406e-06, "loss": 0.7673, "step": 4790 }, { "epoch": 0.67, "learning_rate": 5.3161897225656814e-06, "loss": 0.8667, "step": 4791 }, { "epoch": 0.67, "learning_rate": 5.312215285344258e-06, "loss": 0.7632, "step": 4792 }, { "epoch": 0.67, "learning_rate": 5.3082417969417e-06, "loss": 0.842, "step": 4793 }, { "epoch": 0.67, "learning_rate": 5.304269258162258e-06, "loss": 0.6055, "step": 4794 }, { "epoch": 0.67, "learning_rate": 5.3002976698099784e-06, "loss": 0.856, "step": 4795 }, { "epoch": 0.67, "learning_rate": 5.296327032688718e-06, "loss": 0.8665, "step": 4796 }, { "epoch": 0.67, "learning_rate": 5.2923573476021505e-06, "loss": 0.8293, "step": 4797 }, { "epoch": 0.67, "learning_rate": 5.288388615353741e-06, "loss": 0.7695, "step": 4798 }, { "epoch": 0.67, "learning_rate": 5.284420836746779e-06, "loss": 0.7988, "step": 4799 }, { "epoch": 0.67, "learning_rate": 5.280454012584349e-06, "loss": 0.8088, "step": 4800 }, { "epoch": 0.67, "learning_rate": 5.276488143669341e-06, "loss": 0.8535, "step": 4801 }, { "epoch": 0.67, "learning_rate": 5.272523230804465e-06, "loss": 0.792, "step": 4802 }, { "epoch": 0.67, "learning_rate": 5.26855927479222e-06, "loss": 0.8582, "step": 4803 }, { "epoch": 0.67, "learning_rate": 5.264596276434928e-06, "loss": 0.8387, "step": 4804 }, { "epoch": 0.67, "learning_rate": 5.2606342365347075e-06, "loss": 0.8213, "step": 4805 }, { "epoch": 0.67, "learning_rate": 5.256673155893479e-06, "loss": 0.8525, "step": 4806 }, { "epoch": 0.67, "learning_rate": 5.252713035312982e-06, "loss": 0.8687, "step": 4807 }, { "epoch": 0.67, "learning_rate": 5.2487538755947485e-06, "loss": 0.7747, "step": 4808 }, { "epoch": 0.67, "learning_rate": 5.244795677540129e-06, "loss": 0.8313, "step": 4809 }, { "epoch": 0.67, "learning_rate": 5.2408384419502675e-06, "loss": 0.8101, "step": 4810 }, { "epoch": 0.67, "learning_rate": 5.236882169626116e-06, "loss": 0.8125, "step": 4811 }, { "epoch": 0.67, "learning_rate": 5.232926861368439e-06, "loss": 0.8164, "step": 4812 }, { "epoch": 0.67, "learning_rate": 5.228972517977794e-06, "loss": 0.8, "step": 4813 }, { "epoch": 0.67, "learning_rate": 5.225019140254557e-06, "loss": 0.8655, "step": 4814 }, { "epoch": 0.67, "learning_rate": 5.221066728998898e-06, "loss": 0.7444, "step": 4815 }, { "epoch": 0.67, "learning_rate": 5.21711528501079e-06, "loss": 0.5428, "step": 4816 }, { "epoch": 0.67, "learning_rate": 5.213164809090021e-06, "loss": 0.835, "step": 4817 }, { "epoch": 0.67, "learning_rate": 5.2092153020361715e-06, "loss": 0.5998, "step": 4818 }, { "epoch": 0.67, "learning_rate": 5.205266764648638e-06, "loss": 0.8047, "step": 4819 }, { "epoch": 0.67, "learning_rate": 5.201319197726608e-06, "loss": 0.6819, "step": 4820 }, { "epoch": 0.67, "learning_rate": 5.19737260206908e-06, "loss": 0.7792, "step": 4821 }, { "epoch": 0.67, "learning_rate": 5.1934269784748555e-06, "loss": 0.7468, "step": 4822 }, { "epoch": 0.67, "learning_rate": 5.189482327742536e-06, "loss": 0.864, "step": 4823 }, { "epoch": 0.67, "learning_rate": 5.185538650670534e-06, "loss": 0.8591, "step": 4824 }, { "epoch": 0.67, "learning_rate": 5.181595948057054e-06, "loss": 0.8042, "step": 4825 }, { "epoch": 0.67, "learning_rate": 5.177654220700106e-06, "loss": 0.7957, "step": 4826 }, { "epoch": 0.67, "learning_rate": 5.173713469397512e-06, "loss": 0.7546, "step": 4827 }, { "epoch": 0.67, "learning_rate": 5.169773694946883e-06, "loss": 0.8127, "step": 4828 }, { "epoch": 0.67, "learning_rate": 5.1658348981456455e-06, "loss": 0.8792, "step": 4829 }, { "epoch": 0.67, "learning_rate": 5.161897079791018e-06, "loss": 0.7201, "step": 4830 }, { "epoch": 0.67, "learning_rate": 5.15796024068002e-06, "loss": 0.8865, "step": 4831 }, { "epoch": 0.67, "learning_rate": 5.154024381609485e-06, "loss": 0.6699, "step": 4832 }, { "epoch": 0.67, "learning_rate": 5.150089503376033e-06, "loss": 0.8164, "step": 4833 }, { "epoch": 0.67, "learning_rate": 5.146155606776101e-06, "loss": 0.9062, "step": 4834 }, { "epoch": 0.67, "learning_rate": 5.142222692605913e-06, "loss": 0.821, "step": 4835 }, { "epoch": 0.67, "learning_rate": 5.1382907616615e-06, "loss": 0.874, "step": 4836 }, { "epoch": 0.67, "learning_rate": 5.1343598147387e-06, "loss": 0.7939, "step": 4837 }, { "epoch": 0.67, "learning_rate": 5.130429852633136e-06, "loss": 0.595, "step": 4838 }, { "epoch": 0.67, "learning_rate": 5.1265008761402544e-06, "loss": 0.7982, "step": 4839 }, { "epoch": 0.67, "learning_rate": 5.122572886055282e-06, "loss": 0.5967, "step": 4840 }, { "epoch": 0.67, "learning_rate": 5.11864588317325e-06, "loss": 0.7988, "step": 4841 }, { "epoch": 0.67, "learning_rate": 5.114719868289002e-06, "loss": 0.8296, "step": 4842 }, { "epoch": 0.67, "learning_rate": 5.1107948421971655e-06, "loss": 0.7803, "step": 4843 }, { "epoch": 0.67, "learning_rate": 5.106870805692181e-06, "loss": 0.8201, "step": 4844 }, { "epoch": 0.67, "learning_rate": 5.1029477595682795e-06, "loss": 0.7476, "step": 4845 }, { "epoch": 0.67, "learning_rate": 5.0990257046194935e-06, "loss": 0.8369, "step": 4846 }, { "epoch": 0.67, "learning_rate": 5.0951046416396614e-06, "loss": 0.8232, "step": 4847 }, { "epoch": 0.67, "learning_rate": 5.091184571422407e-06, "loss": 0.7742, "step": 4848 }, { "epoch": 0.67, "learning_rate": 5.087265494761173e-06, "loss": 0.8324, "step": 4849 }, { "epoch": 0.67, "learning_rate": 5.083347412449185e-06, "loss": 0.5969, "step": 4850 }, { "epoch": 0.67, "learning_rate": 5.079430325279467e-06, "loss": 0.7438, "step": 4851 }, { "epoch": 0.67, "learning_rate": 5.075514234044856e-06, "loss": 0.8496, "step": 4852 }, { "epoch": 0.67, "learning_rate": 5.07159913953797e-06, "loss": 0.8, "step": 4853 }, { "epoch": 0.67, "learning_rate": 5.067685042551242e-06, "loss": 0.7974, "step": 4854 }, { "epoch": 0.67, "learning_rate": 5.063771943876888e-06, "loss": 0.7976, "step": 4855 }, { "epoch": 0.67, "learning_rate": 5.059859844306928e-06, "loss": 0.5977, "step": 4856 }, { "epoch": 0.67, "learning_rate": 5.055948744633187e-06, "loss": 0.793, "step": 4857 }, { "epoch": 0.67, "learning_rate": 5.0520386456472725e-06, "loss": 0.8469, "step": 4858 }, { "epoch": 0.67, "learning_rate": 5.048129548140606e-06, "loss": 0.8467, "step": 4859 }, { "epoch": 0.68, "learning_rate": 5.044221452904394e-06, "loss": 0.807, "step": 4860 }, { "epoch": 0.68, "learning_rate": 5.040314360729641e-06, "loss": 0.8542, "step": 4861 }, { "epoch": 0.68, "learning_rate": 5.03640827240716e-06, "loss": 0.8237, "step": 4862 }, { "epoch": 0.68, "learning_rate": 5.032503188727544e-06, "loss": 0.8469, "step": 4863 }, { "epoch": 0.68, "learning_rate": 5.0285991104812e-06, "loss": 0.8201, "step": 4864 }, { "epoch": 0.68, "learning_rate": 5.024696038458319e-06, "loss": 0.8055, "step": 4865 }, { "epoch": 0.68, "learning_rate": 5.020793973448887e-06, "loss": 0.7661, "step": 4866 }, { "epoch": 0.68, "learning_rate": 5.016892916242699e-06, "loss": 0.8745, "step": 4867 }, { "epoch": 0.68, "learning_rate": 5.0129928676293325e-06, "loss": 0.8086, "step": 4868 }, { "epoch": 0.68, "learning_rate": 5.0090938283981725e-06, "loss": 0.8552, "step": 4869 }, { "epoch": 0.68, "learning_rate": 5.005195799338392e-06, "loss": 0.7496, "step": 4870 }, { "epoch": 0.68, "learning_rate": 5.001298781238954e-06, "loss": 0.832, "step": 4871 }, { "epoch": 0.68, "learning_rate": 4.997402774888636e-06, "loss": 0.7917, "step": 4872 }, { "epoch": 0.68, "learning_rate": 4.993507781075989e-06, "loss": 0.8633, "step": 4873 }, { "epoch": 0.68, "learning_rate": 4.989613800589378e-06, "loss": 0.8252, "step": 4874 }, { "epoch": 0.68, "learning_rate": 4.985720834216949e-06, "loss": 0.8804, "step": 4875 }, { "epoch": 0.68, "learning_rate": 4.981828882746644e-06, "loss": 0.771, "step": 4876 }, { "epoch": 0.68, "learning_rate": 4.977937946966213e-06, "loss": 0.8013, "step": 4877 }, { "epoch": 0.68, "learning_rate": 4.974048027663181e-06, "loss": 0.8201, "step": 4878 }, { "epoch": 0.68, "learning_rate": 4.970159125624885e-06, "loss": 0.8184, "step": 4879 }, { "epoch": 0.68, "learning_rate": 4.966271241638444e-06, "loss": 0.7754, "step": 4880 }, { "epoch": 0.68, "learning_rate": 4.962384376490772e-06, "loss": 0.3868, "step": 4881 }, { "epoch": 0.68, "learning_rate": 4.958498530968588e-06, "loss": 0.824, "step": 4882 }, { "epoch": 0.68, "learning_rate": 4.954613705858387e-06, "loss": 0.8147, "step": 4883 }, { "epoch": 0.68, "learning_rate": 4.950729901946476e-06, "loss": 0.8494, "step": 4884 }, { "epoch": 0.68, "learning_rate": 4.946847120018942e-06, "loss": 0.7913, "step": 4885 }, { "epoch": 0.68, "learning_rate": 4.942965360861664e-06, "loss": 0.8096, "step": 4886 }, { "epoch": 0.68, "learning_rate": 4.93908462526033e-06, "loss": 0.8479, "step": 4887 }, { "epoch": 0.68, "learning_rate": 4.935204914000401e-06, "loss": 0.8276, "step": 4888 }, { "epoch": 0.68, "learning_rate": 4.931326227867147e-06, "loss": 0.7903, "step": 4889 }, { "epoch": 0.68, "learning_rate": 4.9274485676456205e-06, "loss": 0.8152, "step": 4890 }, { "epoch": 0.68, "learning_rate": 4.923571934120665e-06, "loss": 0.7573, "step": 4891 }, { "epoch": 0.68, "learning_rate": 4.9196963280769274e-06, "loss": 0.8921, "step": 4892 }, { "epoch": 0.68, "learning_rate": 4.915821750298834e-06, "loss": 0.8159, "step": 4893 }, { "epoch": 0.68, "learning_rate": 4.911948201570613e-06, "loss": 0.5787, "step": 4894 }, { "epoch": 0.68, "learning_rate": 4.908075682676276e-06, "loss": 0.8257, "step": 4895 }, { "epoch": 0.68, "learning_rate": 4.904204194399635e-06, "loss": 0.8596, "step": 4896 }, { "epoch": 0.68, "learning_rate": 4.9003337375242865e-06, "loss": 0.5833, "step": 4897 }, { "epoch": 0.68, "learning_rate": 4.896464312833616e-06, "loss": 0.8867, "step": 4898 }, { "epoch": 0.68, "learning_rate": 4.892595921110811e-06, "loss": 0.8433, "step": 4899 }, { "epoch": 0.68, "learning_rate": 4.888728563138836e-06, "loss": 0.7712, "step": 4900 }, { "epoch": 0.68, "learning_rate": 4.884862239700462e-06, "loss": 0.8501, "step": 4901 }, { "epoch": 0.68, "learning_rate": 4.880996951578237e-06, "loss": 0.8186, "step": 4902 }, { "epoch": 0.68, "learning_rate": 4.877132699554502e-06, "loss": 0.5768, "step": 4903 }, { "epoch": 0.68, "learning_rate": 4.873269484411398e-06, "loss": 0.8013, "step": 4904 }, { "epoch": 0.68, "learning_rate": 4.869407306930841e-06, "loss": 0.8073, "step": 4905 }, { "epoch": 0.68, "learning_rate": 4.865546167894554e-06, "loss": 0.8496, "step": 4906 }, { "epoch": 0.68, "learning_rate": 4.861686068084035e-06, "loss": 0.8223, "step": 4907 }, { "epoch": 0.68, "learning_rate": 4.857827008280575e-06, "loss": 0.874, "step": 4908 }, { "epoch": 0.68, "learning_rate": 4.853968989265264e-06, "loss": 0.8772, "step": 4909 }, { "epoch": 0.68, "learning_rate": 4.850112011818967e-06, "loss": 0.8564, "step": 4910 }, { "epoch": 0.68, "learning_rate": 4.846256076722353e-06, "loss": 0.8425, "step": 4911 }, { "epoch": 0.68, "learning_rate": 4.842401184755868e-06, "loss": 0.8652, "step": 4912 }, { "epoch": 0.68, "learning_rate": 4.838547336699749e-06, "loss": 0.5214, "step": 4913 }, { "epoch": 0.68, "learning_rate": 4.834694533334031e-06, "loss": 0.636, "step": 4914 }, { "epoch": 0.68, "learning_rate": 4.830842775438524e-06, "loss": 0.772, "step": 4915 }, { "epoch": 0.68, "learning_rate": 4.826992063792838e-06, "loss": 0.7584, "step": 4916 }, { "epoch": 0.68, "learning_rate": 4.823142399176365e-06, "loss": 0.8372, "step": 4917 }, { "epoch": 0.68, "learning_rate": 4.819293782368282e-06, "loss": 0.8145, "step": 4918 }, { "epoch": 0.68, "learning_rate": 4.815446214147565e-06, "loss": 0.8518, "step": 4919 }, { "epoch": 0.68, "learning_rate": 4.811599695292963e-06, "loss": 0.8201, "step": 4920 }, { "epoch": 0.68, "learning_rate": 4.807754226583031e-06, "loss": 0.8433, "step": 4921 }, { "epoch": 0.68, "learning_rate": 4.803909808796095e-06, "loss": 0.8428, "step": 4922 }, { "epoch": 0.68, "learning_rate": 4.80006644271027e-06, "loss": 0.6147, "step": 4923 }, { "epoch": 0.68, "learning_rate": 4.796224129103472e-06, "loss": 0.8489, "step": 4924 }, { "epoch": 0.68, "learning_rate": 4.792382868753387e-06, "loss": 0.8569, "step": 4925 }, { "epoch": 0.68, "learning_rate": 4.788542662437501e-06, "loss": 0.8171, "step": 4926 }, { "epoch": 0.68, "learning_rate": 4.7847035109330774e-06, "loss": 0.9216, "step": 4927 }, { "epoch": 0.68, "learning_rate": 4.7808654150171675e-06, "loss": 0.8179, "step": 4928 }, { "epoch": 0.68, "learning_rate": 4.777028375466618e-06, "loss": 0.9023, "step": 4929 }, { "epoch": 0.68, "learning_rate": 4.773192393058047e-06, "loss": 0.8052, "step": 4930 }, { "epoch": 0.68, "learning_rate": 4.7693574685678745e-06, "loss": 0.8247, "step": 4931 }, { "epoch": 0.69, "learning_rate": 4.765523602772294e-06, "loss": 0.803, "step": 4932 }, { "epoch": 0.69, "learning_rate": 4.761690796447286e-06, "loss": 0.6368, "step": 4933 }, { "epoch": 0.69, "learning_rate": 4.757859050368627e-06, "loss": 0.7793, "step": 4934 }, { "epoch": 0.69, "learning_rate": 4.754028365311865e-06, "loss": 0.825, "step": 4935 }, { "epoch": 0.69, "learning_rate": 4.7501987420523455e-06, "loss": 0.7986, "step": 4936 }, { "epoch": 0.69, "learning_rate": 4.74637018136519e-06, "loss": 0.8376, "step": 4937 }, { "epoch": 0.69, "learning_rate": 4.742542684025305e-06, "loss": 0.7864, "step": 4938 }, { "epoch": 0.69, "learning_rate": 4.738716250807395e-06, "loss": 0.7634, "step": 4939 }, { "epoch": 0.69, "learning_rate": 4.7348908824859275e-06, "loss": 0.7654, "step": 4940 }, { "epoch": 0.69, "learning_rate": 4.731066579835177e-06, "loss": 0.78, "step": 4941 }, { "epoch": 0.69, "learning_rate": 4.727243343629187e-06, "loss": 0.7373, "step": 4942 }, { "epoch": 0.69, "learning_rate": 4.723421174641784e-06, "loss": 0.8381, "step": 4943 }, { "epoch": 0.69, "learning_rate": 4.719600073646594e-06, "loss": 0.825, "step": 4944 }, { "epoch": 0.69, "learning_rate": 4.7157800414170084e-06, "loss": 0.801, "step": 4945 }, { "epoch": 0.69, "learning_rate": 4.711961078726219e-06, "loss": 0.8682, "step": 4946 }, { "epoch": 0.69, "learning_rate": 4.708143186347189e-06, "loss": 0.8491, "step": 4947 }, { "epoch": 0.69, "learning_rate": 4.704326365052666e-06, "loss": 0.908, "step": 4948 }, { "epoch": 0.69, "learning_rate": 4.700510615615189e-06, "loss": 0.7546, "step": 4949 }, { "epoch": 0.69, "learning_rate": 4.69669593880707e-06, "loss": 0.8108, "step": 4950 }, { "epoch": 0.69, "learning_rate": 4.692882335400415e-06, "loss": 0.821, "step": 4951 }, { "epoch": 0.69, "learning_rate": 4.6890698061671015e-06, "loss": 0.8029, "step": 4952 }, { "epoch": 0.69, "learning_rate": 4.685258351878793e-06, "loss": 0.8413, "step": 4953 }, { "epoch": 0.69, "learning_rate": 4.681447973306944e-06, "loss": 0.7622, "step": 4954 }, { "epoch": 0.69, "learning_rate": 4.677638671222775e-06, "loss": 0.8672, "step": 4955 }, { "epoch": 0.69, "learning_rate": 4.673830446397308e-06, "loss": 0.8472, "step": 4956 }, { "epoch": 0.69, "learning_rate": 4.670023299601332e-06, "loss": 0.8401, "step": 4957 }, { "epoch": 0.69, "learning_rate": 4.6662172316054175e-06, "loss": 0.8069, "step": 4958 }, { "epoch": 0.69, "learning_rate": 4.662412243179931e-06, "loss": 0.8228, "step": 4959 }, { "epoch": 0.69, "learning_rate": 4.658608335095003e-06, "loss": 0.8159, "step": 4960 }, { "epoch": 0.69, "learning_rate": 4.6548055081205615e-06, "loss": 0.8142, "step": 4961 }, { "epoch": 0.69, "learning_rate": 4.651003763026304e-06, "loss": 0.8484, "step": 4962 }, { "epoch": 0.69, "learning_rate": 4.647203100581708e-06, "loss": 0.7781, "step": 4963 }, { "epoch": 0.69, "learning_rate": 4.643403521556047e-06, "loss": 0.8735, "step": 4964 }, { "epoch": 0.69, "learning_rate": 4.639605026718355e-06, "loss": 0.8398, "step": 4965 }, { "epoch": 0.69, "learning_rate": 4.635807616837464e-06, "loss": 0.8569, "step": 4966 }, { "epoch": 0.69, "learning_rate": 4.632011292681976e-06, "loss": 0.7971, "step": 4967 }, { "epoch": 0.69, "learning_rate": 4.628216055020272e-06, "loss": 0.78, "step": 4968 }, { "epoch": 0.69, "learning_rate": 4.624421904620525e-06, "loss": 0.8018, "step": 4969 }, { "epoch": 0.69, "learning_rate": 4.620628842250673e-06, "loss": 0.8589, "step": 4970 }, { "epoch": 0.69, "learning_rate": 4.616836868678447e-06, "loss": 0.8455, "step": 4971 }, { "epoch": 0.69, "learning_rate": 4.613045984671349e-06, "loss": 0.761, "step": 4972 }, { "epoch": 0.69, "learning_rate": 4.609256190996657e-06, "loss": 0.598, "step": 4973 }, { "epoch": 0.69, "learning_rate": 4.6054674884214455e-06, "loss": 0.8049, "step": 4974 }, { "epoch": 0.69, "learning_rate": 4.601679877712548e-06, "loss": 0.803, "step": 4975 }, { "epoch": 0.69, "learning_rate": 4.5978933596365925e-06, "loss": 0.7319, "step": 4976 }, { "epoch": 0.69, "learning_rate": 4.594107934959976e-06, "loss": 0.8456, "step": 4977 }, { "epoch": 0.69, "learning_rate": 4.5903236044488745e-06, "loss": 0.791, "step": 4978 }, { "epoch": 0.69, "learning_rate": 4.586540368869252e-06, "loss": 0.7874, "step": 4979 }, { "epoch": 0.69, "learning_rate": 4.582758228986839e-06, "loss": 0.8584, "step": 4980 }, { "epoch": 0.69, "learning_rate": 4.578977185567154e-06, "loss": 0.8215, "step": 4981 }, { "epoch": 0.69, "learning_rate": 4.5751972393754885e-06, "loss": 0.8901, "step": 4982 }, { "epoch": 0.69, "learning_rate": 4.571418391176907e-06, "loss": 0.8052, "step": 4983 }, { "epoch": 0.69, "learning_rate": 4.567640641736266e-06, "loss": 0.7888, "step": 4984 }, { "epoch": 0.69, "learning_rate": 4.563863991818183e-06, "loss": 0.7357, "step": 4985 }, { "epoch": 0.69, "learning_rate": 4.560088442187068e-06, "loss": 0.8828, "step": 4986 }, { "epoch": 0.69, "learning_rate": 4.5563139936071e-06, "loss": 0.842, "step": 4987 }, { "epoch": 0.69, "learning_rate": 4.55254064684223e-06, "loss": 0.5753, "step": 4988 }, { "epoch": 0.69, "learning_rate": 4.5487684026562006e-06, "loss": 0.8729, "step": 4989 }, { "epoch": 0.69, "learning_rate": 4.544997261812516e-06, "loss": 0.5938, "step": 4990 }, { "epoch": 0.69, "learning_rate": 4.54122722507447e-06, "loss": 0.8589, "step": 4991 }, { "epoch": 0.69, "learning_rate": 4.537458293205127e-06, "loss": 0.8074, "step": 4992 }, { "epoch": 0.69, "learning_rate": 4.533690466967321e-06, "loss": 0.8481, "step": 4993 }, { "epoch": 0.69, "learning_rate": 4.529923747123678e-06, "loss": 0.7764, "step": 4994 }, { "epoch": 0.69, "learning_rate": 4.526158134436583e-06, "loss": 0.8667, "step": 4995 }, { "epoch": 0.69, "learning_rate": 4.522393629668211e-06, "loss": 0.7993, "step": 4996 }, { "epoch": 0.69, "learning_rate": 4.5186302335805065e-06, "loss": 0.7771, "step": 4997 }, { "epoch": 0.69, "learning_rate": 4.514867946935184e-06, "loss": 0.8335, "step": 4998 }, { "epoch": 0.69, "learning_rate": 4.511106770493746e-06, "loss": 0.8188, "step": 4999 }, { "epoch": 0.69, "learning_rate": 4.507346705017459e-06, "loss": 0.6357, "step": 5000 }, { "epoch": 0.69, "learning_rate": 4.503587751267374e-06, "loss": 0.8257, "step": 5001 }, { "epoch": 0.69, "learning_rate": 4.49982991000431e-06, "loss": 0.8066, "step": 5002 }, { "epoch": 0.69, "learning_rate": 4.4960731819888585e-06, "loss": 0.8392, "step": 5003 }, { "epoch": 0.7, "learning_rate": 4.492317567981398e-06, "loss": 0.8408, "step": 5004 }, { "epoch": 0.7, "learning_rate": 4.488563068742067e-06, "loss": 0.7789, "step": 5005 }, { "epoch": 0.7, "learning_rate": 4.484809685030792e-06, "loss": 0.8115, "step": 5006 }, { "epoch": 0.7, "learning_rate": 4.481057417607263e-06, "loss": 0.5941, "step": 5007 }, { "epoch": 0.7, "learning_rate": 4.477306267230944e-06, "loss": 0.7153, "step": 5008 }, { "epoch": 0.7, "learning_rate": 4.4735562346610864e-06, "loss": 0.8301, "step": 5009 }, { "epoch": 0.7, "learning_rate": 4.469807320656695e-06, "loss": 0.811, "step": 5010 }, { "epoch": 0.7, "learning_rate": 4.466059525976568e-06, "loss": 0.8384, "step": 5011 }, { "epoch": 0.7, "learning_rate": 4.462312851379261e-06, "loss": 0.8201, "step": 5012 }, { "epoch": 0.7, "learning_rate": 4.4585672976231175e-06, "loss": 0.6046, "step": 5013 }, { "epoch": 0.7, "learning_rate": 4.454822865466242e-06, "loss": 0.8423, "step": 5014 }, { "epoch": 0.7, "learning_rate": 4.451079555666512e-06, "loss": 0.8279, "step": 5015 }, { "epoch": 0.7, "learning_rate": 4.447337368981592e-06, "loss": 0.7985, "step": 5016 }, { "epoch": 0.7, "learning_rate": 4.443596306168901e-06, "loss": 0.844, "step": 5017 }, { "epoch": 0.7, "learning_rate": 4.439856367985648e-06, "loss": 0.5465, "step": 5018 }, { "epoch": 0.7, "learning_rate": 4.4361175551887994e-06, "loss": 0.7729, "step": 5019 }, { "epoch": 0.7, "learning_rate": 4.432379868535096e-06, "loss": 0.5782, "step": 5020 }, { "epoch": 0.7, "learning_rate": 4.4286433087810646e-06, "loss": 0.7648, "step": 5021 }, { "epoch": 0.7, "learning_rate": 4.424907876682985e-06, "loss": 0.8474, "step": 5022 }, { "epoch": 0.7, "learning_rate": 4.421173572996923e-06, "loss": 0.8723, "step": 5023 }, { "epoch": 0.7, "learning_rate": 4.4174403984787105e-06, "loss": 0.761, "step": 5024 }, { "epoch": 0.7, "learning_rate": 4.413708353883946e-06, "loss": 0.8149, "step": 5025 }, { "epoch": 0.7, "learning_rate": 4.4099774399680106e-06, "loss": 0.8315, "step": 5026 }, { "epoch": 0.7, "learning_rate": 4.406247657486043e-06, "loss": 0.7722, "step": 5027 }, { "epoch": 0.7, "learning_rate": 4.402519007192969e-06, "loss": 0.819, "step": 5028 }, { "epoch": 0.7, "learning_rate": 4.398791489843471e-06, "loss": 0.7939, "step": 5029 }, { "epoch": 0.7, "learning_rate": 4.395065106192006e-06, "loss": 0.7732, "step": 5030 }, { "epoch": 0.7, "learning_rate": 4.391339856992808e-06, "loss": 0.8606, "step": 5031 }, { "epoch": 0.7, "learning_rate": 4.387615742999869e-06, "loss": 0.7743, "step": 5032 }, { "epoch": 0.7, "learning_rate": 4.383892764966969e-06, "loss": 0.8147, "step": 5033 }, { "epoch": 0.7, "learning_rate": 4.380170923647639e-06, "loss": 0.7865, "step": 5034 }, { "epoch": 0.7, "learning_rate": 4.37645021979519e-06, "loss": 0.8711, "step": 5035 }, { "epoch": 0.7, "learning_rate": 4.372730654162706e-06, "loss": 0.8347, "step": 5036 }, { "epoch": 0.7, "learning_rate": 4.369012227503028e-06, "loss": 0.803, "step": 5037 }, { "epoch": 0.7, "learning_rate": 4.365294940568784e-06, "loss": 0.7788, "step": 5038 }, { "epoch": 0.7, "learning_rate": 4.361578794112357e-06, "loss": 0.7898, "step": 5039 }, { "epoch": 0.7, "learning_rate": 4.3578637888859e-06, "loss": 0.8247, "step": 5040 }, { "epoch": 0.7, "learning_rate": 4.354149925641348e-06, "loss": 0.8174, "step": 5041 }, { "epoch": 0.7, "learning_rate": 4.3504372051303855e-06, "loss": 0.6677, "step": 5042 }, { "epoch": 0.7, "learning_rate": 4.346725628104485e-06, "loss": 0.895, "step": 5043 }, { "epoch": 0.7, "learning_rate": 4.343015195314877e-06, "loss": 0.8014, "step": 5044 }, { "epoch": 0.7, "learning_rate": 4.3393059075125545e-06, "loss": 0.8132, "step": 5045 }, { "epoch": 0.7, "learning_rate": 4.335597765448296e-06, "loss": 0.7502, "step": 5046 }, { "epoch": 0.7, "learning_rate": 4.33189076987263e-06, "loss": 0.814, "step": 5047 }, { "epoch": 0.7, "learning_rate": 4.32818492153587e-06, "loss": 0.8357, "step": 5048 }, { "epoch": 0.7, "learning_rate": 4.324480221188083e-06, "loss": 0.8599, "step": 5049 }, { "epoch": 0.7, "learning_rate": 4.3207766695791064e-06, "loss": 0.8477, "step": 5050 }, { "epoch": 0.7, "learning_rate": 4.317074267458555e-06, "loss": 0.8091, "step": 5051 }, { "epoch": 0.7, "learning_rate": 4.313373015575798e-06, "loss": 0.7581, "step": 5052 }, { "epoch": 0.7, "learning_rate": 4.309672914679984e-06, "loss": 0.6003, "step": 5053 }, { "epoch": 0.7, "learning_rate": 4.305973965520018e-06, "loss": 0.8638, "step": 5054 }, { "epoch": 0.7, "learning_rate": 4.302276168844573e-06, "loss": 0.8586, "step": 5055 }, { "epoch": 0.7, "learning_rate": 4.2985795254021e-06, "loss": 0.8384, "step": 5056 }, { "epoch": 0.7, "learning_rate": 4.2948840359407994e-06, "loss": 0.8193, "step": 5057 }, { "epoch": 0.7, "learning_rate": 4.291189701208656e-06, "loss": 0.7745, "step": 5058 }, { "epoch": 0.7, "learning_rate": 4.287496521953408e-06, "loss": 0.8052, "step": 5059 }, { "epoch": 0.7, "learning_rate": 4.28380449892256e-06, "loss": 0.8657, "step": 5060 }, { "epoch": 0.7, "learning_rate": 4.280113632863393e-06, "loss": 0.6035, "step": 5061 }, { "epoch": 0.7, "learning_rate": 4.276423924522941e-06, "loss": 0.7971, "step": 5062 }, { "epoch": 0.7, "learning_rate": 4.272735374648016e-06, "loss": 0.8004, "step": 5063 }, { "epoch": 0.7, "learning_rate": 4.269047983985188e-06, "loss": 0.8513, "step": 5064 }, { "epoch": 0.7, "learning_rate": 4.265361753280786e-06, "loss": 0.8579, "step": 5065 }, { "epoch": 0.7, "learning_rate": 4.261676683280922e-06, "loss": 0.8286, "step": 5066 }, { "epoch": 0.7, "learning_rate": 4.257992774731459e-06, "loss": 0.8101, "step": 5067 }, { "epoch": 0.7, "learning_rate": 4.254310028378026e-06, "loss": 0.8367, "step": 5068 }, { "epoch": 0.7, "learning_rate": 4.250628444966025e-06, "loss": 0.7854, "step": 5069 }, { "epoch": 0.7, "learning_rate": 4.2469480252406116e-06, "loss": 0.8193, "step": 5070 }, { "epoch": 0.7, "learning_rate": 4.243268769946718e-06, "loss": 0.7683, "step": 5071 }, { "epoch": 0.7, "learning_rate": 4.2395906798290324e-06, "loss": 0.9045, "step": 5072 }, { "epoch": 0.7, "learning_rate": 4.235913755632003e-06, "loss": 0.777, "step": 5073 }, { "epoch": 0.7, "learning_rate": 4.232237998099857e-06, "loss": 0.8313, "step": 5074 }, { "epoch": 0.7, "learning_rate": 4.228563407976568e-06, "loss": 0.609, "step": 5075 }, { "epoch": 0.71, "learning_rate": 4.22488998600589e-06, "loss": 0.8323, "step": 5076 }, { "epoch": 0.71, "learning_rate": 4.221217732931329e-06, "loss": 0.8672, "step": 5077 }, { "epoch": 0.71, "learning_rate": 4.217546649496154e-06, "loss": 0.8223, "step": 5078 }, { "epoch": 0.71, "learning_rate": 4.213876736443407e-06, "loss": 0.8718, "step": 5079 }, { "epoch": 0.71, "learning_rate": 4.210207994515883e-06, "loss": 0.8198, "step": 5080 }, { "epoch": 0.71, "learning_rate": 4.206540424456147e-06, "loss": 0.8369, "step": 5081 }, { "epoch": 0.71, "learning_rate": 4.202874027006525e-06, "loss": 0.5757, "step": 5082 }, { "epoch": 0.71, "learning_rate": 4.199208802909098e-06, "loss": 0.8542, "step": 5083 }, { "epoch": 0.71, "learning_rate": 4.195544752905724e-06, "loss": 0.7947, "step": 5084 }, { "epoch": 0.71, "learning_rate": 4.19188187773801e-06, "loss": 0.8354, "step": 5085 }, { "epoch": 0.71, "learning_rate": 4.1882201781473356e-06, "loss": 0.7844, "step": 5086 }, { "epoch": 0.71, "learning_rate": 4.184559654874834e-06, "loss": 0.8474, "step": 5087 }, { "epoch": 0.71, "learning_rate": 4.180900308661402e-06, "loss": 0.8027, "step": 5088 }, { "epoch": 0.71, "learning_rate": 4.177242140247707e-06, "loss": 0.7561, "step": 5089 }, { "epoch": 0.71, "learning_rate": 4.1735851503741665e-06, "loss": 0.8708, "step": 5090 }, { "epoch": 0.71, "learning_rate": 4.1699293397809605e-06, "loss": 0.804, "step": 5091 }, { "epoch": 0.71, "learning_rate": 4.166274709208041e-06, "loss": 0.6241, "step": 5092 }, { "epoch": 0.71, "learning_rate": 4.162621259395108e-06, "loss": 0.8513, "step": 5093 }, { "epoch": 0.71, "learning_rate": 4.158968991081633e-06, "loss": 0.8359, "step": 5094 }, { "epoch": 0.71, "learning_rate": 4.155317905006844e-06, "loss": 0.8096, "step": 5095 }, { "epoch": 0.71, "learning_rate": 4.151668001909723e-06, "loss": 0.7698, "step": 5096 }, { "epoch": 0.71, "learning_rate": 4.148019282529029e-06, "loss": 0.8625, "step": 5097 }, { "epoch": 0.71, "learning_rate": 4.144371747603261e-06, "loss": 0.839, "step": 5098 }, { "epoch": 0.71, "learning_rate": 4.140725397870699e-06, "loss": 0.8291, "step": 5099 }, { "epoch": 0.71, "learning_rate": 4.137080234069368e-06, "loss": 0.8494, "step": 5100 }, { "epoch": 0.71, "learning_rate": 4.1334362569370525e-06, "loss": 0.7773, "step": 5101 }, { "epoch": 0.71, "learning_rate": 4.129793467211313e-06, "loss": 0.8083, "step": 5102 }, { "epoch": 0.71, "learning_rate": 4.126151865629449e-06, "loss": 0.8174, "step": 5103 }, { "epoch": 0.71, "learning_rate": 4.122511452928538e-06, "loss": 0.7188, "step": 5104 }, { "epoch": 0.71, "learning_rate": 4.118872229845405e-06, "loss": 0.759, "step": 5105 }, { "epoch": 0.71, "learning_rate": 4.115234197116633e-06, "loss": 0.5805, "step": 5106 }, { "epoch": 0.71, "learning_rate": 4.111597355478575e-06, "loss": 0.5839, "step": 5107 }, { "epoch": 0.71, "learning_rate": 4.1079617056673305e-06, "loss": 0.808, "step": 5108 }, { "epoch": 0.71, "learning_rate": 4.104327248418771e-06, "loss": 0.8022, "step": 5109 }, { "epoch": 0.71, "learning_rate": 4.100693984468515e-06, "loss": 0.5996, "step": 5110 }, { "epoch": 0.71, "learning_rate": 4.097061914551941e-06, "loss": 0.804, "step": 5111 }, { "epoch": 0.71, "learning_rate": 4.093431039404194e-06, "loss": 0.7692, "step": 5112 }, { "epoch": 0.71, "learning_rate": 4.08980135976017e-06, "loss": 0.7661, "step": 5113 }, { "epoch": 0.71, "learning_rate": 4.0861728763545225e-06, "loss": 0.7942, "step": 5114 }, { "epoch": 0.71, "learning_rate": 4.0825455899216705e-06, "loss": 0.7867, "step": 5115 }, { "epoch": 0.71, "learning_rate": 4.078919501195777e-06, "loss": 0.8625, "step": 5116 }, { "epoch": 0.71, "learning_rate": 4.075294610910782e-06, "loss": 0.8237, "step": 5117 }, { "epoch": 0.71, "learning_rate": 4.071670919800364e-06, "loss": 0.7766, "step": 5118 }, { "epoch": 0.71, "learning_rate": 4.068048428597969e-06, "loss": 0.7966, "step": 5119 }, { "epoch": 0.71, "learning_rate": 4.064427138036798e-06, "loss": 0.8269, "step": 5120 }, { "epoch": 0.71, "learning_rate": 4.0608070488498064e-06, "loss": 0.8472, "step": 5121 }, { "epoch": 0.71, "learning_rate": 4.057188161769716e-06, "loss": 0.8347, "step": 5122 }, { "epoch": 0.71, "learning_rate": 4.053570477528993e-06, "loss": 0.587, "step": 5123 }, { "epoch": 0.71, "learning_rate": 4.049953996859862e-06, "loss": 0.7454, "step": 5124 }, { "epoch": 0.71, "learning_rate": 4.046338720494315e-06, "loss": 0.7966, "step": 5125 }, { "epoch": 0.71, "learning_rate": 4.042724649164086e-06, "loss": 0.8281, "step": 5126 }, { "epoch": 0.71, "learning_rate": 4.039111783600678e-06, "loss": 0.8464, "step": 5127 }, { "epoch": 0.71, "learning_rate": 4.03550012453534e-06, "loss": 0.8391, "step": 5128 }, { "epoch": 0.71, "learning_rate": 4.031889672699077e-06, "loss": 0.835, "step": 5129 }, { "epoch": 0.71, "learning_rate": 4.028280428822661e-06, "loss": 0.817, "step": 5130 }, { "epoch": 0.71, "learning_rate": 4.024672393636604e-06, "loss": 0.7612, "step": 5131 }, { "epoch": 0.71, "learning_rate": 4.021065567871187e-06, "loss": 0.7942, "step": 5132 }, { "epoch": 0.71, "learning_rate": 4.017459952256438e-06, "loss": 0.8855, "step": 5133 }, { "epoch": 0.71, "learning_rate": 4.0138555475221395e-06, "loss": 0.8057, "step": 5134 }, { "epoch": 0.71, "learning_rate": 4.010252354397836e-06, "loss": 0.7612, "step": 5135 }, { "epoch": 0.71, "learning_rate": 4.006650373612823e-06, "loss": 0.8044, "step": 5136 }, { "epoch": 0.71, "learning_rate": 4.003049605896141e-06, "loss": 0.7659, "step": 5137 }, { "epoch": 0.71, "learning_rate": 3.999450051976606e-06, "loss": 0.7732, "step": 5138 }, { "epoch": 0.71, "learning_rate": 3.995851712582767e-06, "loss": 0.786, "step": 5139 }, { "epoch": 0.71, "learning_rate": 3.992254588442943e-06, "loss": 0.7898, "step": 5140 }, { "epoch": 0.71, "learning_rate": 3.988658680285199e-06, "loss": 0.8391, "step": 5141 }, { "epoch": 0.71, "learning_rate": 3.985063988837351e-06, "loss": 0.8508, "step": 5142 }, { "epoch": 0.71, "learning_rate": 3.98147051482698e-06, "loss": 0.7998, "step": 5143 }, { "epoch": 0.71, "learning_rate": 3.977878258981407e-06, "loss": 0.7786, "step": 5144 }, { "epoch": 0.71, "learning_rate": 3.97428722202772e-06, "loss": 0.8523, "step": 5145 }, { "epoch": 0.71, "learning_rate": 3.9706974046927496e-06, "loss": 0.8828, "step": 5146 }, { "epoch": 0.71, "learning_rate": 3.96710880770308e-06, "loss": 0.5997, "step": 5147 }, { "epoch": 0.72, "learning_rate": 3.96352143178506e-06, "loss": 0.6031, "step": 5148 }, { "epoch": 0.72, "learning_rate": 3.959935277664775e-06, "loss": 0.8274, "step": 5149 }, { "epoch": 0.72, "learning_rate": 3.956350346068079e-06, "loss": 0.7942, "step": 5150 }, { "epoch": 0.72, "learning_rate": 3.9527666377205655e-06, "loss": 0.8242, "step": 5151 }, { "epoch": 0.72, "learning_rate": 3.949184153347584e-06, "loss": 0.8186, "step": 5152 }, { "epoch": 0.72, "learning_rate": 3.945602893674245e-06, "loss": 0.7695, "step": 5153 }, { "epoch": 0.72, "learning_rate": 3.942022859425397e-06, "loss": 0.833, "step": 5154 }, { "epoch": 0.72, "learning_rate": 3.938444051325652e-06, "loss": 0.7964, "step": 5155 }, { "epoch": 0.72, "learning_rate": 3.934866470099368e-06, "loss": 0.8386, "step": 5156 }, { "epoch": 0.72, "learning_rate": 3.931290116470653e-06, "loss": 0.7822, "step": 5157 }, { "epoch": 0.72, "learning_rate": 3.927714991163376e-06, "loss": 0.8508, "step": 5158 }, { "epoch": 0.72, "learning_rate": 3.924141094901143e-06, "loss": 0.8014, "step": 5159 }, { "epoch": 0.72, "learning_rate": 3.920568428407328e-06, "loss": 0.5453, "step": 5160 }, { "epoch": 0.72, "learning_rate": 3.916996992405041e-06, "loss": 0.8347, "step": 5161 }, { "epoch": 0.72, "learning_rate": 3.9134267876171494e-06, "loss": 0.5541, "step": 5162 }, { "epoch": 0.72, "learning_rate": 3.909857814766274e-06, "loss": 0.8201, "step": 5163 }, { "epoch": 0.72, "learning_rate": 3.906290074574781e-06, "loss": 0.79, "step": 5164 }, { "epoch": 0.72, "learning_rate": 3.902723567764793e-06, "loss": 0.5205, "step": 5165 }, { "epoch": 0.72, "learning_rate": 3.8991582950581775e-06, "loss": 0.8147, "step": 5166 }, { "epoch": 0.72, "learning_rate": 3.895594257176551e-06, "loss": 0.7996, "step": 5167 }, { "epoch": 0.72, "learning_rate": 3.8920314548412885e-06, "loss": 0.8093, "step": 5168 }, { "epoch": 0.72, "learning_rate": 3.888469888773505e-06, "loss": 0.8254, "step": 5169 }, { "epoch": 0.72, "learning_rate": 3.884909559694077e-06, "loss": 0.8113, "step": 5170 }, { "epoch": 0.72, "learning_rate": 3.881350468323618e-06, "loss": 0.5771, "step": 5171 }, { "epoch": 0.72, "learning_rate": 3.877792615382494e-06, "loss": 0.7821, "step": 5172 }, { "epoch": 0.72, "learning_rate": 3.874236001590832e-06, "loss": 0.7769, "step": 5173 }, { "epoch": 0.72, "learning_rate": 3.87068062766849e-06, "loss": 0.8257, "step": 5174 }, { "epoch": 0.72, "learning_rate": 3.867126494335091e-06, "loss": 0.8008, "step": 5175 }, { "epoch": 0.72, "learning_rate": 3.863573602309997e-06, "loss": 0.8052, "step": 5176 }, { "epoch": 0.72, "learning_rate": 3.860021952312319e-06, "loss": 0.8103, "step": 5177 }, { "epoch": 0.72, "learning_rate": 3.856471545060926e-06, "loss": 0.5273, "step": 5178 }, { "epoch": 0.72, "learning_rate": 3.852922381274423e-06, "loss": 0.8289, "step": 5179 }, { "epoch": 0.72, "learning_rate": 3.849374461671175e-06, "loss": 0.8611, "step": 5180 }, { "epoch": 0.72, "learning_rate": 3.845827786969286e-06, "loss": 0.7305, "step": 5181 }, { "epoch": 0.72, "learning_rate": 3.842282357886609e-06, "loss": 0.8611, "step": 5182 }, { "epoch": 0.72, "learning_rate": 3.838738175140753e-06, "loss": 0.5359, "step": 5183 }, { "epoch": 0.72, "learning_rate": 3.8351952394490625e-06, "loss": 0.8345, "step": 5184 }, { "epoch": 0.72, "learning_rate": 3.831653551528642e-06, "loss": 0.7932, "step": 5185 }, { "epoch": 0.72, "learning_rate": 3.828113112096338e-06, "loss": 0.8811, "step": 5186 }, { "epoch": 0.72, "learning_rate": 3.824573921868737e-06, "loss": 0.8516, "step": 5187 }, { "epoch": 0.72, "learning_rate": 3.821035981562188e-06, "loss": 0.8018, "step": 5188 }, { "epoch": 0.72, "learning_rate": 3.81749929189277e-06, "loss": 0.8296, "step": 5189 }, { "epoch": 0.72, "learning_rate": 3.8139638535763266e-06, "loss": 0.7825, "step": 5190 }, { "epoch": 0.72, "learning_rate": 3.8104296673284346e-06, "loss": 0.8483, "step": 5191 }, { "epoch": 0.72, "learning_rate": 3.806896733864417e-06, "loss": 0.7979, "step": 5192 }, { "epoch": 0.72, "learning_rate": 3.803365053899357e-06, "loss": 0.8491, "step": 5193 }, { "epoch": 0.72, "learning_rate": 3.799834628148068e-06, "loss": 0.8545, "step": 5194 }, { "epoch": 0.72, "learning_rate": 3.796305457325121e-06, "loss": 0.7653, "step": 5195 }, { "epoch": 0.72, "learning_rate": 3.7927775421448286e-06, "loss": 0.803, "step": 5196 }, { "epoch": 0.72, "learning_rate": 3.7892508833212437e-06, "loss": 0.7808, "step": 5197 }, { "epoch": 0.72, "learning_rate": 3.7857254815681787e-06, "loss": 0.8091, "step": 5198 }, { "epoch": 0.72, "learning_rate": 3.782201337599175e-06, "loss": 0.7927, "step": 5199 }, { "epoch": 0.72, "learning_rate": 3.7786784521275353e-06, "loss": 0.7546, "step": 5200 }, { "epoch": 0.72, "learning_rate": 3.7751568258662973e-06, "loss": 0.8271, "step": 5201 }, { "epoch": 0.72, "learning_rate": 3.771636459528243e-06, "loss": 0.8252, "step": 5202 }, { "epoch": 0.72, "learning_rate": 3.7681173538259085e-06, "loss": 0.7615, "step": 5203 }, { "epoch": 0.72, "learning_rate": 3.7645995094715637e-06, "loss": 0.7806, "step": 5204 }, { "epoch": 0.72, "learning_rate": 3.761082927177235e-06, "loss": 0.8125, "step": 5205 }, { "epoch": 0.72, "learning_rate": 3.757567607654685e-06, "loss": 0.8787, "step": 5206 }, { "epoch": 0.72, "learning_rate": 3.7540535516154177e-06, "loss": 0.5649, "step": 5207 }, { "epoch": 0.72, "learning_rate": 3.7505407597706946e-06, "loss": 0.569, "step": 5208 }, { "epoch": 0.72, "learning_rate": 3.747029232831504e-06, "loss": 0.601, "step": 5209 }, { "epoch": 0.72, "learning_rate": 3.7435189715085973e-06, "loss": 0.8938, "step": 5210 }, { "epoch": 0.72, "learning_rate": 3.740009976512454e-06, "loss": 0.7783, "step": 5211 }, { "epoch": 0.72, "learning_rate": 3.736502248553301e-06, "loss": 0.8438, "step": 5212 }, { "epoch": 0.72, "learning_rate": 3.732995788341117e-06, "loss": 0.7947, "step": 5213 }, { "epoch": 0.72, "learning_rate": 3.729490596585612e-06, "loss": 0.8643, "step": 5214 }, { "epoch": 0.72, "learning_rate": 3.7259866739962524e-06, "loss": 0.7976, "step": 5215 }, { "epoch": 0.72, "learning_rate": 3.7224840212822342e-06, "loss": 0.8474, "step": 5216 }, { "epoch": 0.72, "learning_rate": 3.718982639152503e-06, "loss": 0.8425, "step": 5217 }, { "epoch": 0.72, "learning_rate": 3.7154825283157514e-06, "loss": 0.8113, "step": 5218 }, { "epoch": 0.72, "learning_rate": 3.711983689480404e-06, "loss": 0.7759, "step": 5219 }, { "epoch": 0.73, "learning_rate": 3.708486123354642e-06, "loss": 0.8062, "step": 5220 }, { "epoch": 0.73, "learning_rate": 3.704989830646376e-06, "loss": 0.7773, "step": 5221 }, { "epoch": 0.73, "learning_rate": 3.701494812063261e-06, "loss": 0.8032, "step": 5222 }, { "epoch": 0.73, "learning_rate": 3.6980010683127056e-06, "loss": 0.7756, "step": 5223 }, { "epoch": 0.73, "learning_rate": 3.694508600101843e-06, "loss": 0.8198, "step": 5224 }, { "epoch": 0.73, "learning_rate": 3.691017408137565e-06, "loss": 0.8274, "step": 5225 }, { "epoch": 0.73, "learning_rate": 3.6875274931264937e-06, "loss": 0.8252, "step": 5226 }, { "epoch": 0.73, "learning_rate": 3.684038855774994e-06, "loss": 0.8008, "step": 5227 }, { "epoch": 0.73, "learning_rate": 3.6805514967891787e-06, "loss": 0.8406, "step": 5228 }, { "epoch": 0.73, "learning_rate": 3.677065416874893e-06, "loss": 0.8672, "step": 5229 }, { "epoch": 0.73, "learning_rate": 3.673580616737733e-06, "loss": 0.8391, "step": 5230 }, { "epoch": 0.73, "learning_rate": 3.6700970970830297e-06, "loss": 0.8411, "step": 5231 }, { "epoch": 0.73, "learning_rate": 3.66661485861585e-06, "loss": 0.7408, "step": 5232 }, { "epoch": 0.73, "learning_rate": 3.663133902041014e-06, "loss": 0.7759, "step": 5233 }, { "epoch": 0.73, "learning_rate": 3.6596542280630708e-06, "loss": 0.8462, "step": 5234 }, { "epoch": 0.73, "learning_rate": 3.656175837386321e-06, "loss": 0.8059, "step": 5235 }, { "epoch": 0.73, "learning_rate": 3.652698730714794e-06, "loss": 0.5129, "step": 5236 }, { "epoch": 0.73, "learning_rate": 3.6492229087522633e-06, "loss": 0.8359, "step": 5237 }, { "epoch": 0.73, "learning_rate": 3.64574837220225e-06, "loss": 0.7595, "step": 5238 }, { "epoch": 0.73, "learning_rate": 3.642275121768002e-06, "loss": 0.7786, "step": 5239 }, { "epoch": 0.73, "learning_rate": 3.6388031581525185e-06, "loss": 0.781, "step": 5240 }, { "epoch": 0.73, "learning_rate": 3.6353324820585313e-06, "loss": 0.8623, "step": 5241 }, { "epoch": 0.73, "learning_rate": 3.6318630941885102e-06, "loss": 0.783, "step": 5242 }, { "epoch": 0.73, "learning_rate": 3.628394995244674e-06, "loss": 0.7825, "step": 5243 }, { "epoch": 0.73, "learning_rate": 3.6249281859289676e-06, "loss": 0.834, "step": 5244 }, { "epoch": 0.73, "learning_rate": 3.6214626669430885e-06, "loss": 0.8918, "step": 5245 }, { "epoch": 0.73, "learning_rate": 3.6179984389884624e-06, "loss": 0.7966, "step": 5246 }, { "epoch": 0.73, "learning_rate": 3.6145355027662553e-06, "loss": 0.8176, "step": 5247 }, { "epoch": 0.73, "learning_rate": 3.6110738589773776e-06, "loss": 0.8225, "step": 5248 }, { "epoch": 0.73, "learning_rate": 3.6076135083224704e-06, "loss": 0.791, "step": 5249 }, { "epoch": 0.73, "learning_rate": 3.6041544515019223e-06, "loss": 0.8069, "step": 5250 }, { "epoch": 0.73, "learning_rate": 3.600696689215848e-06, "loss": 0.8108, "step": 5251 }, { "epoch": 0.73, "learning_rate": 3.5972402221641144e-06, "loss": 0.7795, "step": 5252 }, { "epoch": 0.73, "learning_rate": 3.593785051046315e-06, "loss": 0.8833, "step": 5253 }, { "epoch": 0.73, "learning_rate": 3.59033117656178e-06, "loss": 0.7817, "step": 5254 }, { "epoch": 0.73, "learning_rate": 3.586878599409591e-06, "loss": 0.7815, "step": 5255 }, { "epoch": 0.73, "learning_rate": 3.5834273202885493e-06, "loss": 0.8022, "step": 5256 }, { "epoch": 0.73, "learning_rate": 3.579977339897209e-06, "loss": 0.8274, "step": 5257 }, { "epoch": 0.73, "learning_rate": 3.5765286589338534e-06, "loss": 0.8525, "step": 5258 }, { "epoch": 0.73, "learning_rate": 3.5730812780964976e-06, "loss": 0.7925, "step": 5259 }, { "epoch": 0.73, "learning_rate": 3.569635198082907e-06, "loss": 0.8252, "step": 5260 }, { "epoch": 0.73, "learning_rate": 3.5661904195905695e-06, "loss": 0.8362, "step": 5261 }, { "epoch": 0.73, "learning_rate": 3.562746943316725e-06, "loss": 0.8525, "step": 5262 }, { "epoch": 0.73, "learning_rate": 3.559304769958337e-06, "loss": 0.6389, "step": 5263 }, { "epoch": 0.73, "learning_rate": 3.5558639002121056e-06, "loss": 0.8066, "step": 5264 }, { "epoch": 0.73, "learning_rate": 3.552424334774479e-06, "loss": 0.8596, "step": 5265 }, { "epoch": 0.73, "learning_rate": 3.548986074341625e-06, "loss": 0.8813, "step": 5266 }, { "epoch": 0.73, "learning_rate": 3.545549119609465e-06, "loss": 0.7886, "step": 5267 }, { "epoch": 0.73, "learning_rate": 3.5421134712736414e-06, "loss": 0.8608, "step": 5268 }, { "epoch": 0.73, "learning_rate": 3.538679130029535e-06, "loss": 0.8191, "step": 5269 }, { "epoch": 0.73, "learning_rate": 3.5352460965722724e-06, "loss": 0.8123, "step": 5270 }, { "epoch": 0.73, "learning_rate": 3.531814371596699e-06, "loss": 0.7996, "step": 5271 }, { "epoch": 0.73, "learning_rate": 3.5283839557974132e-06, "loss": 0.6261, "step": 5272 }, { "epoch": 0.73, "learning_rate": 3.5249548498687336e-06, "loss": 0.8333, "step": 5273 }, { "epoch": 0.73, "learning_rate": 3.5215270545047187e-06, "loss": 0.8743, "step": 5274 }, { "epoch": 0.73, "learning_rate": 3.518100570399167e-06, "loss": 0.7749, "step": 5275 }, { "epoch": 0.73, "learning_rate": 3.5146753982456018e-06, "loss": 0.8467, "step": 5276 }, { "epoch": 0.73, "learning_rate": 3.5112515387372913e-06, "loss": 0.8362, "step": 5277 }, { "epoch": 0.73, "learning_rate": 3.5078289925672315e-06, "loss": 0.8105, "step": 5278 }, { "epoch": 0.73, "learning_rate": 3.5044077604281502e-06, "loss": 0.5779, "step": 5279 }, { "epoch": 0.73, "learning_rate": 3.5009878430125175e-06, "loss": 0.5457, "step": 5280 }, { "epoch": 0.73, "learning_rate": 3.4975692410125296e-06, "loss": 0.7649, "step": 5281 }, { "epoch": 0.73, "learning_rate": 3.4941519551201243e-06, "loss": 0.8489, "step": 5282 }, { "epoch": 0.73, "learning_rate": 3.490735986026965e-06, "loss": 0.8013, "step": 5283 }, { "epoch": 0.73, "learning_rate": 3.4873213344244496e-06, "loss": 0.7991, "step": 5284 }, { "epoch": 0.73, "learning_rate": 3.4839080010037175e-06, "loss": 0.8093, "step": 5285 }, { "epoch": 0.73, "learning_rate": 3.4804959864556296e-06, "loss": 0.8389, "step": 5286 }, { "epoch": 0.73, "learning_rate": 3.477085291470793e-06, "loss": 0.8872, "step": 5287 }, { "epoch": 0.73, "learning_rate": 3.473675916739536e-06, "loss": 0.8623, "step": 5288 }, { "epoch": 0.73, "learning_rate": 3.4702678629519216e-06, "loss": 0.8235, "step": 5289 }, { "epoch": 0.73, "learning_rate": 3.466861130797755e-06, "loss": 0.7905, "step": 5290 }, { "epoch": 0.73, "learning_rate": 3.4634557209665597e-06, "loss": 0.7649, "step": 5291 }, { "epoch": 0.74, "learning_rate": 3.4600516341476055e-06, "loss": 0.8147, "step": 5292 }, { "epoch": 0.74, "learning_rate": 3.456648871029884e-06, "loss": 0.8147, "step": 5293 }, { "epoch": 0.74, "learning_rate": 3.4532474323021205e-06, "loss": 0.5801, "step": 5294 }, { "epoch": 0.74, "learning_rate": 3.4498473186527802e-06, "loss": 0.8103, "step": 5295 }, { "epoch": 0.74, "learning_rate": 3.446448530770048e-06, "loss": 0.5718, "step": 5296 }, { "epoch": 0.74, "learning_rate": 3.4430510693418527e-06, "loss": 0.5566, "step": 5297 }, { "epoch": 0.74, "learning_rate": 3.439654935055846e-06, "loss": 0.8103, "step": 5298 }, { "epoch": 0.74, "learning_rate": 3.4362601285994103e-06, "loss": 0.7529, "step": 5299 }, { "epoch": 0.74, "learning_rate": 3.4328666506596685e-06, "loss": 0.7764, "step": 5300 }, { "epoch": 0.74, "learning_rate": 3.429474501923462e-06, "loss": 0.6271, "step": 5301 }, { "epoch": 0.74, "learning_rate": 3.426083683077378e-06, "loss": 0.8162, "step": 5302 }, { "epoch": 0.74, "learning_rate": 3.422694194807722e-06, "loss": 0.8728, "step": 5303 }, { "epoch": 0.74, "learning_rate": 3.4193060378005306e-06, "loss": 0.8267, "step": 5304 }, { "epoch": 0.74, "learning_rate": 3.415919212741582e-06, "loss": 0.7612, "step": 5305 }, { "epoch": 0.74, "learning_rate": 3.412533720316372e-06, "loss": 0.8022, "step": 5306 }, { "epoch": 0.74, "learning_rate": 3.4091495612101377e-06, "loss": 0.8259, "step": 5307 }, { "epoch": 0.74, "learning_rate": 3.4057667361078397e-06, "loss": 0.811, "step": 5308 }, { "epoch": 0.74, "learning_rate": 3.402385245694163e-06, "loss": 0.8899, "step": 5309 }, { "epoch": 0.74, "learning_rate": 3.3990050906535397e-06, "loss": 0.8484, "step": 5310 }, { "epoch": 0.74, "learning_rate": 3.3956262716701126e-06, "loss": 0.856, "step": 5311 }, { "epoch": 0.74, "learning_rate": 3.39224878942777e-06, "loss": 0.7805, "step": 5312 }, { "epoch": 0.74, "learning_rate": 3.3888726446101193e-06, "loss": 0.557, "step": 5313 }, { "epoch": 0.74, "learning_rate": 3.3854978379004965e-06, "loss": 0.8223, "step": 5314 }, { "epoch": 0.74, "learning_rate": 3.3821243699819784e-06, "loss": 0.7966, "step": 5315 }, { "epoch": 0.74, "learning_rate": 3.3787522415373543e-06, "loss": 0.886, "step": 5316 }, { "epoch": 0.74, "learning_rate": 3.3753814532491593e-06, "loss": 0.7458, "step": 5317 }, { "epoch": 0.74, "learning_rate": 3.3720120057996443e-06, "loss": 0.5706, "step": 5318 }, { "epoch": 0.74, "learning_rate": 3.3686438998707917e-06, "loss": 0.7937, "step": 5319 }, { "epoch": 0.74, "learning_rate": 3.3652771361443203e-06, "loss": 0.8496, "step": 5320 }, { "epoch": 0.74, "learning_rate": 3.3619117153016646e-06, "loss": 0.8147, "step": 5321 }, { "epoch": 0.74, "learning_rate": 3.358547638024e-06, "loss": 0.8289, "step": 5322 }, { "epoch": 0.74, "learning_rate": 3.3551849049922215e-06, "loss": 0.7478, "step": 5323 }, { "epoch": 0.74, "learning_rate": 3.3518235168869506e-06, "loss": 0.7876, "step": 5324 }, { "epoch": 0.74, "learning_rate": 3.3484634743885468e-06, "loss": 0.7915, "step": 5325 }, { "epoch": 0.74, "learning_rate": 3.345104778177083e-06, "loss": 0.8188, "step": 5326 }, { "epoch": 0.74, "learning_rate": 3.341747428932376e-06, "loss": 0.812, "step": 5327 }, { "epoch": 0.74, "learning_rate": 3.3383914273339567e-06, "loss": 0.7656, "step": 5328 }, { "epoch": 0.74, "learning_rate": 3.3350367740610855e-06, "loss": 0.7933, "step": 5329 }, { "epoch": 0.74, "learning_rate": 3.331683469792758e-06, "loss": 0.7693, "step": 5330 }, { "epoch": 0.74, "learning_rate": 3.3283315152076845e-06, "loss": 0.8108, "step": 5331 }, { "epoch": 0.74, "learning_rate": 3.3249809109843157e-06, "loss": 0.5972, "step": 5332 }, { "epoch": 0.74, "learning_rate": 3.321631657800819e-06, "loss": 0.8728, "step": 5333 }, { "epoch": 0.74, "learning_rate": 3.3182837563350867e-06, "loss": 0.8198, "step": 5334 }, { "epoch": 0.74, "learning_rate": 3.31493720726475e-06, "loss": 0.5551, "step": 5335 }, { "epoch": 0.74, "learning_rate": 3.3115920112671505e-06, "loss": 0.8213, "step": 5336 }, { "epoch": 0.74, "learning_rate": 3.3082481690193726e-06, "loss": 0.8369, "step": 5337 }, { "epoch": 0.74, "learning_rate": 3.3049056811982117e-06, "loss": 0.8113, "step": 5338 }, { "epoch": 0.74, "learning_rate": 3.301564548480195e-06, "loss": 0.8267, "step": 5339 }, { "epoch": 0.74, "learning_rate": 3.2982247715415804e-06, "loss": 0.8508, "step": 5340 }, { "epoch": 0.74, "learning_rate": 3.294886351058341e-06, "loss": 0.8052, "step": 5341 }, { "epoch": 0.74, "learning_rate": 3.2915492877061874e-06, "loss": 0.7483, "step": 5342 }, { "epoch": 0.74, "learning_rate": 3.2882135821605467e-06, "loss": 0.8245, "step": 5343 }, { "epoch": 0.74, "learning_rate": 3.284879235096569e-06, "loss": 0.8232, "step": 5344 }, { "epoch": 0.74, "learning_rate": 3.281546247189141e-06, "loss": 0.8682, "step": 5345 }, { "epoch": 0.74, "learning_rate": 3.278214619112863e-06, "loss": 0.8726, "step": 5346 }, { "epoch": 0.74, "learning_rate": 3.274884351542068e-06, "loss": 0.8098, "step": 5347 }, { "epoch": 0.74, "learning_rate": 3.2715554451508093e-06, "loss": 0.7571, "step": 5348 }, { "epoch": 0.74, "learning_rate": 3.2682279006128613e-06, "loss": 0.833, "step": 5349 }, { "epoch": 0.74, "learning_rate": 3.264901718601733e-06, "loss": 0.812, "step": 5350 }, { "epoch": 0.74, "learning_rate": 3.261576899790646e-06, "loss": 0.8401, "step": 5351 }, { "epoch": 0.74, "learning_rate": 3.258253444852557e-06, "loss": 0.7646, "step": 5352 }, { "epoch": 0.74, "learning_rate": 3.25493135446014e-06, "loss": 0.8279, "step": 5353 }, { "epoch": 0.74, "learning_rate": 3.2516106292857883e-06, "loss": 0.5883, "step": 5354 }, { "epoch": 0.74, "learning_rate": 3.2482912700016333e-06, "loss": 0.7891, "step": 5355 }, { "epoch": 0.74, "learning_rate": 3.244973277279513e-06, "loss": 0.7786, "step": 5356 }, { "epoch": 0.74, "learning_rate": 3.2416566517910053e-06, "loss": 0.7693, "step": 5357 }, { "epoch": 0.74, "learning_rate": 3.238341394207398e-06, "loss": 0.804, "step": 5358 }, { "epoch": 0.74, "learning_rate": 3.235027505199706e-06, "loss": 0.8185, "step": 5359 }, { "epoch": 0.74, "learning_rate": 3.2317149854386732e-06, "loss": 0.7896, "step": 5360 }, { "epoch": 0.74, "learning_rate": 3.2284038355947555e-06, "loss": 0.7469, "step": 5361 }, { "epoch": 0.74, "learning_rate": 3.225094056338145e-06, "loss": 0.8176, "step": 5362 }, { "epoch": 0.74, "learning_rate": 3.2217856483387457e-06, "loss": 0.7983, "step": 5363 }, { "epoch": 0.75, "learning_rate": 3.2184786122661815e-06, "loss": 0.8721, "step": 5364 }, { "epoch": 0.75, "learning_rate": 3.215172948789814e-06, "loss": 0.7693, "step": 5365 }, { "epoch": 0.75, "learning_rate": 3.2118686585787096e-06, "loss": 0.8125, "step": 5366 }, { "epoch": 0.75, "learning_rate": 3.2085657423016705e-06, "loss": 0.8167, "step": 5367 }, { "epoch": 0.75, "learning_rate": 3.2052642006272095e-06, "loss": 0.7698, "step": 5368 }, { "epoch": 0.75, "learning_rate": 3.2019640342235724e-06, "loss": 0.7147, "step": 5369 }, { "epoch": 0.75, "learning_rate": 3.1986652437587173e-06, "loss": 0.8638, "step": 5370 }, { "epoch": 0.75, "learning_rate": 3.1953678299003253e-06, "loss": 0.7706, "step": 5371 }, { "epoch": 0.75, "learning_rate": 3.1920717933158065e-06, "loss": 0.7764, "step": 5372 }, { "epoch": 0.75, "learning_rate": 3.1887771346722796e-06, "loss": 0.8237, "step": 5373 }, { "epoch": 0.75, "learning_rate": 3.1854838546365985e-06, "loss": 0.8652, "step": 5374 }, { "epoch": 0.75, "learning_rate": 3.182191953875328e-06, "loss": 0.8696, "step": 5375 }, { "epoch": 0.75, "learning_rate": 3.178901433054753e-06, "loss": 0.8477, "step": 5376 }, { "epoch": 0.75, "learning_rate": 3.1756122928408893e-06, "loss": 0.8074, "step": 5377 }, { "epoch": 0.75, "learning_rate": 3.1723245338994614e-06, "loss": 0.7827, "step": 5378 }, { "epoch": 0.75, "learning_rate": 3.1690381568959237e-06, "loss": 0.8091, "step": 5379 }, { "epoch": 0.75, "learning_rate": 3.1657531624954465e-06, "loss": 0.844, "step": 5380 }, { "epoch": 0.75, "learning_rate": 3.1624695513629146e-06, "loss": 0.7476, "step": 5381 }, { "epoch": 0.75, "learning_rate": 3.1591873241629466e-06, "loss": 0.8174, "step": 5382 }, { "epoch": 0.75, "learning_rate": 3.155906481559866e-06, "loss": 0.8115, "step": 5383 }, { "epoch": 0.75, "learning_rate": 3.1526270242177314e-06, "loss": 0.7771, "step": 5384 }, { "epoch": 0.75, "learning_rate": 3.1493489528003074e-06, "loss": 0.8494, "step": 5385 }, { "epoch": 0.75, "learning_rate": 3.146072267971082e-06, "loss": 0.7733, "step": 5386 }, { "epoch": 0.75, "learning_rate": 3.1427969703932694e-06, "loss": 0.5743, "step": 5387 }, { "epoch": 0.75, "learning_rate": 3.1395230607297913e-06, "loss": 0.5869, "step": 5388 }, { "epoch": 0.75, "learning_rate": 3.136250539643302e-06, "loss": 0.804, "step": 5389 }, { "epoch": 0.75, "learning_rate": 3.132979407796164e-06, "loss": 0.809, "step": 5390 }, { "epoch": 0.75, "learning_rate": 3.129709665850459e-06, "loss": 0.8491, "step": 5391 }, { "epoch": 0.75, "learning_rate": 3.126441314467997e-06, "loss": 0.8088, "step": 5392 }, { "epoch": 0.75, "learning_rate": 3.1231743543102944e-06, "loss": 0.8625, "step": 5393 }, { "epoch": 0.75, "learning_rate": 3.1199087860385966e-06, "loss": 0.8425, "step": 5394 }, { "epoch": 0.75, "learning_rate": 3.11664461031386e-06, "loss": 0.8062, "step": 5395 }, { "epoch": 0.75, "learning_rate": 3.11338182779676e-06, "loss": 0.5139, "step": 5396 }, { "epoch": 0.75, "learning_rate": 3.1101204391476957e-06, "loss": 0.8015, "step": 5397 }, { "epoch": 0.75, "learning_rate": 3.1068604450267745e-06, "loss": 0.8542, "step": 5398 }, { "epoch": 0.75, "learning_rate": 3.1036018460938343e-06, "loss": 0.7986, "step": 5399 }, { "epoch": 0.75, "learning_rate": 3.1003446430084195e-06, "loss": 0.8494, "step": 5400 }, { "epoch": 0.75, "learning_rate": 3.0970888364297914e-06, "loss": 0.8171, "step": 5401 }, { "epoch": 0.75, "learning_rate": 3.0938344270169406e-06, "loss": 0.6033, "step": 5402 }, { "epoch": 0.75, "learning_rate": 3.0905814154285607e-06, "loss": 0.7998, "step": 5403 }, { "epoch": 0.75, "learning_rate": 3.0873298023230757e-06, "loss": 0.7915, "step": 5404 }, { "epoch": 0.75, "learning_rate": 3.084079588358617e-06, "loss": 0.8196, "step": 5405 }, { "epoch": 0.75, "learning_rate": 3.0808307741930323e-06, "loss": 0.8577, "step": 5406 }, { "epoch": 0.75, "learning_rate": 3.0775833604838944e-06, "loss": 0.8433, "step": 5407 }, { "epoch": 0.75, "learning_rate": 3.074337347888483e-06, "loss": 0.8069, "step": 5408 }, { "epoch": 0.75, "learning_rate": 3.0710927370638044e-06, "loss": 0.8772, "step": 5409 }, { "epoch": 0.75, "learning_rate": 3.067849528666573e-06, "loss": 0.7749, "step": 5410 }, { "epoch": 0.75, "learning_rate": 3.064607723353219e-06, "loss": 0.7957, "step": 5411 }, { "epoch": 0.75, "learning_rate": 3.0613673217798967e-06, "loss": 0.8135, "step": 5412 }, { "epoch": 0.75, "learning_rate": 3.058128324602465e-06, "loss": 0.8169, "step": 5413 }, { "epoch": 0.75, "learning_rate": 3.054890732476512e-06, "loss": 0.8369, "step": 5414 }, { "epoch": 0.75, "learning_rate": 3.0516545460573297e-06, "loss": 0.743, "step": 5415 }, { "epoch": 0.75, "learning_rate": 3.0484197659999282e-06, "loss": 0.5999, "step": 5416 }, { "epoch": 0.75, "learning_rate": 3.045186392959041e-06, "loss": 0.8164, "step": 5417 }, { "epoch": 0.75, "learning_rate": 3.0419544275891023e-06, "loss": 0.8792, "step": 5418 }, { "epoch": 0.75, "learning_rate": 3.0387238705442777e-06, "loss": 0.7791, "step": 5419 }, { "epoch": 0.75, "learning_rate": 3.035494722478437e-06, "loss": 0.7876, "step": 5420 }, { "epoch": 0.75, "learning_rate": 3.0322669840451624e-06, "loss": 0.5671, "step": 5421 }, { "epoch": 0.75, "learning_rate": 3.0290406558977638e-06, "loss": 0.5857, "step": 5422 }, { "epoch": 0.75, "learning_rate": 3.0258157386892506e-06, "loss": 0.7531, "step": 5423 }, { "epoch": 0.75, "learning_rate": 3.0225922330723614e-06, "loss": 0.7996, "step": 5424 }, { "epoch": 0.75, "learning_rate": 3.0193701396995358e-06, "loss": 0.8989, "step": 5425 }, { "epoch": 0.75, "learning_rate": 3.0161494592229325e-06, "loss": 0.8616, "step": 5426 }, { "epoch": 0.75, "learning_rate": 3.012930192294431e-06, "loss": 0.782, "step": 5427 }, { "epoch": 0.75, "learning_rate": 3.00971233956561e-06, "loss": 0.832, "step": 5428 }, { "epoch": 0.75, "learning_rate": 3.0064959016877804e-06, "loss": 0.3448, "step": 5429 }, { "epoch": 0.75, "learning_rate": 3.0032808793119515e-06, "loss": 0.801, "step": 5430 }, { "epoch": 0.75, "learning_rate": 3.000067273088848e-06, "loss": 0.812, "step": 5431 }, { "epoch": 0.75, "learning_rate": 2.9968550836689204e-06, "loss": 0.8201, "step": 5432 }, { "epoch": 0.75, "learning_rate": 2.993644311702314e-06, "loss": 0.8223, "step": 5433 }, { "epoch": 0.75, "learning_rate": 2.990434957838906e-06, "loss": 0.8225, "step": 5434 }, { "epoch": 0.75, "learning_rate": 2.9872270227282717e-06, "loss": 0.8164, "step": 5435 }, { "epoch": 0.76, "learning_rate": 2.9840205070197025e-06, "loss": 0.8044, "step": 5436 }, { "epoch": 0.76, "learning_rate": 2.9808154113622125e-06, "loss": 0.8037, "step": 5437 }, { "epoch": 0.76, "learning_rate": 2.977611736404512e-06, "loss": 0.8154, "step": 5438 }, { "epoch": 0.76, "learning_rate": 2.9744094827950422e-06, "loss": 0.8127, "step": 5439 }, { "epoch": 0.76, "learning_rate": 2.9712086511819403e-06, "loss": 0.8433, "step": 5440 }, { "epoch": 0.76, "learning_rate": 2.96800924221306e-06, "loss": 0.7529, "step": 5441 }, { "epoch": 0.76, "learning_rate": 2.9648112565359776e-06, "loss": 0.8169, "step": 5442 }, { "epoch": 0.76, "learning_rate": 2.961614694797965e-06, "loss": 0.7825, "step": 5443 }, { "epoch": 0.76, "learning_rate": 2.9584195576460206e-06, "loss": 0.6136, "step": 5444 }, { "epoch": 0.76, "learning_rate": 2.9552258457268446e-06, "loss": 0.7456, "step": 5445 }, { "epoch": 0.76, "learning_rate": 2.95203355968685e-06, "loss": 0.8157, "step": 5446 }, { "epoch": 0.76, "learning_rate": 2.9488427001721674e-06, "loss": 0.7227, "step": 5447 }, { "epoch": 0.76, "learning_rate": 2.9456532678286286e-06, "loss": 0.5508, "step": 5448 }, { "epoch": 0.76, "learning_rate": 2.9424652633017903e-06, "loss": 0.8145, "step": 5449 }, { "epoch": 0.76, "learning_rate": 2.9392786872369073e-06, "loss": 0.8118, "step": 5450 }, { "epoch": 0.76, "learning_rate": 2.9360935402789483e-06, "loss": 0.7668, "step": 5451 }, { "epoch": 0.76, "learning_rate": 2.9329098230726005e-06, "loss": 0.8257, "step": 5452 }, { "epoch": 0.76, "learning_rate": 2.929727536262249e-06, "loss": 0.7841, "step": 5453 }, { "epoch": 0.76, "learning_rate": 2.9265466804920027e-06, "loss": 0.8687, "step": 5454 }, { "epoch": 0.76, "learning_rate": 2.9233672564056725e-06, "loss": 0.5871, "step": 5455 }, { "epoch": 0.76, "learning_rate": 2.920189264646778e-06, "loss": 0.8112, "step": 5456 }, { "epoch": 0.76, "learning_rate": 2.9170127058585573e-06, "loss": 0.7961, "step": 5457 }, { "epoch": 0.76, "learning_rate": 2.9138375806839494e-06, "loss": 0.7822, "step": 5458 }, { "epoch": 0.76, "learning_rate": 2.9106638897656103e-06, "loss": 0.8291, "step": 5459 }, { "epoch": 0.76, "learning_rate": 2.9074916337459024e-06, "loss": 0.7583, "step": 5460 }, { "epoch": 0.76, "learning_rate": 2.9043208132668945e-06, "loss": 0.8556, "step": 5461 }, { "epoch": 0.76, "learning_rate": 2.9011514289703722e-06, "loss": 0.7188, "step": 5462 }, { "epoch": 0.76, "learning_rate": 2.8979834814978234e-06, "loss": 0.8026, "step": 5463 }, { "epoch": 0.76, "learning_rate": 2.894816971490453e-06, "loss": 0.8127, "step": 5464 }, { "epoch": 0.76, "learning_rate": 2.8916518995891664e-06, "loss": 0.8357, "step": 5465 }, { "epoch": 0.76, "learning_rate": 2.888488266434579e-06, "loss": 0.8196, "step": 5466 }, { "epoch": 0.76, "learning_rate": 2.8853260726670264e-06, "loss": 0.8401, "step": 5467 }, { "epoch": 0.76, "learning_rate": 2.882165318926534e-06, "loss": 0.8059, "step": 5468 }, { "epoch": 0.76, "learning_rate": 2.8790060058528546e-06, "loss": 0.8425, "step": 5469 }, { "epoch": 0.76, "learning_rate": 2.875848134085436e-06, "loss": 0.812, "step": 5470 }, { "epoch": 0.76, "learning_rate": 2.8726917042634383e-06, "loss": 0.8103, "step": 5471 }, { "epoch": 0.76, "learning_rate": 2.869536717025735e-06, "loss": 0.8945, "step": 5472 }, { "epoch": 0.76, "learning_rate": 2.866383173010897e-06, "loss": 0.7673, "step": 5473 }, { "epoch": 0.76, "learning_rate": 2.8632310728572164e-06, "loss": 0.8054, "step": 5474 }, { "epoch": 0.76, "learning_rate": 2.860080417202682e-06, "loss": 0.813, "step": 5475 }, { "epoch": 0.76, "learning_rate": 2.8569312066849896e-06, "loss": 0.803, "step": 5476 }, { "epoch": 0.76, "learning_rate": 2.8537834419415555e-06, "loss": 0.8157, "step": 5477 }, { "epoch": 0.76, "learning_rate": 2.8506371236094876e-06, "loss": 0.8291, "step": 5478 }, { "epoch": 0.76, "learning_rate": 2.8474922523256144e-06, "loss": 0.8257, "step": 5479 }, { "epoch": 0.76, "learning_rate": 2.844348828726462e-06, "loss": 0.8105, "step": 5480 }, { "epoch": 0.76, "learning_rate": 2.841206853448264e-06, "loss": 0.8503, "step": 5481 }, { "epoch": 0.76, "learning_rate": 2.8380663271269706e-06, "loss": 0.7725, "step": 5482 }, { "epoch": 0.76, "learning_rate": 2.834927250398225e-06, "loss": 0.8623, "step": 5483 }, { "epoch": 0.76, "learning_rate": 2.8317896238973898e-06, "loss": 0.8066, "step": 5484 }, { "epoch": 0.76, "learning_rate": 2.828653448259523e-06, "loss": 0.8647, "step": 5485 }, { "epoch": 0.76, "learning_rate": 2.8255187241193995e-06, "loss": 0.7551, "step": 5486 }, { "epoch": 0.76, "learning_rate": 2.822385452111491e-06, "loss": 0.8787, "step": 5487 }, { "epoch": 0.76, "learning_rate": 2.8192536328699784e-06, "loss": 0.8259, "step": 5488 }, { "epoch": 0.76, "learning_rate": 2.816123267028753e-06, "loss": 0.8901, "step": 5489 }, { "epoch": 0.76, "learning_rate": 2.8129943552214046e-06, "loss": 0.7386, "step": 5490 }, { "epoch": 0.76, "learning_rate": 2.809866898081238e-06, "loss": 0.7773, "step": 5491 }, { "epoch": 0.76, "learning_rate": 2.8067408962412535e-06, "loss": 0.8228, "step": 5492 }, { "epoch": 0.76, "learning_rate": 2.8036163503341595e-06, "loss": 0.8207, "step": 5493 }, { "epoch": 0.76, "learning_rate": 2.8004932609923773e-06, "loss": 0.5684, "step": 5494 }, { "epoch": 0.76, "learning_rate": 2.7973716288480224e-06, "loss": 0.8596, "step": 5495 }, { "epoch": 0.76, "learning_rate": 2.794251454532926e-06, "loss": 0.7719, "step": 5496 }, { "epoch": 0.76, "learning_rate": 2.791132738678616e-06, "loss": 0.802, "step": 5497 }, { "epoch": 0.76, "learning_rate": 2.788015481916324e-06, "loss": 0.8357, "step": 5498 }, { "epoch": 0.76, "learning_rate": 2.7848996848769984e-06, "loss": 0.7939, "step": 5499 }, { "epoch": 0.76, "learning_rate": 2.781785348191276e-06, "loss": 0.8252, "step": 5500 }, { "epoch": 0.76, "learning_rate": 2.7786724724895133e-06, "loss": 0.8062, "step": 5501 }, { "epoch": 0.76, "learning_rate": 2.775561058401759e-06, "loss": 0.8086, "step": 5502 }, { "epoch": 0.76, "learning_rate": 2.7724511065577695e-06, "loss": 0.8059, "step": 5503 }, { "epoch": 0.76, "learning_rate": 2.769342617587013e-06, "loss": 0.8425, "step": 5504 }, { "epoch": 0.76, "learning_rate": 2.766235592118648e-06, "loss": 0.8872, "step": 5505 }, { "epoch": 0.76, "learning_rate": 2.763130030781549e-06, "loss": 0.7461, "step": 5506 }, { "epoch": 0.76, "learning_rate": 2.760025934204288e-06, "loss": 0.8596, "step": 5507 }, { "epoch": 0.77, "learning_rate": 2.7569233030151375e-06, "loss": 0.7874, "step": 5508 }, { "epoch": 0.77, "learning_rate": 2.7538221378420837e-06, "loss": 0.8, "step": 5509 }, { "epoch": 0.77, "learning_rate": 2.750722439312804e-06, "loss": 0.8337, "step": 5510 }, { "epoch": 0.77, "learning_rate": 2.74762420805469e-06, "loss": 0.7872, "step": 5511 }, { "epoch": 0.77, "learning_rate": 2.74452744469483e-06, "loss": 0.8391, "step": 5512 }, { "epoch": 0.77, "learning_rate": 2.7414321498600105e-06, "loss": 0.7483, "step": 5513 }, { "epoch": 0.77, "learning_rate": 2.7383383241767358e-06, "loss": 0.8101, "step": 5514 }, { "epoch": 0.77, "learning_rate": 2.7352459682711954e-06, "loss": 0.8364, "step": 5515 }, { "epoch": 0.77, "learning_rate": 2.7321550827692967e-06, "loss": 0.8755, "step": 5516 }, { "epoch": 0.77, "learning_rate": 2.729065668296639e-06, "loss": 0.7759, "step": 5517 }, { "epoch": 0.77, "learning_rate": 2.7259777254785234e-06, "loss": 0.5756, "step": 5518 }, { "epoch": 0.77, "learning_rate": 2.7228912549399635e-06, "loss": 0.8088, "step": 5519 }, { "epoch": 0.77, "learning_rate": 2.7198062573056628e-06, "loss": 0.7214, "step": 5520 }, { "epoch": 0.77, "learning_rate": 2.716722733200038e-06, "loss": 0.5837, "step": 5521 }, { "epoch": 0.77, "learning_rate": 2.7136406832471986e-06, "loss": 0.8472, "step": 5522 }, { "epoch": 0.77, "learning_rate": 2.7105601080709564e-06, "loss": 0.8494, "step": 5523 }, { "epoch": 0.77, "learning_rate": 2.7074810082948323e-06, "loss": 0.8094, "step": 5524 }, { "epoch": 0.77, "learning_rate": 2.7044033845420383e-06, "loss": 0.8416, "step": 5525 }, { "epoch": 0.77, "learning_rate": 2.701327237435498e-06, "loss": 0.8335, "step": 5526 }, { "epoch": 0.77, "learning_rate": 2.698252567597828e-06, "loss": 0.8074, "step": 5527 }, { "epoch": 0.77, "learning_rate": 2.6951793756513466e-06, "loss": 0.8123, "step": 5528 }, { "epoch": 0.77, "learning_rate": 2.692107662218082e-06, "loss": 0.8806, "step": 5529 }, { "epoch": 0.77, "learning_rate": 2.6890374279197507e-06, "loss": 0.7704, "step": 5530 }, { "epoch": 0.77, "learning_rate": 2.6859686733777745e-06, "loss": 0.8191, "step": 5531 }, { "epoch": 0.77, "learning_rate": 2.6829013992132823e-06, "loss": 0.8318, "step": 5532 }, { "epoch": 0.77, "learning_rate": 2.679835606047092e-06, "loss": 0.8435, "step": 5533 }, { "epoch": 0.77, "learning_rate": 2.6767712944997327e-06, "loss": 0.8103, "step": 5534 }, { "epoch": 0.77, "learning_rate": 2.673708465191427e-06, "loss": 0.7983, "step": 5535 }, { "epoch": 0.77, "learning_rate": 2.6706471187420935e-06, "loss": 0.7671, "step": 5536 }, { "epoch": 0.77, "learning_rate": 2.6675872557713634e-06, "loss": 0.7542, "step": 5537 }, { "epoch": 0.77, "learning_rate": 2.6645288768985544e-06, "loss": 0.7308, "step": 5538 }, { "epoch": 0.77, "learning_rate": 2.661471982742695e-06, "loss": 0.7878, "step": 5539 }, { "epoch": 0.77, "learning_rate": 2.6584165739225067e-06, "loss": 0.8342, "step": 5540 }, { "epoch": 0.77, "learning_rate": 2.6553626510564066e-06, "loss": 0.8201, "step": 5541 }, { "epoch": 0.77, "learning_rate": 2.6523102147625223e-06, "loss": 0.8394, "step": 5542 }, { "epoch": 0.77, "learning_rate": 2.649259265658669e-06, "loss": 0.8164, "step": 5543 }, { "epoch": 0.77, "learning_rate": 2.646209804362372e-06, "loss": 0.783, "step": 5544 }, { "epoch": 0.77, "learning_rate": 2.643161831490847e-06, "loss": 0.761, "step": 5545 }, { "epoch": 0.77, "learning_rate": 2.6401153476610065e-06, "loss": 0.8545, "step": 5546 }, { "epoch": 0.77, "learning_rate": 2.6370703534894724e-06, "loss": 0.8191, "step": 5547 }, { "epoch": 0.77, "learning_rate": 2.6340268495925546e-06, "loss": 0.7313, "step": 5548 }, { "epoch": 0.77, "learning_rate": 2.63098483658627e-06, "loss": 0.8271, "step": 5549 }, { "epoch": 0.77, "learning_rate": 2.627944315086326e-06, "loss": 0.8301, "step": 5550 }, { "epoch": 0.77, "learning_rate": 2.62490528570813e-06, "loss": 0.6254, "step": 5551 }, { "epoch": 0.77, "learning_rate": 2.621867749066794e-06, "loss": 0.8206, "step": 5552 }, { "epoch": 0.77, "learning_rate": 2.6188317057771196e-06, "loss": 0.8145, "step": 5553 }, { "epoch": 0.77, "learning_rate": 2.6157971564536068e-06, "loss": 0.8131, "step": 5554 }, { "epoch": 0.77, "learning_rate": 2.612764101710461e-06, "loss": 0.7969, "step": 5555 }, { "epoch": 0.77, "learning_rate": 2.609732542161574e-06, "loss": 0.5528, "step": 5556 }, { "epoch": 0.77, "learning_rate": 2.606702478420546e-06, "loss": 0.5135, "step": 5557 }, { "epoch": 0.77, "learning_rate": 2.603673911100667e-06, "loss": 0.8167, "step": 5558 }, { "epoch": 0.77, "learning_rate": 2.6006468408149234e-06, "loss": 0.7725, "step": 5559 }, { "epoch": 0.77, "learning_rate": 2.5976212681760083e-06, "loss": 0.8833, "step": 5560 }, { "epoch": 0.77, "learning_rate": 2.5945971937962965e-06, "loss": 0.802, "step": 5561 }, { "epoch": 0.77, "learning_rate": 2.5915746182878755e-06, "loss": 0.76, "step": 5562 }, { "epoch": 0.77, "learning_rate": 2.5885535422625187e-06, "loss": 0.8071, "step": 5563 }, { "epoch": 0.77, "learning_rate": 2.585533966331696e-06, "loss": 0.8079, "step": 5564 }, { "epoch": 0.77, "learning_rate": 2.5825158911065817e-06, "loss": 0.8208, "step": 5565 }, { "epoch": 0.77, "learning_rate": 2.5794993171980376e-06, "loss": 0.7957, "step": 5566 }, { "epoch": 0.77, "learning_rate": 2.5764842452166305e-06, "loss": 0.6075, "step": 5567 }, { "epoch": 0.77, "learning_rate": 2.573470675772615e-06, "loss": 0.8381, "step": 5568 }, { "epoch": 0.77, "learning_rate": 2.570458609475942e-06, "loss": 0.7949, "step": 5569 }, { "epoch": 0.77, "learning_rate": 2.567448046936266e-06, "loss": 0.5059, "step": 5570 }, { "epoch": 0.77, "learning_rate": 2.5644389887629284e-06, "loss": 0.7898, "step": 5571 }, { "epoch": 0.77, "learning_rate": 2.561431435564974e-06, "loss": 0.8179, "step": 5572 }, { "epoch": 0.77, "learning_rate": 2.5584253879511356e-06, "loss": 0.7365, "step": 5573 }, { "epoch": 0.77, "learning_rate": 2.5554208465298413e-06, "loss": 0.78, "step": 5574 }, { "epoch": 0.77, "learning_rate": 2.5524178119092257e-06, "loss": 0.7948, "step": 5575 }, { "epoch": 0.77, "learning_rate": 2.549416284697105e-06, "loss": 0.7646, "step": 5576 }, { "epoch": 0.77, "learning_rate": 2.546416265500993e-06, "loss": 0.8323, "step": 5577 }, { "epoch": 0.77, "learning_rate": 2.543417754928107e-06, "loss": 0.8079, "step": 5578 }, { "epoch": 0.77, "learning_rate": 2.5404207535853464e-06, "loss": 0.8242, "step": 5579 }, { "epoch": 0.78, "learning_rate": 2.5374252620793183e-06, "loss": 0.5229, "step": 5580 }, { "epoch": 0.78, "learning_rate": 2.534431281016313e-06, "loss": 0.5486, "step": 5581 }, { "epoch": 0.78, "learning_rate": 2.5314388110023182e-06, "loss": 0.8389, "step": 5582 }, { "epoch": 0.78, "learning_rate": 2.528447852643021e-06, "loss": 0.8042, "step": 5583 }, { "epoch": 0.78, "learning_rate": 2.5254584065437938e-06, "loss": 0.7881, "step": 5584 }, { "epoch": 0.78, "learning_rate": 2.5224704733097137e-06, "loss": 0.564, "step": 5585 }, { "epoch": 0.78, "learning_rate": 2.5194840535455424e-06, "loss": 0.5406, "step": 5586 }, { "epoch": 0.78, "learning_rate": 2.5164991478557353e-06, "loss": 0.8665, "step": 5587 }, { "epoch": 0.78, "learning_rate": 2.5135157568444513e-06, "loss": 0.8401, "step": 5588 }, { "epoch": 0.78, "learning_rate": 2.5105338811155276e-06, "loss": 0.6193, "step": 5589 }, { "epoch": 0.78, "learning_rate": 2.507553521272511e-06, "loss": 0.7903, "step": 5590 }, { "epoch": 0.78, "learning_rate": 2.504574677918631e-06, "loss": 0.734, "step": 5591 }, { "epoch": 0.78, "learning_rate": 2.501597351656807e-06, "loss": 0.8162, "step": 5592 }, { "epoch": 0.78, "learning_rate": 2.4986215430896652e-06, "loss": 0.8235, "step": 5593 }, { "epoch": 0.78, "learning_rate": 2.495647252819511e-06, "loss": 0.8608, "step": 5594 }, { "epoch": 0.78, "learning_rate": 2.492674481448352e-06, "loss": 0.8271, "step": 5595 }, { "epoch": 0.78, "learning_rate": 2.4897032295778813e-06, "loss": 0.8228, "step": 5596 }, { "epoch": 0.78, "learning_rate": 2.486733497809485e-06, "loss": 0.7949, "step": 5597 }, { "epoch": 0.78, "learning_rate": 2.4837652867442496e-06, "loss": 0.8352, "step": 5598 }, { "epoch": 0.78, "learning_rate": 2.480798596982944e-06, "loss": 0.825, "step": 5599 }, { "epoch": 0.78, "learning_rate": 2.4778334291260362e-06, "loss": 0.8735, "step": 5600 }, { "epoch": 0.78, "learning_rate": 2.4748697837736824e-06, "loss": 0.8132, "step": 5601 }, { "epoch": 0.78, "learning_rate": 2.4719076615257285e-06, "loss": 0.5582, "step": 5602 }, { "epoch": 0.78, "learning_rate": 2.46894706298172e-06, "loss": 0.8198, "step": 5603 }, { "epoch": 0.78, "learning_rate": 2.4659879887408877e-06, "loss": 0.9084, "step": 5604 }, { "epoch": 0.78, "learning_rate": 2.463030439402151e-06, "loss": 0.8066, "step": 5605 }, { "epoch": 0.78, "learning_rate": 2.460074415564131e-06, "loss": 0.8298, "step": 5606 }, { "epoch": 0.78, "learning_rate": 2.4571199178251294e-06, "loss": 0.8247, "step": 5607 }, { "epoch": 0.78, "learning_rate": 2.4541669467831475e-06, "loss": 0.8435, "step": 5608 }, { "epoch": 0.78, "learning_rate": 2.451215503035873e-06, "loss": 0.7791, "step": 5609 }, { "epoch": 0.78, "learning_rate": 2.4482655871806803e-06, "loss": 0.7549, "step": 5610 }, { "epoch": 0.78, "learning_rate": 2.445317199814646e-06, "loss": 0.77, "step": 5611 }, { "epoch": 0.78, "learning_rate": 2.4423703415345256e-06, "loss": 0.8105, "step": 5612 }, { "epoch": 0.78, "learning_rate": 2.4394250129367756e-06, "loss": 0.7969, "step": 5613 }, { "epoch": 0.78, "learning_rate": 2.436481214617534e-06, "loss": 0.8706, "step": 5614 }, { "epoch": 0.78, "learning_rate": 2.4335389471726313e-06, "loss": 0.8765, "step": 5615 }, { "epoch": 0.78, "learning_rate": 2.4305982111975946e-06, "loss": 0.7983, "step": 5616 }, { "epoch": 0.78, "learning_rate": 2.4276590072876284e-06, "loss": 0.7634, "step": 5617 }, { "epoch": 0.78, "learning_rate": 2.424721336037643e-06, "loss": 0.7703, "step": 5618 }, { "epoch": 0.78, "learning_rate": 2.4217851980422256e-06, "loss": 0.7983, "step": 5619 }, { "epoch": 0.78, "learning_rate": 2.4188505938956553e-06, "loss": 0.7866, "step": 5620 }, { "epoch": 0.78, "learning_rate": 2.4159175241919098e-06, "loss": 0.5281, "step": 5621 }, { "epoch": 0.78, "learning_rate": 2.412985989524641e-06, "loss": 0.8174, "step": 5622 }, { "epoch": 0.78, "learning_rate": 2.410055990487207e-06, "loss": 0.8403, "step": 5623 }, { "epoch": 0.78, "learning_rate": 2.4071275276726414e-06, "loss": 0.8357, "step": 5624 }, { "epoch": 0.78, "learning_rate": 2.404200601673671e-06, "loss": 0.7864, "step": 5625 }, { "epoch": 0.78, "learning_rate": 2.401275213082718e-06, "loss": 0.8022, "step": 5626 }, { "epoch": 0.78, "learning_rate": 2.398351362491882e-06, "loss": 0.8264, "step": 5627 }, { "epoch": 0.78, "learning_rate": 2.3954290504929635e-06, "loss": 0.5512, "step": 5628 }, { "epoch": 0.78, "learning_rate": 2.3925082776774424e-06, "loss": 0.7692, "step": 5629 }, { "epoch": 0.78, "learning_rate": 2.389589044636487e-06, "loss": 0.8064, "step": 5630 }, { "epoch": 0.78, "learning_rate": 2.386671351960963e-06, "loss": 0.7605, "step": 5631 }, { "epoch": 0.78, "learning_rate": 2.383755200241412e-06, "loss": 0.7893, "step": 5632 }, { "epoch": 0.78, "learning_rate": 2.3808405900680775e-06, "loss": 0.8135, "step": 5633 }, { "epoch": 0.78, "learning_rate": 2.3779275220308797e-06, "loss": 0.7627, "step": 5634 }, { "epoch": 0.78, "learning_rate": 2.3750159967194276e-06, "loss": 0.7795, "step": 5635 }, { "epoch": 0.78, "learning_rate": 2.3721060147230266e-06, "loss": 0.746, "step": 5636 }, { "epoch": 0.78, "learning_rate": 2.3691975766306586e-06, "loss": 0.8109, "step": 5637 }, { "epoch": 0.78, "learning_rate": 2.366290683031004e-06, "loss": 0.8234, "step": 5638 }, { "epoch": 0.78, "learning_rate": 2.3633853345124215e-06, "loss": 0.8047, "step": 5639 }, { "epoch": 0.78, "learning_rate": 2.3604815316629593e-06, "loss": 0.75, "step": 5640 }, { "epoch": 0.78, "learning_rate": 2.3575792750703584e-06, "loss": 0.5394, "step": 5641 }, { "epoch": 0.78, "learning_rate": 2.3546785653220383e-06, "loss": 0.8452, "step": 5642 }, { "epoch": 0.78, "learning_rate": 2.351779403005113e-06, "loss": 0.8193, "step": 5643 }, { "epoch": 0.78, "learning_rate": 2.34888178870638e-06, "loss": 0.8091, "step": 5644 }, { "epoch": 0.78, "learning_rate": 2.345985723012317e-06, "loss": 0.7991, "step": 5645 }, { "epoch": 0.78, "learning_rate": 2.3430912065091038e-06, "loss": 0.8174, "step": 5646 }, { "epoch": 0.78, "learning_rate": 2.3401982397825895e-06, "loss": 0.5854, "step": 5647 }, { "epoch": 0.78, "learning_rate": 2.3373068234183237e-06, "loss": 0.8279, "step": 5648 }, { "epoch": 0.78, "learning_rate": 2.334416958001534e-06, "loss": 0.7822, "step": 5649 }, { "epoch": 0.78, "learning_rate": 2.3315286441171326e-06, "loss": 0.7827, "step": 5650 }, { "epoch": 0.78, "learning_rate": 2.328641882349727e-06, "loss": 0.8274, "step": 5651 }, { "epoch": 0.79, "learning_rate": 2.3257566732835977e-06, "loss": 0.3521, "step": 5652 }, { "epoch": 0.79, "learning_rate": 2.322873017502726e-06, "loss": 0.7075, "step": 5653 }, { "epoch": 0.79, "learning_rate": 2.3199909155907674e-06, "loss": 0.8191, "step": 5654 }, { "epoch": 0.79, "learning_rate": 2.3171103681310616e-06, "loss": 0.7786, "step": 5655 }, { "epoch": 0.79, "learning_rate": 2.3142313757066447e-06, "loss": 0.8196, "step": 5656 }, { "epoch": 0.79, "learning_rate": 2.311353938900227e-06, "loss": 0.7856, "step": 5657 }, { "epoch": 0.79, "learning_rate": 2.3084780582942146e-06, "loss": 0.8179, "step": 5658 }, { "epoch": 0.79, "learning_rate": 2.305603734470687e-06, "loss": 0.8745, "step": 5659 }, { "epoch": 0.79, "learning_rate": 2.302730968011415e-06, "loss": 0.7686, "step": 5660 }, { "epoch": 0.79, "learning_rate": 2.2998597594978568e-06, "loss": 0.8513, "step": 5661 }, { "epoch": 0.79, "learning_rate": 2.296990109511147e-06, "loss": 0.335, "step": 5662 }, { "epoch": 0.79, "learning_rate": 2.2941220186321147e-06, "loss": 0.8489, "step": 5663 }, { "epoch": 0.79, "learning_rate": 2.2912554874412665e-06, "loss": 0.8418, "step": 5664 }, { "epoch": 0.79, "learning_rate": 2.2883905165187915e-06, "loss": 0.7935, "step": 5665 }, { "epoch": 0.79, "learning_rate": 2.285527106444572e-06, "loss": 0.8264, "step": 5666 }, { "epoch": 0.79, "learning_rate": 2.2826652577981645e-06, "loss": 0.8202, "step": 5667 }, { "epoch": 0.79, "learning_rate": 2.27980497115882e-06, "loss": 0.8237, "step": 5668 }, { "epoch": 0.79, "learning_rate": 2.2769462471054627e-06, "loss": 0.8174, "step": 5669 }, { "epoch": 0.79, "learning_rate": 2.274089086216704e-06, "loss": 0.7837, "step": 5670 }, { "epoch": 0.79, "learning_rate": 2.271233489070845e-06, "loss": 0.8203, "step": 5671 }, { "epoch": 0.79, "learning_rate": 2.2683794562458604e-06, "loss": 0.8276, "step": 5672 }, { "epoch": 0.79, "learning_rate": 2.2655269883194185e-06, "loss": 0.8491, "step": 5673 }, { "epoch": 0.79, "learning_rate": 2.2626760858688634e-06, "loss": 0.8618, "step": 5674 }, { "epoch": 0.79, "learning_rate": 2.25982674947122e-06, "loss": 0.8455, "step": 5675 }, { "epoch": 0.79, "learning_rate": 2.2569789797032083e-06, "loss": 0.8125, "step": 5676 }, { "epoch": 0.79, "learning_rate": 2.254132777141218e-06, "loss": 0.7827, "step": 5677 }, { "epoch": 0.79, "learning_rate": 2.251288142361332e-06, "loss": 0.5847, "step": 5678 }, { "epoch": 0.79, "learning_rate": 2.2484450759393084e-06, "loss": 0.8042, "step": 5679 }, { "epoch": 0.79, "learning_rate": 2.245603578450589e-06, "loss": 0.8267, "step": 5680 }, { "epoch": 0.79, "learning_rate": 2.2427636504703045e-06, "loss": 0.8999, "step": 5681 }, { "epoch": 0.79, "learning_rate": 2.2399252925732573e-06, "loss": 0.8149, "step": 5682 }, { "epoch": 0.79, "learning_rate": 2.237088505333943e-06, "loss": 0.8442, "step": 5683 }, { "epoch": 0.79, "learning_rate": 2.2342532893265335e-06, "loss": 0.7595, "step": 5684 }, { "epoch": 0.79, "learning_rate": 2.231419645124878e-06, "loss": 0.7594, "step": 5685 }, { "epoch": 0.79, "learning_rate": 2.228587573302521e-06, "loss": 0.8589, "step": 5686 }, { "epoch": 0.79, "learning_rate": 2.2257570744326728e-06, "loss": 0.8259, "step": 5687 }, { "epoch": 0.79, "learning_rate": 2.222928149088239e-06, "loss": 0.5824, "step": 5688 }, { "epoch": 0.79, "learning_rate": 2.2201007978418e-06, "loss": 0.8723, "step": 5689 }, { "epoch": 0.79, "learning_rate": 2.2172750212656137e-06, "loss": 0.7703, "step": 5690 }, { "epoch": 0.79, "learning_rate": 2.2144508199316305e-06, "loss": 0.8535, "step": 5691 }, { "epoch": 0.79, "learning_rate": 2.2116281944114693e-06, "loss": 0.8423, "step": 5692 }, { "epoch": 0.79, "learning_rate": 2.2088071452764427e-06, "loss": 0.8223, "step": 5693 }, { "epoch": 0.79, "learning_rate": 2.2059876730975348e-06, "loss": 0.7632, "step": 5694 }, { "epoch": 0.79, "learning_rate": 2.2031697784454108e-06, "loss": 0.8582, "step": 5695 }, { "epoch": 0.79, "learning_rate": 2.200353461890424e-06, "loss": 0.7399, "step": 5696 }, { "epoch": 0.79, "learning_rate": 2.197538724002599e-06, "loss": 0.7966, "step": 5697 }, { "epoch": 0.79, "learning_rate": 2.1947255653516506e-06, "loss": 0.8401, "step": 5698 }, { "epoch": 0.79, "learning_rate": 2.191913986506966e-06, "loss": 0.5333, "step": 5699 }, { "epoch": 0.79, "learning_rate": 2.189103988037614e-06, "loss": 0.8625, "step": 5700 }, { "epoch": 0.79, "learning_rate": 2.186295570512349e-06, "loss": 0.5791, "step": 5701 }, { "epoch": 0.79, "learning_rate": 2.183488734499596e-06, "loss": 0.8362, "step": 5702 }, { "epoch": 0.79, "learning_rate": 2.1806834805674714e-06, "loss": 0.7756, "step": 5703 }, { "epoch": 0.79, "learning_rate": 2.177879809283764e-06, "loss": 0.7988, "step": 5704 }, { "epoch": 0.79, "learning_rate": 2.175077721215938e-06, "loss": 0.8027, "step": 5705 }, { "epoch": 0.79, "learning_rate": 2.172277216931149e-06, "loss": 0.7513, "step": 5706 }, { "epoch": 0.79, "learning_rate": 2.1694782969962223e-06, "loss": 0.8601, "step": 5707 }, { "epoch": 0.79, "learning_rate": 2.16668096197767e-06, "loss": 0.8101, "step": 5708 }, { "epoch": 0.79, "learning_rate": 2.1638852124416755e-06, "loss": 0.7742, "step": 5709 }, { "epoch": 0.79, "learning_rate": 2.1610910489541048e-06, "loss": 0.7847, "step": 5710 }, { "epoch": 0.79, "learning_rate": 2.158298472080507e-06, "loss": 0.7891, "step": 5711 }, { "epoch": 0.79, "learning_rate": 2.1555074823861024e-06, "loss": 0.7732, "step": 5712 }, { "epoch": 0.79, "learning_rate": 2.152718080435798e-06, "loss": 0.8152, "step": 5713 }, { "epoch": 0.79, "learning_rate": 2.1499302667941737e-06, "loss": 0.8499, "step": 5714 }, { "epoch": 0.79, "learning_rate": 2.1471440420254864e-06, "loss": 0.8136, "step": 5715 }, { "epoch": 0.79, "learning_rate": 2.1443594066936803e-06, "loss": 0.8323, "step": 5716 }, { "epoch": 0.79, "learning_rate": 2.1415763613623663e-06, "loss": 0.7881, "step": 5717 }, { "epoch": 0.79, "learning_rate": 2.1387949065948464e-06, "loss": 0.8628, "step": 5718 }, { "epoch": 0.79, "learning_rate": 2.1360150429540895e-06, "loss": 0.7729, "step": 5719 }, { "epoch": 0.79, "learning_rate": 2.1332367710027446e-06, "loss": 0.8032, "step": 5720 }, { "epoch": 0.79, "learning_rate": 2.130460091303146e-06, "loss": 0.7969, "step": 5721 }, { "epoch": 0.79, "learning_rate": 2.127685004417295e-06, "loss": 0.7849, "step": 5722 }, { "epoch": 0.79, "learning_rate": 2.1249115109068807e-06, "loss": 0.8274, "step": 5723 }, { "epoch": 0.8, "learning_rate": 2.1221396113332602e-06, "loss": 0.8452, "step": 5724 }, { "epoch": 0.8, "learning_rate": 2.119369306257477e-06, "loss": 0.7998, "step": 5725 }, { "epoch": 0.8, "learning_rate": 2.116600596240246e-06, "loss": 0.877, "step": 5726 }, { "epoch": 0.8, "learning_rate": 2.113833481841957e-06, "loss": 0.7393, "step": 5727 }, { "epoch": 0.8, "learning_rate": 2.1110679636226873e-06, "loss": 0.8606, "step": 5728 }, { "epoch": 0.8, "learning_rate": 2.1083040421421773e-06, "loss": 0.8252, "step": 5729 }, { "epoch": 0.8, "learning_rate": 2.105541717959858e-06, "loss": 0.7805, "step": 5730 }, { "epoch": 0.8, "learning_rate": 2.1027809916348272e-06, "loss": 0.7819, "step": 5731 }, { "epoch": 0.8, "learning_rate": 2.1000218637258607e-06, "loss": 0.8149, "step": 5732 }, { "epoch": 0.8, "learning_rate": 2.0972643347914166e-06, "loss": 0.8074, "step": 5733 }, { "epoch": 0.8, "learning_rate": 2.0945084053896215e-06, "loss": 0.8154, "step": 5734 }, { "epoch": 0.8, "learning_rate": 2.091754076078285e-06, "loss": 0.7822, "step": 5735 }, { "epoch": 0.8, "learning_rate": 2.089001347414891e-06, "loss": 0.5455, "step": 5736 }, { "epoch": 0.8, "learning_rate": 2.0862502199565926e-06, "loss": 0.8101, "step": 5737 }, { "epoch": 0.8, "learning_rate": 2.0835006942602308e-06, "loss": 0.7922, "step": 5738 }, { "epoch": 0.8, "learning_rate": 2.0807527708823106e-06, "loss": 0.8789, "step": 5739 }, { "epoch": 0.8, "learning_rate": 2.0780064503790254e-06, "loss": 0.803, "step": 5740 }, { "epoch": 0.8, "learning_rate": 2.075261733306232e-06, "loss": 0.33, "step": 5741 }, { "epoch": 0.8, "learning_rate": 2.072518620219467e-06, "loss": 0.8093, "step": 5742 }, { "epoch": 0.8, "learning_rate": 2.069777111673946e-06, "loss": 0.7715, "step": 5743 }, { "epoch": 0.8, "learning_rate": 2.067037208224555e-06, "loss": 0.8152, "step": 5744 }, { "epoch": 0.8, "learning_rate": 2.0642989104258593e-06, "loss": 0.8014, "step": 5745 }, { "epoch": 0.8, "learning_rate": 2.061562218832095e-06, "loss": 0.8123, "step": 5746 }, { "epoch": 0.8, "learning_rate": 2.058827133997173e-06, "loss": 0.7837, "step": 5747 }, { "epoch": 0.8, "learning_rate": 2.056093656474687e-06, "loss": 0.8223, "step": 5748 }, { "epoch": 0.8, "learning_rate": 2.0533617868178935e-06, "loss": 0.842, "step": 5749 }, { "epoch": 0.8, "learning_rate": 2.050631525579733e-06, "loss": 0.7859, "step": 5750 }, { "epoch": 0.8, "learning_rate": 2.047902873312817e-06, "loss": 0.7983, "step": 5751 }, { "epoch": 0.8, "learning_rate": 2.045175830569427e-06, "loss": 0.7969, "step": 5752 }, { "epoch": 0.8, "learning_rate": 2.042450397901529e-06, "loss": 0.8032, "step": 5753 }, { "epoch": 0.8, "learning_rate": 2.039726575860751e-06, "loss": 0.8352, "step": 5754 }, { "epoch": 0.8, "learning_rate": 2.037004364998406e-06, "loss": 0.5815, "step": 5755 }, { "epoch": 0.8, "learning_rate": 2.034283765865476e-06, "loss": 0.8174, "step": 5756 }, { "epoch": 0.8, "learning_rate": 2.0315647790126115e-06, "loss": 0.8176, "step": 5757 }, { "epoch": 0.8, "learning_rate": 2.0288474049901484e-06, "loss": 0.7715, "step": 5758 }, { "epoch": 0.8, "learning_rate": 2.026131644348084e-06, "loss": 0.8303, "step": 5759 }, { "epoch": 0.8, "learning_rate": 2.023417497636101e-06, "loss": 0.778, "step": 5760 }, { "epoch": 0.8, "learning_rate": 2.020704965403545e-06, "loss": 0.8386, "step": 5761 }, { "epoch": 0.8, "learning_rate": 2.0179940481994377e-06, "loss": 0.556, "step": 5762 }, { "epoch": 0.8, "learning_rate": 2.015284746572479e-06, "loss": 0.7639, "step": 5763 }, { "epoch": 0.8, "learning_rate": 2.012577061071035e-06, "loss": 0.7747, "step": 5764 }, { "epoch": 0.8, "learning_rate": 2.0098709922431512e-06, "loss": 0.8157, "step": 5765 }, { "epoch": 0.8, "learning_rate": 2.0071665406365404e-06, "loss": 0.7596, "step": 5766 }, { "epoch": 0.8, "learning_rate": 2.004463706798587e-06, "loss": 0.6205, "step": 5767 }, { "epoch": 0.8, "learning_rate": 2.0017624912763577e-06, "loss": 0.7854, "step": 5768 }, { "epoch": 0.8, "learning_rate": 1.999062894616579e-06, "loss": 0.8315, "step": 5769 }, { "epoch": 0.8, "learning_rate": 1.9963649173656596e-06, "loss": 0.8843, "step": 5770 }, { "epoch": 0.8, "learning_rate": 1.993668560069676e-06, "loss": 0.7847, "step": 5771 }, { "epoch": 0.8, "learning_rate": 1.9909738232743736e-06, "loss": 0.799, "step": 5772 }, { "epoch": 0.8, "learning_rate": 1.9882807075251787e-06, "loss": 0.5352, "step": 5773 }, { "epoch": 0.8, "learning_rate": 1.9855892133671806e-06, "loss": 0.8005, "step": 5774 }, { "epoch": 0.8, "learning_rate": 1.982899341345148e-06, "loss": 0.7852, "step": 5775 }, { "epoch": 0.8, "learning_rate": 1.9802110920035145e-06, "loss": 0.7722, "step": 5776 }, { "epoch": 0.8, "learning_rate": 1.9775244658863868e-06, "loss": 0.8413, "step": 5777 }, { "epoch": 0.8, "learning_rate": 1.974839463537549e-06, "loss": 0.8284, "step": 5778 }, { "epoch": 0.8, "learning_rate": 1.972156085500447e-06, "loss": 0.8264, "step": 5779 }, { "epoch": 0.8, "learning_rate": 1.9694743323182087e-06, "loss": 0.8162, "step": 5780 }, { "epoch": 0.8, "learning_rate": 1.966794204533624e-06, "loss": 0.8618, "step": 5781 }, { "epoch": 0.8, "learning_rate": 1.9641157026891544e-06, "loss": 0.8086, "step": 5782 }, { "epoch": 0.8, "learning_rate": 1.9614388273269415e-06, "loss": 0.7146, "step": 5783 }, { "epoch": 0.8, "learning_rate": 1.9587635789887848e-06, "loss": 0.5679, "step": 5784 }, { "epoch": 0.8, "learning_rate": 1.956089958216166e-06, "loss": 0.8682, "step": 5785 }, { "epoch": 0.8, "learning_rate": 1.953417965550232e-06, "loss": 0.7544, "step": 5786 }, { "epoch": 0.8, "learning_rate": 1.950747601531795e-06, "loss": 0.803, "step": 5787 }, { "epoch": 0.8, "learning_rate": 1.9480788667013507e-06, "loss": 0.5399, "step": 5788 }, { "epoch": 0.8, "learning_rate": 1.94541176159905e-06, "loss": 0.7847, "step": 5789 }, { "epoch": 0.8, "learning_rate": 1.9427462867647285e-06, "loss": 0.8269, "step": 5790 }, { "epoch": 0.8, "learning_rate": 1.9400824427378816e-06, "loss": 0.7993, "step": 5791 }, { "epoch": 0.8, "learning_rate": 1.937420230057674e-06, "loss": 0.7339, "step": 5792 }, { "epoch": 0.8, "learning_rate": 1.9347596492629505e-06, "loss": 0.824, "step": 5793 }, { "epoch": 0.8, "learning_rate": 1.9321007008922134e-06, "loss": 0.8208, "step": 5794 }, { "epoch": 0.8, "learning_rate": 1.929443385483646e-06, "loss": 0.8545, "step": 5795 }, { "epoch": 0.81, "learning_rate": 1.9267877035750916e-06, "loss": 0.821, "step": 5796 }, { "epoch": 0.81, "learning_rate": 1.9241336557040637e-06, "loss": 0.7849, "step": 5797 }, { "epoch": 0.81, "learning_rate": 1.9214812424077545e-06, "loss": 0.7917, "step": 5798 }, { "epoch": 0.81, "learning_rate": 1.9188304642230125e-06, "loss": 0.7054, "step": 5799 }, { "epoch": 0.81, "learning_rate": 1.916181321686368e-06, "loss": 0.8323, "step": 5800 }, { "epoch": 0.81, "learning_rate": 1.91353381533401e-06, "loss": 0.8242, "step": 5801 }, { "epoch": 0.81, "learning_rate": 1.910887945701798e-06, "loss": 0.8042, "step": 5802 }, { "epoch": 0.81, "learning_rate": 1.9082437133252686e-06, "loss": 0.7844, "step": 5803 }, { "epoch": 0.81, "learning_rate": 1.905601118739614e-06, "loss": 0.7565, "step": 5804 }, { "epoch": 0.81, "learning_rate": 1.9029601624797067e-06, "loss": 0.7747, "step": 5805 }, { "epoch": 0.81, "learning_rate": 1.9003208450800814e-06, "loss": 0.5264, "step": 5806 }, { "epoch": 0.81, "learning_rate": 1.8976831670749386e-06, "loss": 0.8441, "step": 5807 }, { "epoch": 0.81, "learning_rate": 1.8950471289981565e-06, "loss": 0.552, "step": 5808 }, { "epoch": 0.81, "learning_rate": 1.8924127313832708e-06, "loss": 0.8616, "step": 5809 }, { "epoch": 0.81, "learning_rate": 1.8897799747634938e-06, "loss": 0.8379, "step": 5810 }, { "epoch": 0.81, "learning_rate": 1.8871488596716992e-06, "loss": 0.8125, "step": 5811 }, { "epoch": 0.81, "learning_rate": 1.8845193866404288e-06, "loss": 0.8157, "step": 5812 }, { "epoch": 0.81, "learning_rate": 1.8818915562019003e-06, "loss": 0.8206, "step": 5813 }, { "epoch": 0.81, "learning_rate": 1.8792653688879869e-06, "loss": 0.8447, "step": 5814 }, { "epoch": 0.81, "learning_rate": 1.8766408252302404e-06, "loss": 0.8022, "step": 5815 }, { "epoch": 0.81, "learning_rate": 1.8740179257598723e-06, "loss": 0.8469, "step": 5816 }, { "epoch": 0.81, "learning_rate": 1.8713966710077602e-06, "loss": 0.8318, "step": 5817 }, { "epoch": 0.81, "learning_rate": 1.8687770615044586e-06, "loss": 0.8159, "step": 5818 }, { "epoch": 0.81, "learning_rate": 1.866159097780178e-06, "loss": 0.8049, "step": 5819 }, { "epoch": 0.81, "learning_rate": 1.8635427803648054e-06, "loss": 0.7561, "step": 5820 }, { "epoch": 0.81, "learning_rate": 1.8609281097878862e-06, "loss": 0.7708, "step": 5821 }, { "epoch": 0.81, "learning_rate": 1.8583150865786338e-06, "loss": 0.7766, "step": 5822 }, { "epoch": 0.81, "learning_rate": 1.855703711265936e-06, "loss": 0.821, "step": 5823 }, { "epoch": 0.81, "learning_rate": 1.8530939843783358e-06, "loss": 0.823, "step": 5824 }, { "epoch": 0.81, "learning_rate": 1.8504859064440539e-06, "loss": 0.8579, "step": 5825 }, { "epoch": 0.81, "learning_rate": 1.847879477990968e-06, "loss": 0.7848, "step": 5826 }, { "epoch": 0.81, "learning_rate": 1.8452746995466242e-06, "loss": 0.8276, "step": 5827 }, { "epoch": 0.81, "learning_rate": 1.8426715716382394e-06, "loss": 0.8516, "step": 5828 }, { "epoch": 0.81, "learning_rate": 1.8400700947926898e-06, "loss": 0.8296, "step": 5829 }, { "epoch": 0.81, "learning_rate": 1.8374702695365232e-06, "loss": 0.749, "step": 5830 }, { "epoch": 0.81, "learning_rate": 1.834872096395951e-06, "loss": 0.7754, "step": 5831 }, { "epoch": 0.81, "learning_rate": 1.8322755758968447e-06, "loss": 0.8147, "step": 5832 }, { "epoch": 0.81, "learning_rate": 1.8296807085647517e-06, "loss": 0.8486, "step": 5833 }, { "epoch": 0.81, "learning_rate": 1.827087494924875e-06, "loss": 0.7136, "step": 5834 }, { "epoch": 0.81, "learning_rate": 1.824495935502092e-06, "loss": 0.7919, "step": 5835 }, { "epoch": 0.81, "learning_rate": 1.821906030820938e-06, "loss": 0.8135, "step": 5836 }, { "epoch": 0.81, "learning_rate": 1.8193177814056129e-06, "loss": 0.7981, "step": 5837 }, { "epoch": 0.81, "learning_rate": 1.816731187779991e-06, "loss": 0.8206, "step": 5838 }, { "epoch": 0.81, "learning_rate": 1.8141462504675988e-06, "loss": 0.7837, "step": 5839 }, { "epoch": 0.81, "learning_rate": 1.8115629699916392e-06, "loss": 0.7577, "step": 5840 }, { "epoch": 0.81, "learning_rate": 1.8089813468749694e-06, "loss": 0.7479, "step": 5841 }, { "epoch": 0.81, "learning_rate": 1.8064013816401217e-06, "loss": 0.8125, "step": 5842 }, { "epoch": 0.81, "learning_rate": 1.8038230748092833e-06, "loss": 0.8184, "step": 5843 }, { "epoch": 0.81, "learning_rate": 1.8012464269043083e-06, "loss": 0.7366, "step": 5844 }, { "epoch": 0.81, "learning_rate": 1.798671438446722e-06, "loss": 0.7727, "step": 5845 }, { "epoch": 0.81, "learning_rate": 1.7960981099577013e-06, "loss": 0.8071, "step": 5846 }, { "epoch": 0.81, "learning_rate": 1.7935264419581e-06, "loss": 0.8384, "step": 5847 }, { "epoch": 0.81, "learning_rate": 1.7909564349684272e-06, "loss": 0.8069, "step": 5848 }, { "epoch": 0.81, "learning_rate": 1.788388089508858e-06, "loss": 0.7571, "step": 5849 }, { "epoch": 0.81, "learning_rate": 1.785821406099233e-06, "loss": 0.7754, "step": 5850 }, { "epoch": 0.81, "learning_rate": 1.7832563852590534e-06, "loss": 0.856, "step": 5851 }, { "epoch": 0.81, "learning_rate": 1.7806930275074885e-06, "loss": 0.8623, "step": 5852 }, { "epoch": 0.81, "learning_rate": 1.7781313333633666e-06, "loss": 0.8162, "step": 5853 }, { "epoch": 0.81, "learning_rate": 1.7755713033451771e-06, "loss": 0.8577, "step": 5854 }, { "epoch": 0.81, "learning_rate": 1.7730129379710824e-06, "loss": 0.7633, "step": 5855 }, { "epoch": 0.81, "learning_rate": 1.7704562377588975e-06, "loss": 0.5608, "step": 5856 }, { "epoch": 0.81, "learning_rate": 1.7679012032261079e-06, "loss": 0.7971, "step": 5857 }, { "epoch": 0.81, "learning_rate": 1.7653478348898557e-06, "loss": 0.8176, "step": 5858 }, { "epoch": 0.81, "learning_rate": 1.7627961332669485e-06, "loss": 0.8711, "step": 5859 }, { "epoch": 0.81, "learning_rate": 1.7602460988738613e-06, "loss": 0.8579, "step": 5860 }, { "epoch": 0.81, "learning_rate": 1.7576977322267208e-06, "loss": 0.8264, "step": 5861 }, { "epoch": 0.81, "learning_rate": 1.755151033841328e-06, "loss": 0.8157, "step": 5862 }, { "epoch": 0.81, "learning_rate": 1.7526060042331394e-06, "loss": 0.7942, "step": 5863 }, { "epoch": 0.81, "learning_rate": 1.7500626439172718e-06, "loss": 0.7656, "step": 5864 }, { "epoch": 0.81, "learning_rate": 1.7475209534085124e-06, "loss": 0.7533, "step": 5865 }, { "epoch": 0.81, "learning_rate": 1.7449809332212996e-06, "loss": 0.7815, "step": 5866 }, { "epoch": 0.81, "learning_rate": 1.7424425838697468e-06, "loss": 0.7915, "step": 5867 }, { "epoch": 0.82, "learning_rate": 1.7399059058676182e-06, "loss": 0.7837, "step": 5868 }, { "epoch": 0.82, "learning_rate": 1.73737089972834e-06, "loss": 0.8132, "step": 5869 }, { "epoch": 0.82, "learning_rate": 1.7348375659650097e-06, "loss": 0.7874, "step": 5870 }, { "epoch": 0.82, "learning_rate": 1.7323059050903757e-06, "loss": 0.7959, "step": 5871 }, { "epoch": 0.82, "learning_rate": 1.7297759176168561e-06, "loss": 0.7947, "step": 5872 }, { "epoch": 0.82, "learning_rate": 1.7272476040565234e-06, "loss": 0.5139, "step": 5873 }, { "epoch": 0.82, "learning_rate": 1.7247209649211138e-06, "loss": 0.8567, "step": 5874 }, { "epoch": 0.82, "learning_rate": 1.7221960007220284e-06, "loss": 0.7957, "step": 5875 }, { "epoch": 0.82, "learning_rate": 1.7196727119703226e-06, "loss": 0.8179, "step": 5876 }, { "epoch": 0.82, "learning_rate": 1.7171510991767192e-06, "loss": 0.8425, "step": 5877 }, { "epoch": 0.82, "learning_rate": 1.7146311628515976e-06, "loss": 0.6609, "step": 5878 }, { "epoch": 0.82, "learning_rate": 1.7121129035049955e-06, "loss": 0.5386, "step": 5879 }, { "epoch": 0.82, "learning_rate": 1.7095963216466216e-06, "loss": 0.8145, "step": 5880 }, { "epoch": 0.82, "learning_rate": 1.7070814177858297e-06, "loss": 0.8215, "step": 5881 }, { "epoch": 0.82, "learning_rate": 1.7045681924316503e-06, "loss": 0.8745, "step": 5882 }, { "epoch": 0.82, "learning_rate": 1.7020566460927624e-06, "loss": 0.8105, "step": 5883 }, { "epoch": 0.82, "learning_rate": 1.6995467792775079e-06, "loss": 0.5931, "step": 5884 }, { "epoch": 0.82, "learning_rate": 1.6970385924938927e-06, "loss": 0.8304, "step": 5885 }, { "epoch": 0.82, "learning_rate": 1.6945320862495763e-06, "loss": 0.8704, "step": 5886 }, { "epoch": 0.82, "learning_rate": 1.6920272610518862e-06, "loss": 0.8053, "step": 5887 }, { "epoch": 0.82, "learning_rate": 1.6895241174078015e-06, "loss": 0.6049, "step": 5888 }, { "epoch": 0.82, "learning_rate": 1.6870226558239645e-06, "loss": 0.8066, "step": 5889 }, { "epoch": 0.82, "learning_rate": 1.6845228768066802e-06, "loss": 0.8447, "step": 5890 }, { "epoch": 0.82, "learning_rate": 1.682024780861904e-06, "loss": 0.854, "step": 5891 }, { "epoch": 0.82, "learning_rate": 1.6795283684952635e-06, "loss": 0.792, "step": 5892 }, { "epoch": 0.82, "learning_rate": 1.6770336402120357e-06, "loss": 0.6206, "step": 5893 }, { "epoch": 0.82, "learning_rate": 1.674540596517157e-06, "loss": 0.7659, "step": 5894 }, { "epoch": 0.82, "learning_rate": 1.6720492379152287e-06, "loss": 0.8442, "step": 5895 }, { "epoch": 0.82, "learning_rate": 1.6695595649105044e-06, "loss": 0.8772, "step": 5896 }, { "epoch": 0.82, "learning_rate": 1.6670715780069058e-06, "loss": 0.8728, "step": 5897 }, { "epoch": 0.82, "learning_rate": 1.6645852777080028e-06, "loss": 0.7548, "step": 5898 }, { "epoch": 0.82, "learning_rate": 1.6621006645170268e-06, "loss": 0.8074, "step": 5899 }, { "epoch": 0.82, "learning_rate": 1.6596177389368751e-06, "loss": 0.7932, "step": 5900 }, { "epoch": 0.82, "learning_rate": 1.6571365014700914e-06, "loss": 0.8247, "step": 5901 }, { "epoch": 0.82, "learning_rate": 1.6546569526188915e-06, "loss": 0.8306, "step": 5902 }, { "epoch": 0.82, "learning_rate": 1.6521790928851367e-06, "loss": 0.8484, "step": 5903 }, { "epoch": 0.82, "learning_rate": 1.649702922770352e-06, "loss": 0.8333, "step": 5904 }, { "epoch": 0.82, "learning_rate": 1.6472284427757224e-06, "loss": 0.8633, "step": 5905 }, { "epoch": 0.82, "learning_rate": 1.6447556534020858e-06, "loss": 0.7932, "step": 5906 }, { "epoch": 0.82, "learning_rate": 1.6422845551499444e-06, "loss": 0.7853, "step": 5907 }, { "epoch": 0.82, "learning_rate": 1.6398151485194525e-06, "loss": 0.8318, "step": 5908 }, { "epoch": 0.82, "learning_rate": 1.6373474340104222e-06, "loss": 0.812, "step": 5909 }, { "epoch": 0.82, "learning_rate": 1.6348814121223278e-06, "loss": 0.7944, "step": 5910 }, { "epoch": 0.82, "learning_rate": 1.632417083354295e-06, "loss": 0.741, "step": 5911 }, { "epoch": 0.82, "learning_rate": 1.6299544482051133e-06, "loss": 0.5693, "step": 5912 }, { "epoch": 0.82, "learning_rate": 1.6274935071732245e-06, "loss": 0.8535, "step": 5913 }, { "epoch": 0.82, "learning_rate": 1.625034260756727e-06, "loss": 0.7622, "step": 5914 }, { "epoch": 0.82, "learning_rate": 1.6225767094533818e-06, "loss": 0.7625, "step": 5915 }, { "epoch": 0.82, "learning_rate": 1.6201208537605984e-06, "loss": 0.7686, "step": 5916 }, { "epoch": 0.82, "learning_rate": 1.6176666941754526e-06, "loss": 0.8616, "step": 5917 }, { "epoch": 0.82, "learning_rate": 1.6152142311946717e-06, "loss": 0.8411, "step": 5918 }, { "epoch": 0.82, "learning_rate": 1.6127634653146352e-06, "loss": 0.8015, "step": 5919 }, { "epoch": 0.82, "learning_rate": 1.6103143970313905e-06, "loss": 0.8721, "step": 5920 }, { "epoch": 0.82, "learning_rate": 1.6078670268406293e-06, "loss": 0.7683, "step": 5921 }, { "epoch": 0.82, "learning_rate": 1.6054213552377096e-06, "loss": 0.7772, "step": 5922 }, { "epoch": 0.82, "learning_rate": 1.6029773827176398e-06, "loss": 0.8013, "step": 5923 }, { "epoch": 0.82, "learning_rate": 1.6005351097750832e-06, "loss": 0.8191, "step": 5924 }, { "epoch": 0.82, "learning_rate": 1.5980945369043655e-06, "loss": 0.6083, "step": 5925 }, { "epoch": 0.82, "learning_rate": 1.5956556645994614e-06, "loss": 0.5444, "step": 5926 }, { "epoch": 0.82, "learning_rate": 1.5932184933540084e-06, "loss": 0.7791, "step": 5927 }, { "epoch": 0.82, "learning_rate": 1.590783023661292e-06, "loss": 0.8091, "step": 5928 }, { "epoch": 0.82, "learning_rate": 1.5883492560142577e-06, "loss": 0.8296, "step": 5929 }, { "epoch": 0.82, "learning_rate": 1.5859171909055083e-06, "loss": 0.7642, "step": 5930 }, { "epoch": 0.82, "learning_rate": 1.5834868288272954e-06, "loss": 0.8914, "step": 5931 }, { "epoch": 0.82, "learning_rate": 1.5810581702715356e-06, "loss": 0.8569, "step": 5932 }, { "epoch": 0.82, "learning_rate": 1.5786312157297922e-06, "loss": 0.7595, "step": 5933 }, { "epoch": 0.82, "learning_rate": 1.5762059656932837e-06, "loss": 0.5765, "step": 5934 }, { "epoch": 0.82, "learning_rate": 1.5737824206528928e-06, "loss": 0.8091, "step": 5935 }, { "epoch": 0.82, "learning_rate": 1.571360581099145e-06, "loss": 0.8357, "step": 5936 }, { "epoch": 0.82, "learning_rate": 1.5689404475222314e-06, "loss": 0.7703, "step": 5937 }, { "epoch": 0.82, "learning_rate": 1.5665220204119903e-06, "loss": 0.8213, "step": 5938 }, { "epoch": 0.82, "learning_rate": 1.5641053002579153e-06, "loss": 0.7861, "step": 5939 }, { "epoch": 0.83, "learning_rate": 1.56169028754916e-06, "loss": 0.821, "step": 5940 }, { "epoch": 0.83, "learning_rate": 1.5592769827745258e-06, "loss": 0.855, "step": 5941 }, { "epoch": 0.83, "learning_rate": 1.5568653864224737e-06, "loss": 0.8623, "step": 5942 }, { "epoch": 0.83, "learning_rate": 1.5544554989811166e-06, "loss": 0.774, "step": 5943 }, { "epoch": 0.83, "learning_rate": 1.552047320938218e-06, "loss": 0.7898, "step": 5944 }, { "epoch": 0.83, "learning_rate": 1.5496408527812034e-06, "loss": 0.8896, "step": 5945 }, { "epoch": 0.83, "learning_rate": 1.5472360949971444e-06, "loss": 0.8191, "step": 5946 }, { "epoch": 0.83, "learning_rate": 1.5448330480727725e-06, "loss": 0.833, "step": 5947 }, { "epoch": 0.83, "learning_rate": 1.5424317124944687e-06, "loss": 0.7905, "step": 5948 }, { "epoch": 0.83, "learning_rate": 1.5400320887482668e-06, "loss": 0.7771, "step": 5949 }, { "epoch": 0.83, "learning_rate": 1.5376341773198611e-06, "loss": 0.8125, "step": 5950 }, { "epoch": 0.83, "learning_rate": 1.5352379786945904e-06, "loss": 0.8171, "step": 5951 }, { "epoch": 0.83, "learning_rate": 1.5328434933574554e-06, "loss": 0.801, "step": 5952 }, { "epoch": 0.83, "learning_rate": 1.530450721793102e-06, "loss": 0.769, "step": 5953 }, { "epoch": 0.83, "learning_rate": 1.5280596644858325e-06, "loss": 0.8518, "step": 5954 }, { "epoch": 0.83, "learning_rate": 1.5256703219196068e-06, "loss": 0.8354, "step": 5955 }, { "epoch": 0.83, "learning_rate": 1.5232826945780278e-06, "loss": 0.8215, "step": 5956 }, { "epoch": 0.83, "learning_rate": 1.5208967829443633e-06, "loss": 0.8657, "step": 5957 }, { "epoch": 0.83, "learning_rate": 1.5185125875015216e-06, "loss": 0.7837, "step": 5958 }, { "epoch": 0.83, "learning_rate": 1.5161301087320746e-06, "loss": 0.7949, "step": 5959 }, { "epoch": 0.83, "learning_rate": 1.5137493471182396e-06, "loss": 0.7844, "step": 5960 }, { "epoch": 0.83, "learning_rate": 1.5113703031418859e-06, "loss": 0.822, "step": 5961 }, { "epoch": 0.83, "learning_rate": 1.5089929772845424e-06, "loss": 0.8157, "step": 5962 }, { "epoch": 0.83, "learning_rate": 1.5066173700273812e-06, "loss": 0.7822, "step": 5963 }, { "epoch": 0.83, "learning_rate": 1.5042434818512353e-06, "loss": 0.5808, "step": 5964 }, { "epoch": 0.83, "learning_rate": 1.5018713132365837e-06, "loss": 0.8525, "step": 5965 }, { "epoch": 0.83, "learning_rate": 1.4995008646635546e-06, "loss": 0.74, "step": 5966 }, { "epoch": 0.83, "learning_rate": 1.4971321366119395e-06, "loss": 0.8303, "step": 5967 }, { "epoch": 0.83, "learning_rate": 1.4947651295611698e-06, "loss": 0.8357, "step": 5968 }, { "epoch": 0.83, "learning_rate": 1.4923998439903364e-06, "loss": 0.8511, "step": 5969 }, { "epoch": 0.83, "learning_rate": 1.4900362803781776e-06, "loss": 0.7668, "step": 5970 }, { "epoch": 0.83, "learning_rate": 1.4876744392030817e-06, "loss": 0.7637, "step": 5971 }, { "epoch": 0.83, "learning_rate": 1.4853143209430954e-06, "loss": 0.8091, "step": 5972 }, { "epoch": 0.83, "learning_rate": 1.4829559260759086e-06, "loss": 0.7711, "step": 5973 }, { "epoch": 0.83, "learning_rate": 1.4805992550788706e-06, "loss": 0.7864, "step": 5974 }, { "epoch": 0.83, "learning_rate": 1.4782443084289734e-06, "loss": 0.7632, "step": 5975 }, { "epoch": 0.83, "learning_rate": 1.475891086602863e-06, "loss": 0.8048, "step": 5976 }, { "epoch": 0.83, "learning_rate": 1.4735395900768411e-06, "loss": 0.7952, "step": 5977 }, { "epoch": 0.83, "learning_rate": 1.4711898193268527e-06, "loss": 0.7766, "step": 5978 }, { "epoch": 0.83, "learning_rate": 1.4688417748285e-06, "loss": 0.8618, "step": 5979 }, { "epoch": 0.83, "learning_rate": 1.4664954570570322e-06, "loss": 0.5341, "step": 5980 }, { "epoch": 0.83, "learning_rate": 1.464150866487346e-06, "loss": 0.7769, "step": 5981 }, { "epoch": 0.83, "learning_rate": 1.4618080035939974e-06, "loss": 0.7949, "step": 5982 }, { "epoch": 0.83, "learning_rate": 1.4594668688511826e-06, "loss": 0.7762, "step": 5983 }, { "epoch": 0.83, "learning_rate": 1.4571274627327581e-06, "loss": 0.8318, "step": 5984 }, { "epoch": 0.83, "learning_rate": 1.4547897857122217e-06, "loss": 0.7686, "step": 5985 }, { "epoch": 0.83, "learning_rate": 1.4524538382627241e-06, "loss": 0.8638, "step": 5986 }, { "epoch": 0.83, "learning_rate": 1.45011962085707e-06, "loss": 0.7174, "step": 5987 }, { "epoch": 0.83, "learning_rate": 1.4477871339677073e-06, "loss": 0.8289, "step": 5988 }, { "epoch": 0.83, "learning_rate": 1.4454563780667398e-06, "loss": 0.686, "step": 5989 }, { "epoch": 0.83, "learning_rate": 1.4431273536259171e-06, "loss": 0.855, "step": 5990 }, { "epoch": 0.83, "learning_rate": 1.4408000611166372e-06, "loss": 0.8346, "step": 5991 }, { "epoch": 0.83, "learning_rate": 1.4384745010099533e-06, "loss": 0.782, "step": 5992 }, { "epoch": 0.83, "learning_rate": 1.436150673776563e-06, "loss": 0.8025, "step": 5993 }, { "epoch": 0.83, "learning_rate": 1.4338285798868113e-06, "loss": 0.8018, "step": 5994 }, { "epoch": 0.83, "learning_rate": 1.4315082198107012e-06, "loss": 0.7942, "step": 5995 }, { "epoch": 0.83, "learning_rate": 1.4291895940178724e-06, "loss": 0.7842, "step": 5996 }, { "epoch": 0.83, "learning_rate": 1.4268727029776276e-06, "loss": 0.79, "step": 5997 }, { "epoch": 0.83, "learning_rate": 1.424557547158908e-06, "loss": 0.5934, "step": 5998 }, { "epoch": 0.83, "learning_rate": 1.4222441270303034e-06, "loss": 0.7881, "step": 5999 }, { "epoch": 0.83, "learning_rate": 1.4199324430600614e-06, "loss": 0.8474, "step": 6000 }, { "epoch": 0.83, "learning_rate": 1.4176224957160668e-06, "loss": 0.8445, "step": 6001 }, { "epoch": 0.83, "learning_rate": 1.4153142854658631e-06, "loss": 0.5626, "step": 6002 }, { "epoch": 0.83, "learning_rate": 1.4130078127766367e-06, "loss": 0.7925, "step": 6003 }, { "epoch": 0.83, "learning_rate": 1.4107030781152188e-06, "loss": 0.8276, "step": 6004 }, { "epoch": 0.83, "learning_rate": 1.4084000819481002e-06, "loss": 0.5524, "step": 6005 }, { "epoch": 0.83, "learning_rate": 1.4060988247414064e-06, "loss": 0.8267, "step": 6006 }, { "epoch": 0.83, "learning_rate": 1.4037993069609223e-06, "loss": 0.8032, "step": 6007 }, { "epoch": 0.83, "learning_rate": 1.4015015290720734e-06, "loss": 0.7549, "step": 6008 }, { "epoch": 0.83, "learning_rate": 1.3992054915399344e-06, "loss": 0.7998, "step": 6009 }, { "epoch": 0.83, "learning_rate": 1.3969111948292314e-06, "loss": 0.8492, "step": 6010 }, { "epoch": 0.83, "learning_rate": 1.3946186394043326e-06, "loss": 0.8425, "step": 6011 }, { "epoch": 0.84, "learning_rate": 1.3923278257292615e-06, "loss": 0.791, "step": 6012 }, { "epoch": 0.84, "learning_rate": 1.3900387542676808e-06, "loss": 0.7969, "step": 6013 }, { "epoch": 0.84, "learning_rate": 1.3877514254829017e-06, "loss": 0.7791, "step": 6014 }, { "epoch": 0.84, "learning_rate": 1.3854658398378907e-06, "loss": 0.7932, "step": 6015 }, { "epoch": 0.84, "learning_rate": 1.3831819977952532e-06, "loss": 0.8013, "step": 6016 }, { "epoch": 0.84, "learning_rate": 1.3808998998172406e-06, "loss": 0.8279, "step": 6017 }, { "epoch": 0.84, "learning_rate": 1.3786195463657626e-06, "loss": 0.8169, "step": 6018 }, { "epoch": 0.84, "learning_rate": 1.3763409379023607e-06, "loss": 0.7247, "step": 6019 }, { "epoch": 0.84, "learning_rate": 1.374064074888236e-06, "loss": 0.8271, "step": 6020 }, { "epoch": 0.84, "learning_rate": 1.371788957784229e-06, "loss": 0.8293, "step": 6021 }, { "epoch": 0.84, "learning_rate": 1.3695155870508282e-06, "loss": 0.7694, "step": 6022 }, { "epoch": 0.84, "learning_rate": 1.3672439631481716e-06, "loss": 0.7734, "step": 6023 }, { "epoch": 0.84, "learning_rate": 1.3649740865360373e-06, "loss": 0.7496, "step": 6024 }, { "epoch": 0.84, "learning_rate": 1.3627059576738588e-06, "loss": 0.7567, "step": 6025 }, { "epoch": 0.84, "learning_rate": 1.3604395770207079e-06, "loss": 0.8694, "step": 6026 }, { "epoch": 0.84, "learning_rate": 1.3581749450353044e-06, "loss": 0.8325, "step": 6027 }, { "epoch": 0.84, "learning_rate": 1.355912062176018e-06, "loss": 0.8335, "step": 6028 }, { "epoch": 0.84, "learning_rate": 1.3536509289008582e-06, "loss": 0.5734, "step": 6029 }, { "epoch": 0.84, "learning_rate": 1.3513915456674887e-06, "loss": 0.8384, "step": 6030 }, { "epoch": 0.84, "learning_rate": 1.3491339129332115e-06, "loss": 0.7998, "step": 6031 }, { "epoch": 0.84, "learning_rate": 1.3468780311549744e-06, "loss": 0.8176, "step": 6032 }, { "epoch": 0.84, "learning_rate": 1.3446239007893768e-06, "loss": 0.7979, "step": 6033 }, { "epoch": 0.84, "learning_rate": 1.342371522292658e-06, "loss": 0.8079, "step": 6034 }, { "epoch": 0.84, "learning_rate": 1.340120896120707e-06, "loss": 0.7645, "step": 6035 }, { "epoch": 0.84, "learning_rate": 1.3378720227290553e-06, "loss": 0.8584, "step": 6036 }, { "epoch": 0.84, "learning_rate": 1.3356249025728773e-06, "loss": 0.8013, "step": 6037 }, { "epoch": 0.84, "learning_rate": 1.333379536106999e-06, "loss": 0.855, "step": 6038 }, { "epoch": 0.84, "learning_rate": 1.3311359237858857e-06, "loss": 0.7986, "step": 6039 }, { "epoch": 0.84, "learning_rate": 1.3288940660636528e-06, "loss": 0.7854, "step": 6040 }, { "epoch": 0.84, "learning_rate": 1.3266539633940555e-06, "loss": 0.8196, "step": 6041 }, { "epoch": 0.84, "learning_rate": 1.3244156162304945e-06, "loss": 0.8103, "step": 6042 }, { "epoch": 0.84, "learning_rate": 1.3221790250260203e-06, "loss": 0.7249, "step": 6043 }, { "epoch": 0.84, "learning_rate": 1.3199441902333231e-06, "loss": 0.772, "step": 6044 }, { "epoch": 0.84, "learning_rate": 1.317711112304736e-06, "loss": 0.8154, "step": 6045 }, { "epoch": 0.84, "learning_rate": 1.3154797916922423e-06, "loss": 0.7993, "step": 6046 }, { "epoch": 0.84, "learning_rate": 1.3132502288474659e-06, "loss": 0.7856, "step": 6047 }, { "epoch": 0.84, "learning_rate": 1.3110224242216762e-06, "loss": 0.7711, "step": 6048 }, { "epoch": 0.84, "learning_rate": 1.3087963782657852e-06, "loss": 0.8491, "step": 6049 }, { "epoch": 0.84, "learning_rate": 1.3065720914303493e-06, "loss": 0.8149, "step": 6050 }, { "epoch": 0.84, "learning_rate": 1.3043495641655725e-06, "loss": 0.8835, "step": 6051 }, { "epoch": 0.84, "learning_rate": 1.302128796921296e-06, "loss": 0.7859, "step": 6052 }, { "epoch": 0.84, "learning_rate": 1.2999097901470114e-06, "loss": 0.8523, "step": 6053 }, { "epoch": 0.84, "learning_rate": 1.2976925442918498e-06, "loss": 0.748, "step": 6054 }, { "epoch": 0.84, "learning_rate": 1.2954770598045852e-06, "loss": 0.8391, "step": 6055 }, { "epoch": 0.84, "learning_rate": 1.2932633371336411e-06, "loss": 0.8201, "step": 6056 }, { "epoch": 0.84, "learning_rate": 1.291051376727075e-06, "loss": 0.8113, "step": 6057 }, { "epoch": 0.84, "learning_rate": 1.2888411790325983e-06, "loss": 0.8298, "step": 6058 }, { "epoch": 0.84, "learning_rate": 1.2866327444975578e-06, "loss": 0.7729, "step": 6059 }, { "epoch": 0.84, "learning_rate": 1.284426073568945e-06, "loss": 0.7991, "step": 6060 }, { "epoch": 0.84, "learning_rate": 1.2822211666933982e-06, "loss": 0.8118, "step": 6061 }, { "epoch": 0.84, "learning_rate": 1.2800180243171912e-06, "loss": 0.865, "step": 6062 }, { "epoch": 0.84, "learning_rate": 1.2778166468862507e-06, "loss": 0.7712, "step": 6063 }, { "epoch": 0.84, "learning_rate": 1.2756170348461383e-06, "loss": 0.8684, "step": 6064 }, { "epoch": 0.84, "learning_rate": 1.273419188642059e-06, "loss": 0.8071, "step": 6065 }, { "epoch": 0.84, "learning_rate": 1.2712231087188654e-06, "loss": 0.8188, "step": 6066 }, { "epoch": 0.84, "learning_rate": 1.2690287955210479e-06, "loss": 0.7927, "step": 6067 }, { "epoch": 0.84, "learning_rate": 1.266836249492739e-06, "loss": 0.7996, "step": 6068 }, { "epoch": 0.84, "learning_rate": 1.2646454710777189e-06, "loss": 0.8043, "step": 6069 }, { "epoch": 0.84, "learning_rate": 1.2624564607194022e-06, "loss": 0.823, "step": 6070 }, { "epoch": 0.84, "learning_rate": 1.2602692188608546e-06, "loss": 0.8041, "step": 6071 }, { "epoch": 0.84, "learning_rate": 1.258083745944776e-06, "loss": 0.8533, "step": 6072 }, { "epoch": 0.84, "learning_rate": 1.2559000424135103e-06, "loss": 0.8196, "step": 6073 }, { "epoch": 0.84, "learning_rate": 1.2537181087090477e-06, "loss": 0.802, "step": 6074 }, { "epoch": 0.84, "learning_rate": 1.2515379452730137e-06, "loss": 0.8931, "step": 6075 }, { "epoch": 0.84, "learning_rate": 1.2493595525466817e-06, "loss": 0.7688, "step": 6076 }, { "epoch": 0.84, "learning_rate": 1.2471829309709615e-06, "loss": 0.8806, "step": 6077 }, { "epoch": 0.84, "learning_rate": 1.2450080809864063e-06, "loss": 0.7488, "step": 6078 }, { "epoch": 0.84, "learning_rate": 1.2428350030332126e-06, "loss": 0.8315, "step": 6079 }, { "epoch": 0.84, "learning_rate": 1.2406636975512132e-06, "loss": 0.8472, "step": 6080 }, { "epoch": 0.84, "learning_rate": 1.2384941649798897e-06, "loss": 0.7898, "step": 6081 }, { "epoch": 0.84, "learning_rate": 1.2363264057583601e-06, "loss": 0.8336, "step": 6082 }, { "epoch": 0.84, "learning_rate": 1.2341604203253798e-06, "loss": 0.8057, "step": 6083 }, { "epoch": 0.85, "learning_rate": 1.231996209119356e-06, "loss": 0.7797, "step": 6084 }, { "epoch": 0.85, "learning_rate": 1.2298337725783238e-06, "loss": 0.7981, "step": 6085 }, { "epoch": 0.85, "learning_rate": 1.2276731111399697e-06, "loss": 0.8098, "step": 6086 }, { "epoch": 0.85, "learning_rate": 1.2255142252416174e-06, "loss": 0.8252, "step": 6087 }, { "epoch": 0.85, "learning_rate": 1.223357115320225e-06, "loss": 0.8267, "step": 6088 }, { "epoch": 0.85, "learning_rate": 1.2212017818124033e-06, "loss": 0.8435, "step": 6089 }, { "epoch": 0.85, "learning_rate": 1.2190482251543923e-06, "loss": 0.8293, "step": 6090 }, { "epoch": 0.85, "learning_rate": 1.2168964457820808e-06, "loss": 0.824, "step": 6091 }, { "epoch": 0.85, "learning_rate": 1.2147464441309919e-06, "loss": 0.8335, "step": 6092 }, { "epoch": 0.85, "learning_rate": 1.2125982206362896e-06, "loss": 0.8508, "step": 6093 }, { "epoch": 0.85, "learning_rate": 1.2104517757327838e-06, "loss": 0.7631, "step": 6094 }, { "epoch": 0.85, "learning_rate": 1.2083071098549148e-06, "loss": 0.8031, "step": 6095 }, { "epoch": 0.85, "learning_rate": 1.2061642234367733e-06, "loss": 0.7576, "step": 6096 }, { "epoch": 0.85, "learning_rate": 1.204023116912082e-06, "loss": 0.8359, "step": 6097 }, { "epoch": 0.85, "learning_rate": 1.2018837907142046e-06, "loss": 0.7982, "step": 6098 }, { "epoch": 0.85, "learning_rate": 1.199746245276149e-06, "loss": 0.8457, "step": 6099 }, { "epoch": 0.85, "learning_rate": 1.1976104810305556e-06, "loss": 0.8096, "step": 6100 }, { "epoch": 0.85, "learning_rate": 1.1954764984097133e-06, "loss": 0.7776, "step": 6101 }, { "epoch": 0.85, "learning_rate": 1.1933442978455423e-06, "loss": 0.5606, "step": 6102 }, { "epoch": 0.85, "learning_rate": 1.1912138797696037e-06, "loss": 0.8127, "step": 6103 }, { "epoch": 0.85, "learning_rate": 1.189085244613103e-06, "loss": 0.8267, "step": 6104 }, { "epoch": 0.85, "learning_rate": 1.1869583928068763e-06, "loss": 0.7808, "step": 6105 }, { "epoch": 0.85, "learning_rate": 1.1848333247814093e-06, "loss": 0.752, "step": 6106 }, { "epoch": 0.85, "learning_rate": 1.1827100409668169e-06, "loss": 0.8481, "step": 6107 }, { "epoch": 0.85, "learning_rate": 1.1805885417928553e-06, "loss": 0.7427, "step": 6108 }, { "epoch": 0.85, "learning_rate": 1.1784688276889268e-06, "loss": 0.7554, "step": 6109 }, { "epoch": 0.85, "learning_rate": 1.17635089908406e-06, "loss": 0.8423, "step": 6110 }, { "epoch": 0.85, "learning_rate": 1.1742347564069345e-06, "loss": 0.8163, "step": 6111 }, { "epoch": 0.85, "learning_rate": 1.17212040008586e-06, "loss": 0.7605, "step": 6112 }, { "epoch": 0.85, "learning_rate": 1.1700078305487861e-06, "loss": 0.8373, "step": 6113 }, { "epoch": 0.85, "learning_rate": 1.1678970482233043e-06, "loss": 0.7732, "step": 6114 }, { "epoch": 0.85, "learning_rate": 1.1657880535366395e-06, "loss": 0.8076, "step": 6115 }, { "epoch": 0.85, "learning_rate": 1.1636808469156601e-06, "loss": 0.7424, "step": 6116 }, { "epoch": 0.85, "learning_rate": 1.1615754287868697e-06, "loss": 0.8477, "step": 6117 }, { "epoch": 0.85, "learning_rate": 1.159471799576406e-06, "loss": 0.5876, "step": 6118 }, { "epoch": 0.85, "learning_rate": 1.157369959710053e-06, "loss": 0.8142, "step": 6119 }, { "epoch": 0.85, "learning_rate": 1.1552699096132247e-06, "loss": 0.7693, "step": 6120 }, { "epoch": 0.85, "learning_rate": 1.1531716497109802e-06, "loss": 0.7686, "step": 6121 }, { "epoch": 0.85, "learning_rate": 1.1510751804280096e-06, "loss": 0.7756, "step": 6122 }, { "epoch": 0.85, "learning_rate": 1.1489805021886414e-06, "loss": 0.8342, "step": 6123 }, { "epoch": 0.85, "learning_rate": 1.1468876154168495e-06, "loss": 0.845, "step": 6124 }, { "epoch": 0.85, "learning_rate": 1.1447965205362321e-06, "loss": 0.593, "step": 6125 }, { "epoch": 0.85, "learning_rate": 1.1427072179700383e-06, "loss": 0.8184, "step": 6126 }, { "epoch": 0.85, "learning_rate": 1.1406197081411452e-06, "loss": 0.7878, "step": 6127 }, { "epoch": 0.85, "learning_rate": 1.1385339914720673e-06, "loss": 0.8167, "step": 6128 }, { "epoch": 0.85, "learning_rate": 1.1364500683849623e-06, "loss": 0.8281, "step": 6129 }, { "epoch": 0.85, "learning_rate": 1.1343679393016182e-06, "loss": 0.7729, "step": 6130 }, { "epoch": 0.85, "learning_rate": 1.1322876046434673e-06, "loss": 0.7217, "step": 6131 }, { "epoch": 0.85, "learning_rate": 1.130209064831571e-06, "loss": 0.7745, "step": 6132 }, { "epoch": 0.85, "learning_rate": 1.1281323202866302e-06, "loss": 0.853, "step": 6133 }, { "epoch": 0.85, "learning_rate": 1.1260573714289847e-06, "loss": 0.7998, "step": 6134 }, { "epoch": 0.85, "learning_rate": 1.1239842186786077e-06, "loss": 0.8271, "step": 6135 }, { "epoch": 0.85, "learning_rate": 1.1219128624551134e-06, "loss": 0.8164, "step": 6136 }, { "epoch": 0.85, "learning_rate": 1.1198433031777466e-06, "loss": 0.8069, "step": 6137 }, { "epoch": 0.85, "learning_rate": 1.117775541265389e-06, "loss": 0.8467, "step": 6138 }, { "epoch": 0.85, "learning_rate": 1.1157095771365655e-06, "loss": 0.5923, "step": 6139 }, { "epoch": 0.85, "learning_rate": 1.1136454112094275e-06, "loss": 0.8096, "step": 6140 }, { "epoch": 0.85, "learning_rate": 1.1115830439017717e-06, "loss": 0.8115, "step": 6141 }, { "epoch": 0.85, "learning_rate": 1.1095224756310241e-06, "loss": 0.7297, "step": 6142 }, { "epoch": 0.85, "learning_rate": 1.1074637068142469e-06, "loss": 0.8247, "step": 6143 }, { "epoch": 0.85, "learning_rate": 1.105406737868142e-06, "loss": 0.7744, "step": 6144 }, { "epoch": 0.85, "learning_rate": 1.1033515692090436e-06, "loss": 0.5688, "step": 6145 }, { "epoch": 0.85, "learning_rate": 1.101298201252924e-06, "loss": 0.7329, "step": 6146 }, { "epoch": 0.85, "learning_rate": 1.0992466344153906e-06, "loss": 0.7473, "step": 6147 }, { "epoch": 0.85, "learning_rate": 1.0971968691116807e-06, "loss": 0.8018, "step": 6148 }, { "epoch": 0.85, "learning_rate": 1.0951489057566778e-06, "loss": 0.7759, "step": 6149 }, { "epoch": 0.85, "learning_rate": 1.09310274476489e-06, "loss": 0.7788, "step": 6150 }, { "epoch": 0.85, "learning_rate": 1.0910583865504688e-06, "loss": 0.8298, "step": 6151 }, { "epoch": 0.85, "learning_rate": 1.0890158315271959e-06, "loss": 0.8223, "step": 6152 }, { "epoch": 0.85, "learning_rate": 1.0869750801084867e-06, "loss": 0.8257, "step": 6153 }, { "epoch": 0.85, "learning_rate": 1.0849361327073983e-06, "loss": 0.7993, "step": 6154 }, { "epoch": 0.85, "learning_rate": 1.0828989897366138e-06, "loss": 0.8508, "step": 6155 }, { "epoch": 0.86, "learning_rate": 1.0808636516084613e-06, "loss": 0.7756, "step": 6156 }, { "epoch": 0.86, "learning_rate": 1.0788301187348959e-06, "loss": 0.8198, "step": 6157 }, { "epoch": 0.86, "learning_rate": 1.0767983915275071e-06, "loss": 0.8765, "step": 6158 }, { "epoch": 0.86, "learning_rate": 1.0747684703975247e-06, "loss": 0.7997, "step": 6159 }, { "epoch": 0.86, "learning_rate": 1.072740355755807e-06, "loss": 0.8064, "step": 6160 }, { "epoch": 0.86, "learning_rate": 1.070714048012852e-06, "loss": 0.8025, "step": 6161 }, { "epoch": 0.86, "learning_rate": 1.0686895475787873e-06, "loss": 0.7644, "step": 6162 }, { "epoch": 0.86, "learning_rate": 1.0666668548633764e-06, "loss": 0.7874, "step": 6163 }, { "epoch": 0.86, "learning_rate": 1.0646459702760182e-06, "loss": 0.5715, "step": 6164 }, { "epoch": 0.86, "learning_rate": 1.0626268942257433e-06, "loss": 0.804, "step": 6165 }, { "epoch": 0.86, "learning_rate": 1.0606096271212207e-06, "loss": 0.8147, "step": 6166 }, { "epoch": 0.86, "learning_rate": 1.058594169370748e-06, "loss": 0.8174, "step": 6167 }, { "epoch": 0.86, "learning_rate": 1.0565805213822555e-06, "loss": 0.8018, "step": 6168 }, { "epoch": 0.86, "learning_rate": 1.0545686835633161e-06, "loss": 0.8318, "step": 6169 }, { "epoch": 0.86, "learning_rate": 1.0525586563211255e-06, "loss": 0.7925, "step": 6170 }, { "epoch": 0.86, "learning_rate": 1.0505504400625233e-06, "loss": 0.7643, "step": 6171 }, { "epoch": 0.86, "learning_rate": 1.0485440351939735e-06, "loss": 0.8328, "step": 6172 }, { "epoch": 0.86, "learning_rate": 1.046539442121577e-06, "loss": 0.797, "step": 6173 }, { "epoch": 0.86, "learning_rate": 1.044536661251072e-06, "loss": 0.8047, "step": 6174 }, { "epoch": 0.86, "learning_rate": 1.0425356929878205e-06, "loss": 0.791, "step": 6175 }, { "epoch": 0.86, "learning_rate": 1.0405365377368292e-06, "loss": 0.7422, "step": 6176 }, { "epoch": 0.86, "learning_rate": 1.038539195902728e-06, "loss": 0.8506, "step": 6177 }, { "epoch": 0.86, "learning_rate": 1.0365436678897834e-06, "loss": 0.8188, "step": 6178 }, { "epoch": 0.86, "learning_rate": 1.0345499541018989e-06, "loss": 0.785, "step": 6179 }, { "epoch": 0.86, "learning_rate": 1.0325580549426017e-06, "loss": 0.8276, "step": 6180 }, { "epoch": 0.86, "learning_rate": 1.030567970815063e-06, "loss": 0.7937, "step": 6181 }, { "epoch": 0.86, "learning_rate": 1.0285797021220768e-06, "loss": 0.7852, "step": 6182 }, { "epoch": 0.86, "learning_rate": 1.0265932492660713e-06, "loss": 0.8423, "step": 6183 }, { "epoch": 0.86, "learning_rate": 1.024608612649115e-06, "loss": 0.8391, "step": 6184 }, { "epoch": 0.86, "learning_rate": 1.0226257926728977e-06, "loss": 0.7688, "step": 6185 }, { "epoch": 0.86, "learning_rate": 1.0206447897387506e-06, "loss": 0.8127, "step": 6186 }, { "epoch": 0.86, "learning_rate": 1.018665604247634e-06, "loss": 0.8125, "step": 6187 }, { "epoch": 0.86, "learning_rate": 1.0166882366001341e-06, "loss": 0.8467, "step": 6188 }, { "epoch": 0.86, "learning_rate": 1.014712687196482e-06, "loss": 0.7664, "step": 6189 }, { "epoch": 0.86, "learning_rate": 1.0127389564365287e-06, "loss": 0.7662, "step": 6190 }, { "epoch": 0.86, "learning_rate": 1.0107670447197648e-06, "loss": 0.7715, "step": 6191 }, { "epoch": 0.86, "learning_rate": 1.0087969524453089e-06, "loss": 0.7957, "step": 6192 }, { "epoch": 0.86, "learning_rate": 1.0068286800119109e-06, "loss": 0.8303, "step": 6193 }, { "epoch": 0.86, "learning_rate": 1.0048622278179577e-06, "loss": 0.8601, "step": 6194 }, { "epoch": 0.86, "learning_rate": 1.0028975962614585e-06, "loss": 0.7468, "step": 6195 }, { "epoch": 0.86, "learning_rate": 1.0009347857400653e-06, "loss": 0.7932, "step": 6196 }, { "epoch": 0.86, "learning_rate": 9.989737966510504e-07, "loss": 0.7784, "step": 6197 }, { "epoch": 0.86, "learning_rate": 9.970146293913275e-07, "loss": 0.8457, "step": 6198 }, { "epoch": 0.86, "learning_rate": 9.950572843574346e-07, "loss": 0.8589, "step": 6199 }, { "epoch": 0.86, "learning_rate": 9.931017619455408e-07, "loss": 0.75, "step": 6200 }, { "epoch": 0.86, "learning_rate": 9.911480625514525e-07, "loss": 0.884, "step": 6201 }, { "epoch": 0.86, "learning_rate": 9.89196186570599e-07, "loss": 0.7732, "step": 6202 }, { "epoch": 0.86, "learning_rate": 9.872461343980488e-07, "loss": 0.772, "step": 6203 }, { "epoch": 0.86, "learning_rate": 9.852979064284961e-07, "loss": 0.8042, "step": 6204 }, { "epoch": 0.86, "learning_rate": 9.833515030562634e-07, "loss": 0.8813, "step": 6205 }, { "epoch": 0.86, "learning_rate": 9.814069246753122e-07, "loss": 0.7495, "step": 6206 }, { "epoch": 0.86, "learning_rate": 9.794641716792265e-07, "loss": 0.7963, "step": 6207 }, { "epoch": 0.86, "learning_rate": 9.77523244461226e-07, "loss": 0.7271, "step": 6208 }, { "epoch": 0.86, "learning_rate": 9.755841434141589e-07, "loss": 0.7585, "step": 6209 }, { "epoch": 0.86, "learning_rate": 9.736468689305024e-07, "loss": 0.7754, "step": 6210 }, { "epoch": 0.86, "learning_rate": 9.71711421402367e-07, "loss": 0.782, "step": 6211 }, { "epoch": 0.86, "learning_rate": 9.697778012214899e-07, "loss": 0.5442, "step": 6212 }, { "epoch": 0.86, "learning_rate": 9.678460087792442e-07, "loss": 0.8333, "step": 6213 }, { "epoch": 0.86, "learning_rate": 9.659160444666272e-07, "loss": 0.8274, "step": 6214 }, { "epoch": 0.86, "learning_rate": 9.639879086742666e-07, "loss": 0.814, "step": 6215 }, { "epoch": 0.86, "learning_rate": 9.620616017924245e-07, "loss": 0.7915, "step": 6216 }, { "epoch": 0.86, "learning_rate": 9.60137124210987e-07, "loss": 0.7297, "step": 6217 }, { "epoch": 0.86, "learning_rate": 9.582144763194767e-07, "loss": 0.7856, "step": 6218 }, { "epoch": 0.86, "learning_rate": 9.562936585070404e-07, "loss": 0.7988, "step": 6219 }, { "epoch": 0.86, "learning_rate": 9.543746711624546e-07, "loss": 0.8245, "step": 6220 }, { "epoch": 0.86, "learning_rate": 9.524575146741299e-07, "loss": 0.7876, "step": 6221 }, { "epoch": 0.86, "learning_rate": 9.505421894301003e-07, "loss": 0.7773, "step": 6222 }, { "epoch": 0.86, "learning_rate": 9.486286958180357e-07, "loss": 0.7402, "step": 6223 }, { "epoch": 0.86, "learning_rate": 9.467170342252297e-07, "loss": 0.8325, "step": 6224 }, { "epoch": 0.86, "learning_rate": 9.448072050386048e-07, "loss": 0.7253, "step": 6225 }, { "epoch": 0.86, "learning_rate": 9.428992086447208e-07, "loss": 0.8206, "step": 6226 }, { "epoch": 0.86, "learning_rate": 9.409930454297556e-07, "loss": 0.7876, "step": 6227 }, { "epoch": 0.87, "learning_rate": 9.390887157795247e-07, "loss": 0.7917, "step": 6228 }, { "epoch": 0.87, "learning_rate": 9.371862200794668e-07, "loss": 0.736, "step": 6229 }, { "epoch": 0.87, "learning_rate": 9.352855587146514e-07, "loss": 0.7947, "step": 6230 }, { "epoch": 0.87, "learning_rate": 9.333867320697798e-07, "loss": 0.8479, "step": 6231 }, { "epoch": 0.87, "learning_rate": 9.314897405291746e-07, "loss": 0.8589, "step": 6232 }, { "epoch": 0.87, "learning_rate": 9.295945844767962e-07, "loss": 0.8464, "step": 6233 }, { "epoch": 0.87, "learning_rate": 9.277012642962258e-07, "loss": 0.8345, "step": 6234 }, { "epoch": 0.87, "learning_rate": 9.258097803706745e-07, "loss": 0.791, "step": 6235 }, { "epoch": 0.87, "learning_rate": 9.239201330829883e-07, "loss": 0.8274, "step": 6236 }, { "epoch": 0.87, "learning_rate": 9.220323228156302e-07, "loss": 0.5745, "step": 6237 }, { "epoch": 0.87, "learning_rate": 9.201463499507035e-07, "loss": 0.8235, "step": 6238 }, { "epoch": 0.87, "learning_rate": 9.182622148699305e-07, "loss": 0.5691, "step": 6239 }, { "epoch": 0.87, "learning_rate": 9.163799179546617e-07, "loss": 0.7991, "step": 6240 }, { "epoch": 0.87, "learning_rate": 9.144994595858858e-07, "loss": 0.5288, "step": 6241 }, { "epoch": 0.87, "learning_rate": 9.12620840144205e-07, "loss": 0.7125, "step": 6242 }, { "epoch": 0.87, "learning_rate": 9.107440600098605e-07, "loss": 0.8423, "step": 6243 }, { "epoch": 0.87, "learning_rate": 9.088691195627164e-07, "loss": 0.5308, "step": 6244 }, { "epoch": 0.87, "learning_rate": 9.069960191822635e-07, "loss": 0.8713, "step": 6245 }, { "epoch": 0.87, "learning_rate": 9.051247592476254e-07, "loss": 0.6292, "step": 6246 }, { "epoch": 0.87, "learning_rate": 9.032553401375444e-07, "loss": 0.8065, "step": 6247 }, { "epoch": 0.87, "learning_rate": 9.013877622304001e-07, "loss": 0.7615, "step": 6248 }, { "epoch": 0.87, "learning_rate": 8.995220259041926e-07, "loss": 0.8325, "step": 6249 }, { "epoch": 0.87, "learning_rate": 8.976581315365506e-07, "loss": 0.798, "step": 6250 }, { "epoch": 0.87, "learning_rate": 8.957960795047327e-07, "loss": 0.7798, "step": 6251 }, { "epoch": 0.87, "learning_rate": 8.939358701856216e-07, "loss": 0.7563, "step": 6252 }, { "epoch": 0.87, "learning_rate": 8.920775039557294e-07, "loss": 0.7573, "step": 6253 }, { "epoch": 0.87, "learning_rate": 8.902209811911921e-07, "loss": 0.8048, "step": 6254 }, { "epoch": 0.87, "learning_rate": 8.883663022677746e-07, "loss": 0.7939, "step": 6255 }, { "epoch": 0.87, "learning_rate": 8.8651346756087e-07, "loss": 0.5874, "step": 6256 }, { "epoch": 0.87, "learning_rate": 8.846624774454937e-07, "loss": 0.7856, "step": 6257 }, { "epoch": 0.87, "learning_rate": 8.828133322962939e-07, "loss": 0.7369, "step": 6258 }, { "epoch": 0.87, "learning_rate": 8.809660324875413e-07, "loss": 0.7937, "step": 6259 }, { "epoch": 0.87, "learning_rate": 8.7912057839313e-07, "loss": 0.7883, "step": 6260 }, { "epoch": 0.87, "learning_rate": 8.772769703865891e-07, "loss": 0.8123, "step": 6261 }, { "epoch": 0.87, "learning_rate": 8.754352088410655e-07, "loss": 0.7623, "step": 6262 }, { "epoch": 0.87, "learning_rate": 8.735952941293402e-07, "loss": 0.7915, "step": 6263 }, { "epoch": 0.87, "learning_rate": 8.71757226623815e-07, "loss": 0.7888, "step": 6264 }, { "epoch": 0.87, "learning_rate": 8.699210066965158e-07, "loss": 0.8513, "step": 6265 }, { "epoch": 0.87, "learning_rate": 8.68086634719102e-07, "loss": 0.813, "step": 6266 }, { "epoch": 0.87, "learning_rate": 8.662541110628509e-07, "loss": 0.7935, "step": 6267 }, { "epoch": 0.87, "learning_rate": 8.644234360986747e-07, "loss": 0.8315, "step": 6268 }, { "epoch": 0.87, "learning_rate": 8.625946101971039e-07, "loss": 0.7668, "step": 6269 }, { "epoch": 0.87, "learning_rate": 8.607676337282955e-07, "loss": 0.7537, "step": 6270 }, { "epoch": 0.87, "learning_rate": 8.589425070620372e-07, "loss": 0.8274, "step": 6271 }, { "epoch": 0.87, "learning_rate": 8.571192305677368e-07, "loss": 0.7635, "step": 6272 }, { "epoch": 0.87, "learning_rate": 8.552978046144311e-07, "loss": 0.8411, "step": 6273 }, { "epoch": 0.87, "learning_rate": 8.5347822957078e-07, "loss": 0.771, "step": 6274 }, { "epoch": 0.87, "learning_rate": 8.516605058050686e-07, "loss": 0.7642, "step": 6275 }, { "epoch": 0.87, "learning_rate": 8.498446336852128e-07, "loss": 0.7472, "step": 6276 }, { "epoch": 0.87, "learning_rate": 8.480306135787453e-07, "loss": 0.5669, "step": 6277 }, { "epoch": 0.87, "learning_rate": 8.4621844585283e-07, "loss": 0.7841, "step": 6278 }, { "epoch": 0.87, "learning_rate": 8.444081308742546e-07, "loss": 0.7888, "step": 6279 }, { "epoch": 0.87, "learning_rate": 8.425996690094295e-07, "loss": 0.7521, "step": 6280 }, { "epoch": 0.87, "learning_rate": 8.407930606243931e-07, "loss": 0.7817, "step": 6281 }, { "epoch": 0.87, "learning_rate": 8.389883060848059e-07, "loss": 0.8286, "step": 6282 }, { "epoch": 0.87, "learning_rate": 8.371854057559558e-07, "loss": 0.7795, "step": 6283 }, { "epoch": 0.87, "learning_rate": 8.353843600027544e-07, "loss": 0.5349, "step": 6284 }, { "epoch": 0.87, "learning_rate": 8.335851691897356e-07, "loss": 0.8062, "step": 6285 }, { "epoch": 0.87, "learning_rate": 8.317878336810625e-07, "loss": 0.8291, "step": 6286 }, { "epoch": 0.87, "learning_rate": 8.299923538405175e-07, "loss": 0.8569, "step": 6287 }, { "epoch": 0.87, "learning_rate": 8.28198730031513e-07, "loss": 0.7888, "step": 6288 }, { "epoch": 0.87, "learning_rate": 8.264069626170812e-07, "loss": 0.7942, "step": 6289 }, { "epoch": 0.87, "learning_rate": 8.246170519598784e-07, "loss": 0.792, "step": 6290 }, { "epoch": 0.87, "learning_rate": 8.228289984221905e-07, "loss": 0.8149, "step": 6291 }, { "epoch": 0.87, "learning_rate": 8.2104280236592e-07, "loss": 0.7603, "step": 6292 }, { "epoch": 0.87, "learning_rate": 8.192584641526014e-07, "loss": 0.561, "step": 6293 }, { "epoch": 0.87, "learning_rate": 8.174759841433866e-07, "loss": 0.7837, "step": 6294 }, { "epoch": 0.87, "learning_rate": 8.156953626990516e-07, "loss": 0.7397, "step": 6295 }, { "epoch": 0.87, "learning_rate": 8.139166001800036e-07, "loss": 0.8284, "step": 6296 }, { "epoch": 0.87, "learning_rate": 8.121396969462625e-07, "loss": 0.8188, "step": 6297 }, { "epoch": 0.87, "learning_rate": 8.103646533574838e-07, "loss": 0.866, "step": 6298 }, { "epoch": 0.87, "learning_rate": 8.08591469772938e-07, "loss": 0.8689, "step": 6299 }, { "epoch": 0.88, "learning_rate": 8.068201465515191e-07, "loss": 0.772, "step": 6300 }, { "epoch": 0.88, "learning_rate": 8.050506840517513e-07, "loss": 0.8337, "step": 6301 }, { "epoch": 0.88, "learning_rate": 8.032830826317739e-07, "loss": 0.8018, "step": 6302 }, { "epoch": 0.88, "learning_rate": 8.015173426493583e-07, "loss": 0.7769, "step": 6303 }, { "epoch": 0.88, "learning_rate": 7.997534644618921e-07, "loss": 0.7161, "step": 6304 }, { "epoch": 0.88, "learning_rate": 7.979914484263873e-07, "loss": 0.7603, "step": 6305 }, { "epoch": 0.88, "learning_rate": 7.962312948994822e-07, "loss": 0.7844, "step": 6306 }, { "epoch": 0.88, "learning_rate": 7.944730042374349e-07, "loss": 0.7339, "step": 6307 }, { "epoch": 0.88, "learning_rate": 7.927165767961286e-07, "loss": 0.8789, "step": 6308 }, { "epoch": 0.88, "learning_rate": 7.909620129310691e-07, "loss": 0.8262, "step": 6309 }, { "epoch": 0.88, "learning_rate": 7.89209312997381e-07, "loss": 0.5512, "step": 6310 }, { "epoch": 0.88, "learning_rate": 7.874584773498184e-07, "loss": 0.781, "step": 6311 }, { "epoch": 0.88, "learning_rate": 7.857095063427522e-07, "loss": 0.8547, "step": 6312 }, { "epoch": 0.88, "learning_rate": 7.839624003301804e-07, "loss": 0.7385, "step": 6313 }, { "epoch": 0.88, "learning_rate": 7.822171596657202e-07, "loss": 0.7966, "step": 6314 }, { "epoch": 0.88, "learning_rate": 7.804737847026134e-07, "loss": 0.8235, "step": 6315 }, { "epoch": 0.88, "learning_rate": 7.787322757937233e-07, "loss": 0.8369, "step": 6316 }, { "epoch": 0.88, "learning_rate": 7.769926332915323e-07, "loss": 0.8335, "step": 6317 }, { "epoch": 0.88, "learning_rate": 7.752548575481533e-07, "loss": 0.8059, "step": 6318 }, { "epoch": 0.88, "learning_rate": 7.735189489153128e-07, "loss": 0.7075, "step": 6319 }, { "epoch": 0.88, "learning_rate": 7.71784907744364e-07, "loss": 0.8264, "step": 6320 }, { "epoch": 0.88, "learning_rate": 7.700527343862818e-07, "loss": 0.7671, "step": 6321 }, { "epoch": 0.88, "learning_rate": 7.683224291916592e-07, "loss": 0.8252, "step": 6322 }, { "epoch": 0.88, "learning_rate": 7.66593992510718e-07, "loss": 0.8115, "step": 6323 }, { "epoch": 0.88, "learning_rate": 7.648674246932941e-07, "loss": 0.8203, "step": 6324 }, { "epoch": 0.88, "learning_rate": 7.631427260888536e-07, "loss": 0.8522, "step": 6325 }, { "epoch": 0.88, "learning_rate": 7.61419897046477e-07, "loss": 0.844, "step": 6326 }, { "epoch": 0.88, "learning_rate": 7.596989379148667e-07, "loss": 0.8096, "step": 6327 }, { "epoch": 0.88, "learning_rate": 7.579798490423529e-07, "loss": 0.8545, "step": 6328 }, { "epoch": 0.88, "learning_rate": 7.562626307768805e-07, "loss": 0.822, "step": 6329 }, { "epoch": 0.88, "learning_rate": 7.545472834660217e-07, "loss": 0.8306, "step": 6330 }, { "epoch": 0.88, "learning_rate": 7.528338074569642e-07, "loss": 0.8323, "step": 6331 }, { "epoch": 0.88, "learning_rate": 7.511222030965193e-07, "loss": 0.8384, "step": 6332 }, { "epoch": 0.88, "learning_rate": 7.494124707311235e-07, "loss": 0.7988, "step": 6333 }, { "epoch": 0.88, "learning_rate": 7.477046107068253e-07, "loss": 0.7727, "step": 6334 }, { "epoch": 0.88, "learning_rate": 7.459986233693051e-07, "loss": 0.782, "step": 6335 }, { "epoch": 0.88, "learning_rate": 7.442945090638554e-07, "loss": 0.8459, "step": 6336 }, { "epoch": 0.88, "learning_rate": 7.425922681353937e-07, "loss": 0.8379, "step": 6337 }, { "epoch": 0.88, "learning_rate": 7.408919009284588e-07, "loss": 0.7747, "step": 6338 }, { "epoch": 0.88, "learning_rate": 7.391934077872065e-07, "loss": 0.77, "step": 6339 }, { "epoch": 0.88, "learning_rate": 7.374967890554185e-07, "loss": 0.8213, "step": 6340 }, { "epoch": 0.88, "learning_rate": 7.358020450764947e-07, "loss": 0.8269, "step": 6341 }, { "epoch": 0.88, "learning_rate": 7.341091761934527e-07, "loss": 0.783, "step": 6342 }, { "epoch": 0.88, "learning_rate": 7.324181827489352e-07, "loss": 0.8118, "step": 6343 }, { "epoch": 0.88, "learning_rate": 7.307290650852028e-07, "loss": 0.7487, "step": 6344 }, { "epoch": 0.88, "learning_rate": 7.290418235441377e-07, "loss": 0.7917, "step": 6345 }, { "epoch": 0.88, "learning_rate": 7.27356458467241e-07, "loss": 0.7759, "step": 6346 }, { "epoch": 0.88, "learning_rate": 7.256729701956334e-07, "loss": 0.8245, "step": 6347 }, { "epoch": 0.88, "learning_rate": 7.239913590700598e-07, "loss": 0.8167, "step": 6348 }, { "epoch": 0.88, "learning_rate": 7.223116254308793e-07, "loss": 0.7944, "step": 6349 }, { "epoch": 0.88, "learning_rate": 7.206337696180765e-07, "loss": 0.803, "step": 6350 }, { "epoch": 0.88, "learning_rate": 7.18957791971252e-07, "loss": 0.7701, "step": 6351 }, { "epoch": 0.88, "learning_rate": 7.172836928296278e-07, "loss": 0.8047, "step": 6352 }, { "epoch": 0.88, "learning_rate": 7.156114725320463e-07, "loss": 0.7542, "step": 6353 }, { "epoch": 0.88, "learning_rate": 7.139411314169675e-07, "loss": 0.8398, "step": 6354 }, { "epoch": 0.88, "learning_rate": 7.122726698224747e-07, "loss": 0.7791, "step": 6355 }, { "epoch": 0.88, "learning_rate": 7.106060880862675e-07, "loss": 0.7776, "step": 6356 }, { "epoch": 0.88, "learning_rate": 7.08941386545664e-07, "loss": 0.8088, "step": 6357 }, { "epoch": 0.88, "learning_rate": 7.072785655376069e-07, "loss": 0.8042, "step": 6358 }, { "epoch": 0.88, "learning_rate": 7.056176253986524e-07, "loss": 0.7876, "step": 6359 }, { "epoch": 0.88, "learning_rate": 7.039585664649817e-07, "loss": 0.7712, "step": 6360 }, { "epoch": 0.88, "learning_rate": 7.023013890723906e-07, "loss": 0.9084, "step": 6361 }, { "epoch": 0.88, "learning_rate": 7.006460935562942e-07, "loss": 0.74, "step": 6362 }, { "epoch": 0.88, "learning_rate": 6.989926802517322e-07, "loss": 0.8093, "step": 6363 }, { "epoch": 0.88, "learning_rate": 6.973411494933558e-07, "loss": 0.7672, "step": 6364 }, { "epoch": 0.88, "learning_rate": 6.956915016154408e-07, "loss": 0.7856, "step": 6365 }, { "epoch": 0.88, "learning_rate": 6.940437369518805e-07, "loss": 0.804, "step": 6366 }, { "epoch": 0.88, "learning_rate": 6.923978558361833e-07, "loss": 0.8521, "step": 6367 }, { "epoch": 0.88, "learning_rate": 6.907538586014828e-07, "loss": 0.7625, "step": 6368 }, { "epoch": 0.88, "learning_rate": 6.891117455805252e-07, "loss": 0.8171, "step": 6369 }, { "epoch": 0.88, "learning_rate": 6.874715171056811e-07, "loss": 0.8198, "step": 6370 }, { "epoch": 0.88, "learning_rate": 6.858331735089352e-07, "loss": 0.7458, "step": 6371 }, { "epoch": 0.89, "learning_rate": 6.841967151218898e-07, "loss": 0.8328, "step": 6372 }, { "epoch": 0.89, "learning_rate": 6.825621422757733e-07, "loss": 0.7684, "step": 6373 }, { "epoch": 0.89, "learning_rate": 6.809294553014212e-07, "loss": 0.7986, "step": 6374 }, { "epoch": 0.89, "learning_rate": 6.79298654529299e-07, "loss": 0.7864, "step": 6375 }, { "epoch": 0.89, "learning_rate": 6.776697402894805e-07, "loss": 0.5878, "step": 6376 }, { "epoch": 0.89, "learning_rate": 6.760427129116632e-07, "loss": 0.7734, "step": 6377 }, { "epoch": 0.89, "learning_rate": 6.744175727251612e-07, "loss": 0.8032, "step": 6378 }, { "epoch": 0.89, "learning_rate": 6.727943200589071e-07, "loss": 0.7737, "step": 6379 }, { "epoch": 0.89, "learning_rate": 6.711729552414515e-07, "loss": 0.7864, "step": 6380 }, { "epoch": 0.89, "learning_rate": 6.695534786009628e-07, "loss": 0.8594, "step": 6381 }, { "epoch": 0.89, "learning_rate": 6.679358904652234e-07, "loss": 0.7922, "step": 6382 }, { "epoch": 0.89, "learning_rate": 6.663201911616423e-07, "loss": 0.8589, "step": 6383 }, { "epoch": 0.89, "learning_rate": 6.647063810172361e-07, "loss": 0.8608, "step": 6384 }, { "epoch": 0.89, "learning_rate": 6.630944603586486e-07, "loss": 0.8499, "step": 6385 }, { "epoch": 0.89, "learning_rate": 6.614844295121337e-07, "loss": 0.8315, "step": 6386 }, { "epoch": 0.89, "learning_rate": 6.598762888035637e-07, "loss": 0.791, "step": 6387 }, { "epoch": 0.89, "learning_rate": 6.58270038558434e-07, "loss": 0.8132, "step": 6388 }, { "epoch": 0.89, "learning_rate": 6.566656791018511e-07, "loss": 0.8245, "step": 6389 }, { "epoch": 0.89, "learning_rate": 6.55063210758542e-07, "loss": 0.8064, "step": 6390 }, { "epoch": 0.89, "learning_rate": 6.534626338528504e-07, "loss": 0.8596, "step": 6391 }, { "epoch": 0.89, "learning_rate": 6.518639487087353e-07, "loss": 0.5543, "step": 6392 }, { "epoch": 0.89, "learning_rate": 6.502671556497764e-07, "loss": 0.8091, "step": 6393 }, { "epoch": 0.89, "learning_rate": 6.486722549991664e-07, "loss": 0.8157, "step": 6394 }, { "epoch": 0.89, "learning_rate": 6.470792470797204e-07, "loss": 0.8416, "step": 6395 }, { "epoch": 0.89, "learning_rate": 6.45488132213864e-07, "loss": 0.7402, "step": 6396 }, { "epoch": 0.89, "learning_rate": 6.438989107236415e-07, "loss": 0.8618, "step": 6397 }, { "epoch": 0.89, "learning_rate": 6.423115829307203e-07, "loss": 0.8547, "step": 6398 }, { "epoch": 0.89, "learning_rate": 6.407261491563732e-07, "loss": 0.5459, "step": 6399 }, { "epoch": 0.89, "learning_rate": 6.391426097215004e-07, "loss": 0.8414, "step": 6400 }, { "epoch": 0.89, "learning_rate": 6.37560964946613e-07, "loss": 0.5508, "step": 6401 }, { "epoch": 0.89, "learning_rate": 6.359812151518374e-07, "loss": 0.5423, "step": 6402 }, { "epoch": 0.89, "learning_rate": 6.344033606569223e-07, "loss": 0.6057, "step": 6403 }, { "epoch": 0.89, "learning_rate": 6.328274017812252e-07, "loss": 0.8171, "step": 6404 }, { "epoch": 0.89, "learning_rate": 6.312533388437292e-07, "loss": 0.7471, "step": 6405 }, { "epoch": 0.89, "learning_rate": 6.296811721630236e-07, "loss": 0.8179, "step": 6406 }, { "epoch": 0.89, "learning_rate": 6.281109020573206e-07, "loss": 0.7778, "step": 6407 }, { "epoch": 0.89, "learning_rate": 6.265425288444471e-07, "loss": 0.8628, "step": 6408 }, { "epoch": 0.89, "learning_rate": 6.249760528418436e-07, "loss": 0.823, "step": 6409 }, { "epoch": 0.89, "learning_rate": 6.23411474366572e-07, "loss": 0.8359, "step": 6410 }, { "epoch": 0.89, "learning_rate": 6.218487937353046e-07, "loss": 0.791, "step": 6411 }, { "epoch": 0.89, "learning_rate": 6.202880112643305e-07, "loss": 0.8296, "step": 6412 }, { "epoch": 0.89, "learning_rate": 6.187291272695584e-07, "loss": 0.8218, "step": 6413 }, { "epoch": 0.89, "learning_rate": 6.171721420665078e-07, "loss": 0.8337, "step": 6414 }, { "epoch": 0.89, "learning_rate": 6.156170559703179e-07, "loss": 0.7821, "step": 6415 }, { "epoch": 0.89, "learning_rate": 6.140638692957424e-07, "loss": 0.8254, "step": 6416 }, { "epoch": 0.89, "learning_rate": 6.125125823571476e-07, "loss": 0.7725, "step": 6417 }, { "epoch": 0.89, "learning_rate": 6.109631954685202e-07, "loss": 0.8047, "step": 6418 }, { "epoch": 0.89, "learning_rate": 6.094157089434571e-07, "loss": 0.6111, "step": 6419 }, { "epoch": 0.89, "learning_rate": 6.078701230951767e-07, "loss": 0.8259, "step": 6420 }, { "epoch": 0.89, "learning_rate": 6.063264382365075e-07, "loss": 0.7649, "step": 6421 }, { "epoch": 0.89, "learning_rate": 6.04784654679893e-07, "loss": 0.5779, "step": 6422 }, { "epoch": 0.89, "learning_rate": 6.032447727373969e-07, "loss": 0.8171, "step": 6423 }, { "epoch": 0.89, "learning_rate": 6.017067927206932e-07, "loss": 0.8264, "step": 6424 }, { "epoch": 0.89, "learning_rate": 6.001707149410752e-07, "loss": 0.782, "step": 6425 }, { "epoch": 0.89, "learning_rate": 5.986365397094463e-07, "loss": 0.7388, "step": 6426 }, { "epoch": 0.89, "learning_rate": 5.97104267336327e-07, "loss": 0.7773, "step": 6427 }, { "epoch": 0.89, "learning_rate": 5.95573898131856e-07, "loss": 0.7729, "step": 6428 }, { "epoch": 0.89, "learning_rate": 5.940454324057788e-07, "loss": 0.7954, "step": 6429 }, { "epoch": 0.89, "learning_rate": 5.925188704674656e-07, "loss": 0.7969, "step": 6430 }, { "epoch": 0.89, "learning_rate": 5.909942126258928e-07, "loss": 0.7712, "step": 6431 }, { "epoch": 0.89, "learning_rate": 5.894714591896567e-07, "loss": 0.7913, "step": 6432 }, { "epoch": 0.89, "learning_rate": 5.879506104669653e-07, "loss": 0.7781, "step": 6433 }, { "epoch": 0.89, "learning_rate": 5.864316667656411e-07, "loss": 0.7517, "step": 6434 }, { "epoch": 0.89, "learning_rate": 5.84914628393124e-07, "loss": 0.557, "step": 6435 }, { "epoch": 0.89, "learning_rate": 5.833994956564648e-07, "loss": 0.7954, "step": 6436 }, { "epoch": 0.89, "learning_rate": 5.818862688623306e-07, "loss": 0.8071, "step": 6437 }, { "epoch": 0.89, "learning_rate": 5.803749483170029e-07, "loss": 0.5889, "step": 6438 }, { "epoch": 0.89, "learning_rate": 5.788655343263739e-07, "loss": 0.7576, "step": 6439 }, { "epoch": 0.89, "learning_rate": 5.773580271959555e-07, "loss": 0.8201, "step": 6440 }, { "epoch": 0.89, "learning_rate": 5.758524272308685e-07, "loss": 0.824, "step": 6441 }, { "epoch": 0.89, "learning_rate": 5.743487347358534e-07, "loss": 0.5836, "step": 6442 }, { "epoch": 0.89, "learning_rate": 5.728469500152578e-07, "loss": 0.813, "step": 6443 }, { "epoch": 0.9, "learning_rate": 5.713470733730465e-07, "loss": 0.8542, "step": 6444 }, { "epoch": 0.9, "learning_rate": 5.698491051127997e-07, "loss": 0.8013, "step": 6445 }, { "epoch": 0.9, "learning_rate": 5.683530455377095e-07, "loss": 0.8726, "step": 6446 }, { "epoch": 0.9, "learning_rate": 5.668588949505816e-07, "loss": 0.6318, "step": 6447 }, { "epoch": 0.9, "learning_rate": 5.653666536538371e-07, "loss": 0.8762, "step": 6448 }, { "epoch": 0.9, "learning_rate": 5.638763219495058e-07, "loss": 0.811, "step": 6449 }, { "epoch": 0.9, "learning_rate": 5.623879001392373e-07, "loss": 0.5594, "step": 6450 }, { "epoch": 0.9, "learning_rate": 5.609013885242909e-07, "loss": 0.8555, "step": 6451 }, { "epoch": 0.9, "learning_rate": 5.594167874055412e-07, "loss": 0.7766, "step": 6452 }, { "epoch": 0.9, "learning_rate": 5.579340970834734e-07, "loss": 0.8062, "step": 6453 }, { "epoch": 0.9, "learning_rate": 5.564533178581866e-07, "loss": 0.8579, "step": 6454 }, { "epoch": 0.9, "learning_rate": 5.549744500293974e-07, "loss": 0.8372, "step": 6455 }, { "epoch": 0.9, "learning_rate": 5.53497493896431e-07, "loss": 0.782, "step": 6456 }, { "epoch": 0.9, "learning_rate": 5.520224497582249e-07, "loss": 0.5421, "step": 6457 }, { "epoch": 0.9, "learning_rate": 5.505493179133336e-07, "loss": 0.5312, "step": 6458 }, { "epoch": 0.9, "learning_rate": 5.490780986599209e-07, "loss": 0.5364, "step": 6459 }, { "epoch": 0.9, "learning_rate": 5.476087922957674e-07, "loss": 0.7839, "step": 6460 }, { "epoch": 0.9, "learning_rate": 5.461413991182629e-07, "loss": 0.7678, "step": 6461 }, { "epoch": 0.9, "learning_rate": 5.4467591942441e-07, "loss": 0.7524, "step": 6462 }, { "epoch": 0.9, "learning_rate": 5.432123535108281e-07, "loss": 0.5758, "step": 6463 }, { "epoch": 0.9, "learning_rate": 5.417507016737433e-07, "loss": 0.7795, "step": 6464 }, { "epoch": 0.9, "learning_rate": 5.402909642090015e-07, "loss": 0.7566, "step": 6465 }, { "epoch": 0.9, "learning_rate": 5.38833141412054e-07, "loss": 0.8347, "step": 6466 }, { "epoch": 0.9, "learning_rate": 5.373772335779659e-07, "loss": 0.8145, "step": 6467 }, { "epoch": 0.9, "learning_rate": 5.359232410014215e-07, "loss": 0.8521, "step": 6468 }, { "epoch": 0.9, "learning_rate": 5.344711639767086e-07, "loss": 0.8086, "step": 6469 }, { "epoch": 0.9, "learning_rate": 5.330210027977323e-07, "loss": 0.8108, "step": 6470 }, { "epoch": 0.9, "learning_rate": 5.315727577580099e-07, "loss": 0.5401, "step": 6471 }, { "epoch": 0.9, "learning_rate": 5.301264291506658e-07, "loss": 0.834, "step": 6472 }, { "epoch": 0.9, "learning_rate": 5.286820172684449e-07, "loss": 0.7803, "step": 6473 }, { "epoch": 0.9, "learning_rate": 5.272395224036963e-07, "loss": 0.8118, "step": 6474 }, { "epoch": 0.9, "learning_rate": 5.25798944848388e-07, "loss": 0.7419, "step": 6475 }, { "epoch": 0.9, "learning_rate": 5.243602848940932e-07, "loss": 0.8184, "step": 6476 }, { "epoch": 0.9, "learning_rate": 5.229235428320001e-07, "loss": 0.7108, "step": 6477 }, { "epoch": 0.9, "learning_rate": 5.214887189529105e-07, "loss": 0.8041, "step": 6478 }, { "epoch": 0.9, "learning_rate": 5.200558135472344e-07, "loss": 0.7461, "step": 6479 }, { "epoch": 0.9, "learning_rate": 5.186248269049976e-07, "loss": 0.7852, "step": 6480 }, { "epoch": 0.9, "learning_rate": 5.171957593158339e-07, "loss": 0.7876, "step": 6481 }, { "epoch": 0.9, "learning_rate": 5.157686110689886e-07, "loss": 0.5597, "step": 6482 }, { "epoch": 0.9, "learning_rate": 5.143433824533239e-07, "loss": 0.7365, "step": 6483 }, { "epoch": 0.9, "learning_rate": 5.129200737573059e-07, "loss": 0.6233, "step": 6484 }, { "epoch": 0.9, "learning_rate": 5.114986852690151e-07, "loss": 0.7542, "step": 6485 }, { "epoch": 0.9, "learning_rate": 5.10079217276147e-07, "loss": 0.8235, "step": 6486 }, { "epoch": 0.9, "learning_rate": 5.08661670066003e-07, "loss": 0.7827, "step": 6487 }, { "epoch": 0.9, "learning_rate": 5.072460439255e-07, "loss": 0.7977, "step": 6488 }, { "epoch": 0.9, "learning_rate": 5.058323391411634e-07, "loss": 0.8186, "step": 6489 }, { "epoch": 0.9, "learning_rate": 5.044205559991288e-07, "loss": 0.7964, "step": 6490 }, { "epoch": 0.9, "learning_rate": 5.030106947851476e-07, "loss": 0.7316, "step": 6491 }, { "epoch": 0.9, "learning_rate": 5.016027557845749e-07, "loss": 0.8225, "step": 6492 }, { "epoch": 0.9, "learning_rate": 5.001967392823859e-07, "loss": 0.8091, "step": 6493 }, { "epoch": 0.9, "learning_rate": 4.987926455631586e-07, "loss": 0.5923, "step": 6494 }, { "epoch": 0.9, "learning_rate": 4.973904749110836e-07, "loss": 0.8298, "step": 6495 }, { "epoch": 0.9, "learning_rate": 4.959902276099671e-07, "loss": 0.8704, "step": 6496 }, { "epoch": 0.9, "learning_rate": 4.945919039432201e-07, "loss": 0.8247, "step": 6497 }, { "epoch": 0.9, "learning_rate": 4.931955041938686e-07, "loss": 0.8374, "step": 6498 }, { "epoch": 0.9, "learning_rate": 4.918010286445452e-07, "loss": 0.7988, "step": 6499 }, { "epoch": 0.9, "learning_rate": 4.904084775774964e-07, "loss": 0.8494, "step": 6500 }, { "epoch": 0.9, "learning_rate": 4.89017851274578e-07, "loss": 0.8015, "step": 6501 }, { "epoch": 0.9, "learning_rate": 4.876291500172536e-07, "loss": 0.8508, "step": 6502 }, { "epoch": 0.9, "learning_rate": 4.86242374086604e-07, "loss": 0.7837, "step": 6503 }, { "epoch": 0.9, "learning_rate": 4.848575237633136e-07, "loss": 0.7484, "step": 6504 }, { "epoch": 0.9, "learning_rate": 4.834745993276768e-07, "loss": 0.8408, "step": 6505 }, { "epoch": 0.9, "learning_rate": 4.820936010596066e-07, "loss": 0.8145, "step": 6506 }, { "epoch": 0.9, "learning_rate": 4.807145292386162e-07, "loss": 0.7606, "step": 6507 }, { "epoch": 0.9, "learning_rate": 4.793373841438332e-07, "loss": 0.7991, "step": 6508 }, { "epoch": 0.9, "learning_rate": 4.779621660539969e-07, "loss": 0.8411, "step": 6509 }, { "epoch": 0.9, "learning_rate": 4.7658887524745237e-07, "loss": 0.7639, "step": 6510 }, { "epoch": 0.9, "learning_rate": 4.752175120021607e-07, "loss": 0.7944, "step": 6511 }, { "epoch": 0.9, "learning_rate": 4.7384807659568543e-07, "loss": 0.7578, "step": 6512 }, { "epoch": 0.9, "learning_rate": 4.724805693052048e-07, "loss": 0.738, "step": 6513 }, { "epoch": 0.9, "learning_rate": 4.711149904075063e-07, "loss": 0.7643, "step": 6514 }, { "epoch": 0.9, "learning_rate": 4.697513401789844e-07, "loss": 0.5946, "step": 6515 }, { "epoch": 0.91, "learning_rate": 4.6838961889564826e-07, "loss": 0.7825, "step": 6516 }, { "epoch": 0.91, "learning_rate": 4.6702982683311193e-07, "loss": 0.8149, "step": 6517 }, { "epoch": 0.91, "learning_rate": 4.6567196426659964e-07, "loss": 0.8159, "step": 6518 }, { "epoch": 0.91, "learning_rate": 4.6431603147094716e-07, "loss": 0.5881, "step": 6519 }, { "epoch": 0.91, "learning_rate": 4.6296202872059714e-07, "loss": 0.8154, "step": 6520 }, { "epoch": 0.91, "learning_rate": 4.616099562896059e-07, "loss": 0.8267, "step": 6521 }, { "epoch": 0.91, "learning_rate": 4.602598144516335e-07, "loss": 0.7733, "step": 6522 }, { "epoch": 0.91, "learning_rate": 4.5891160347995234e-07, "loss": 0.8281, "step": 6523 }, { "epoch": 0.91, "learning_rate": 4.575653236474442e-07, "loss": 0.7703, "step": 6524 }, { "epoch": 0.91, "learning_rate": 4.562209752265989e-07, "loss": 0.8057, "step": 6525 }, { "epoch": 0.91, "learning_rate": 4.5487855848951656e-07, "loss": 0.8176, "step": 6526 }, { "epoch": 0.91, "learning_rate": 4.5353807370790537e-07, "loss": 0.7659, "step": 6527 }, { "epoch": 0.91, "learning_rate": 4.521995211530805e-07, "loss": 0.7871, "step": 6528 }, { "epoch": 0.91, "learning_rate": 4.5086290109597195e-07, "loss": 0.7991, "step": 6529 }, { "epoch": 0.91, "learning_rate": 4.495282138071122e-07, "loss": 0.8271, "step": 6530 }, { "epoch": 0.91, "learning_rate": 4.481954595566451e-07, "loss": 0.8091, "step": 6531 }, { "epoch": 0.91, "learning_rate": 4.4686463861432384e-07, "loss": 0.8063, "step": 6532 }, { "epoch": 0.91, "learning_rate": 4.4553575124951065e-07, "loss": 0.7659, "step": 6533 }, { "epoch": 0.91, "learning_rate": 4.442087977311749e-07, "loss": 0.7991, "step": 6534 }, { "epoch": 0.91, "learning_rate": 4.42883778327895e-07, "loss": 0.8547, "step": 6535 }, { "epoch": 0.91, "learning_rate": 4.4156069330785647e-07, "loss": 0.7533, "step": 6536 }, { "epoch": 0.91, "learning_rate": 4.402395429388584e-07, "loss": 0.7427, "step": 6537 }, { "epoch": 0.91, "learning_rate": 4.389203274883014e-07, "loss": 0.7246, "step": 6538 }, { "epoch": 0.91, "learning_rate": 4.376030472232018e-07, "loss": 0.7368, "step": 6539 }, { "epoch": 0.91, "learning_rate": 4.3628770241017637e-07, "loss": 0.7974, "step": 6540 }, { "epoch": 0.91, "learning_rate": 4.349742933154544e-07, "loss": 0.8459, "step": 6541 }, { "epoch": 0.91, "learning_rate": 4.336628202048765e-07, "loss": 0.734, "step": 6542 }, { "epoch": 0.91, "learning_rate": 4.323532833438837e-07, "loss": 0.7812, "step": 6543 }, { "epoch": 0.91, "learning_rate": 4.310456829975318e-07, "loss": 0.7515, "step": 6544 }, { "epoch": 0.91, "learning_rate": 4.297400194304835e-07, "loss": 0.7537, "step": 6545 }, { "epoch": 0.91, "learning_rate": 4.284362929070041e-07, "loss": 0.7573, "step": 6546 }, { "epoch": 0.91, "learning_rate": 4.2713450369097466e-07, "loss": 0.7837, "step": 6547 }, { "epoch": 0.91, "learning_rate": 4.2583465204587783e-07, "loss": 0.8027, "step": 6548 }, { "epoch": 0.91, "learning_rate": 4.245367382348098e-07, "loss": 0.8308, "step": 6549 }, { "epoch": 0.91, "learning_rate": 4.2324076252046933e-07, "loss": 0.7524, "step": 6550 }, { "epoch": 0.91, "learning_rate": 4.2194672516516435e-07, "loss": 0.8262, "step": 6551 }, { "epoch": 0.91, "learning_rate": 4.2065462643081424e-07, "loss": 0.5345, "step": 6552 }, { "epoch": 0.91, "learning_rate": 4.193644665789387e-07, "loss": 0.781, "step": 6553 }, { "epoch": 0.91, "learning_rate": 4.180762458706722e-07, "loss": 0.7859, "step": 6554 }, { "epoch": 0.91, "learning_rate": 4.167899645667528e-07, "loss": 0.791, "step": 6555 }, { "epoch": 0.91, "learning_rate": 4.1550562292752563e-07, "loss": 0.8201, "step": 6556 }, { "epoch": 0.91, "learning_rate": 4.142232212129471e-07, "loss": 0.7993, "step": 6557 }, { "epoch": 0.91, "learning_rate": 4.1294275968257636e-07, "loss": 0.8137, "step": 6558 }, { "epoch": 0.91, "learning_rate": 4.116642385955838e-07, "loss": 0.8474, "step": 6559 }, { "epoch": 0.91, "learning_rate": 4.1038765821074353e-07, "loss": 0.7847, "step": 6560 }, { "epoch": 0.91, "learning_rate": 4.0911301878643783e-07, "loss": 0.7979, "step": 6561 }, { "epoch": 0.91, "learning_rate": 4.0784032058065916e-07, "loss": 0.5411, "step": 6562 }, { "epoch": 0.91, "learning_rate": 4.065695638510014e-07, "loss": 0.8538, "step": 6563 }, { "epoch": 0.91, "learning_rate": 4.053007488546734e-07, "loss": 0.8291, "step": 6564 }, { "epoch": 0.91, "learning_rate": 4.04033875848483e-07, "loss": 0.8, "step": 6565 }, { "epoch": 0.91, "learning_rate": 4.0276894508884723e-07, "loss": 0.8308, "step": 6566 }, { "epoch": 0.91, "learning_rate": 4.015059568317947e-07, "loss": 0.7457, "step": 6567 }, { "epoch": 0.91, "learning_rate": 4.0024491133295427e-07, "loss": 0.8296, "step": 6568 }, { "epoch": 0.91, "learning_rate": 3.989858088475673e-07, "loss": 0.8501, "step": 6569 }, { "epoch": 0.91, "learning_rate": 3.9772864963047666e-07, "loss": 0.8259, "step": 6570 }, { "epoch": 0.91, "learning_rate": 3.964734339361354e-07, "loss": 0.7991, "step": 6571 }, { "epoch": 0.91, "learning_rate": 3.9522016201860245e-07, "loss": 0.618, "step": 6572 }, { "epoch": 0.91, "learning_rate": 3.9396883413154176e-07, "loss": 0.7382, "step": 6573 }, { "epoch": 0.91, "learning_rate": 3.927194505282272e-07, "loss": 0.7981, "step": 6574 }, { "epoch": 0.91, "learning_rate": 3.914720114615356e-07, "loss": 0.8059, "step": 6575 }, { "epoch": 0.91, "learning_rate": 3.9022651718395145e-07, "loss": 0.5801, "step": 6576 }, { "epoch": 0.91, "learning_rate": 3.889829679475676e-07, "loss": 0.7454, "step": 6577 }, { "epoch": 0.91, "learning_rate": 3.8774136400407833e-07, "loss": 0.8557, "step": 6578 }, { "epoch": 0.91, "learning_rate": 3.865017056047904e-07, "loss": 0.5574, "step": 6579 }, { "epoch": 0.91, "learning_rate": 3.852639930006119e-07, "loss": 0.7959, "step": 6580 }, { "epoch": 0.91, "learning_rate": 3.840282264420581e-07, "loss": 0.7979, "step": 6581 }, { "epoch": 0.91, "learning_rate": 3.8279440617925324e-07, "loss": 0.5905, "step": 6582 }, { "epoch": 0.91, "learning_rate": 3.8156253246192323e-07, "loss": 0.5657, "step": 6583 }, { "epoch": 0.91, "learning_rate": 3.8033260553940407e-07, "loss": 0.856, "step": 6584 }, { "epoch": 0.91, "learning_rate": 3.791046256606368e-07, "loss": 0.8334, "step": 6585 }, { "epoch": 0.91, "learning_rate": 3.7787859307416353e-07, "loss": 0.8157, "step": 6586 }, { "epoch": 0.91, "learning_rate": 3.766545080281403e-07, "loss": 0.7971, "step": 6587 }, { "epoch": 0.92, "learning_rate": 3.7543237077032224e-07, "loss": 0.7681, "step": 6588 }, { "epoch": 0.92, "learning_rate": 3.742121815480748e-07, "loss": 0.8147, "step": 6589 }, { "epoch": 0.92, "learning_rate": 3.72993940608366e-07, "loss": 0.7952, "step": 6590 }, { "epoch": 0.92, "learning_rate": 3.7177764819776975e-07, "loss": 0.7676, "step": 6591 }, { "epoch": 0.92, "learning_rate": 3.70563304562469e-07, "loss": 0.7374, "step": 6592 }, { "epoch": 0.92, "learning_rate": 3.693509099482473e-07, "loss": 0.7288, "step": 6593 }, { "epoch": 0.92, "learning_rate": 3.6814046460049935e-07, "loss": 0.8059, "step": 6594 }, { "epoch": 0.92, "learning_rate": 3.6693196876422035e-07, "loss": 0.7716, "step": 6595 }, { "epoch": 0.92, "learning_rate": 3.6572542268401124e-07, "loss": 0.8027, "step": 6596 }, { "epoch": 0.92, "learning_rate": 3.6452082660408226e-07, "loss": 0.8345, "step": 6597 }, { "epoch": 0.92, "learning_rate": 3.6331818076824397e-07, "loss": 0.843, "step": 6598 }, { "epoch": 0.92, "learning_rate": 3.6211748541991944e-07, "loss": 0.7483, "step": 6599 }, { "epoch": 0.92, "learning_rate": 3.609187408021275e-07, "loss": 0.7729, "step": 6600 }, { "epoch": 0.92, "learning_rate": 3.5972194715749865e-07, "loss": 0.749, "step": 6601 }, { "epoch": 0.92, "learning_rate": 3.585271047282679e-07, "loss": 0.8596, "step": 6602 }, { "epoch": 0.92, "learning_rate": 3.5733421375627074e-07, "loss": 0.8392, "step": 6603 }, { "epoch": 0.92, "learning_rate": 3.5614327448295625e-07, "loss": 0.8374, "step": 6604 }, { "epoch": 0.92, "learning_rate": 3.5495428714937053e-07, "loss": 0.8279, "step": 6605 }, { "epoch": 0.92, "learning_rate": 3.5376725199616655e-07, "loss": 0.8125, "step": 6606 }, { "epoch": 0.92, "learning_rate": 3.5258216926360447e-07, "loss": 0.5635, "step": 6607 }, { "epoch": 0.92, "learning_rate": 3.513990391915478e-07, "loss": 0.8022, "step": 6608 }, { "epoch": 0.92, "learning_rate": 3.502178620194652e-07, "loss": 0.8384, "step": 6609 }, { "epoch": 0.92, "learning_rate": 3.490386379864297e-07, "loss": 0.785, "step": 6610 }, { "epoch": 0.92, "learning_rate": 3.4786136733111707e-07, "loss": 0.7363, "step": 6611 }, { "epoch": 0.92, "learning_rate": 3.4668605029181233e-07, "loss": 0.7568, "step": 6612 }, { "epoch": 0.92, "learning_rate": 3.455126871064007e-07, "loss": 0.7759, "step": 6613 }, { "epoch": 0.92, "learning_rate": 3.443412780123756e-07, "loss": 0.8523, "step": 6614 }, { "epoch": 0.92, "learning_rate": 3.431718232468317e-07, "loss": 0.7183, "step": 6615 }, { "epoch": 0.92, "learning_rate": 3.4200432304646757e-07, "loss": 0.8215, "step": 6616 }, { "epoch": 0.92, "learning_rate": 3.40838777647593e-07, "loss": 0.8113, "step": 6617 }, { "epoch": 0.92, "learning_rate": 3.396751872861126e-07, "loss": 0.8015, "step": 6618 }, { "epoch": 0.92, "learning_rate": 3.3851355219754243e-07, "loss": 0.7993, "step": 6619 }, { "epoch": 0.92, "learning_rate": 3.373538726169989e-07, "loss": 0.5846, "step": 6620 }, { "epoch": 0.92, "learning_rate": 3.3619614877920425e-07, "loss": 0.7615, "step": 6621 }, { "epoch": 0.92, "learning_rate": 3.350403809184843e-07, "loss": 0.8762, "step": 6622 }, { "epoch": 0.92, "learning_rate": 3.3388656926876983e-07, "loss": 0.7781, "step": 6623 }, { "epoch": 0.92, "learning_rate": 3.327347140635961e-07, "loss": 0.7639, "step": 6624 }, { "epoch": 0.92, "learning_rate": 3.31584815536099e-07, "loss": 0.8271, "step": 6625 }, { "epoch": 0.92, "learning_rate": 3.3043687391902225e-07, "loss": 0.813, "step": 6626 }, { "epoch": 0.92, "learning_rate": 3.292908894447111e-07, "loss": 0.741, "step": 6627 }, { "epoch": 0.92, "learning_rate": 3.281468623451156e-07, "loss": 0.7405, "step": 6628 }, { "epoch": 0.92, "learning_rate": 3.2700479285179165e-07, "loss": 0.7367, "step": 6629 }, { "epoch": 0.92, "learning_rate": 3.2586468119589545e-07, "loss": 0.5553, "step": 6630 }, { "epoch": 0.92, "learning_rate": 3.247265276081868e-07, "loss": 0.856, "step": 6631 }, { "epoch": 0.92, "learning_rate": 3.2359033231903257e-07, "loss": 0.7229, "step": 6632 }, { "epoch": 0.92, "learning_rate": 3.2245609555839997e-07, "loss": 0.8435, "step": 6633 }, { "epoch": 0.92, "learning_rate": 3.2132381755586415e-07, "loss": 0.8982, "step": 6634 }, { "epoch": 0.92, "learning_rate": 3.2019349854059744e-07, "loss": 0.7454, "step": 6635 }, { "epoch": 0.92, "learning_rate": 3.190651387413801e-07, "loss": 0.5814, "step": 6636 }, { "epoch": 0.92, "learning_rate": 3.179387383865973e-07, "loss": 0.792, "step": 6637 }, { "epoch": 0.92, "learning_rate": 3.16814297704231e-07, "loss": 0.5475, "step": 6638 }, { "epoch": 0.92, "learning_rate": 3.156918169218748e-07, "loss": 0.7766, "step": 6639 }, { "epoch": 0.92, "learning_rate": 3.145712962667191e-07, "loss": 0.5472, "step": 6640 }, { "epoch": 0.92, "learning_rate": 3.1345273596556034e-07, "loss": 0.7285, "step": 6641 }, { "epoch": 0.92, "learning_rate": 3.123361362447985e-07, "loss": 0.8894, "step": 6642 }, { "epoch": 0.92, "learning_rate": 3.1122149733043394e-07, "loss": 0.7644, "step": 6643 }, { "epoch": 0.92, "learning_rate": 3.1010881944807505e-07, "loss": 0.5924, "step": 6644 }, { "epoch": 0.92, "learning_rate": 3.0899810282292943e-07, "loss": 0.843, "step": 6645 }, { "epoch": 0.92, "learning_rate": 3.0788934767980726e-07, "loss": 0.7815, "step": 6646 }, { "epoch": 0.92, "learning_rate": 3.0678255424312577e-07, "loss": 0.584, "step": 6647 }, { "epoch": 0.92, "learning_rate": 3.056777227369012e-07, "loss": 0.8118, "step": 6648 }, { "epoch": 0.92, "learning_rate": 3.0457485338475477e-07, "loss": 0.7056, "step": 6649 }, { "epoch": 0.92, "learning_rate": 3.03473946409909e-07, "loss": 0.7734, "step": 6650 }, { "epoch": 0.92, "learning_rate": 3.023750020351901e-07, "loss": 0.7952, "step": 6651 }, { "epoch": 0.92, "learning_rate": 3.012780204830279e-07, "loss": 0.7998, "step": 6652 }, { "epoch": 0.92, "learning_rate": 3.001830019754537e-07, "loss": 0.7159, "step": 6653 }, { "epoch": 0.92, "learning_rate": 2.990899467341024e-07, "loss": 0.7991, "step": 6654 }, { "epoch": 0.92, "learning_rate": 2.979988549802104e-07, "loss": 0.814, "step": 6655 }, { "epoch": 0.92, "learning_rate": 2.969097269346155e-07, "loss": 0.7961, "step": 6656 }, { "epoch": 0.92, "learning_rate": 2.9582256281776355e-07, "loss": 0.7688, "step": 6657 }, { "epoch": 0.92, "learning_rate": 2.9473736284969635e-07, "loss": 0.8196, "step": 6658 }, { "epoch": 0.92, "learning_rate": 2.936541272500637e-07, "loss": 0.8101, "step": 6659 }, { "epoch": 0.93, "learning_rate": 2.925728562381114e-07, "loss": 0.7787, "step": 6660 }, { "epoch": 0.93, "learning_rate": 2.914935500326932e-07, "loss": 0.8175, "step": 6661 }, { "epoch": 0.93, "learning_rate": 2.904162088522644e-07, "loss": 0.8433, "step": 6662 }, { "epoch": 0.93, "learning_rate": 2.8934083291487946e-07, "loss": 0.8013, "step": 6663 }, { "epoch": 0.93, "learning_rate": 2.882674224381987e-07, "loss": 0.8044, "step": 6664 }, { "epoch": 0.93, "learning_rate": 2.871959776394828e-07, "loss": 0.54, "step": 6665 }, { "epoch": 0.93, "learning_rate": 2.861264987355916e-07, "loss": 0.8301, "step": 6666 }, { "epoch": 0.93, "learning_rate": 2.850589859429953e-07, "loss": 0.8367, "step": 6667 }, { "epoch": 0.93, "learning_rate": 2.8399343947775657e-07, "loss": 0.8491, "step": 6668 }, { "epoch": 0.93, "learning_rate": 2.8292985955554744e-07, "loss": 0.7461, "step": 6669 }, { "epoch": 0.93, "learning_rate": 2.8186824639163777e-07, "loss": 0.8071, "step": 6670 }, { "epoch": 0.93, "learning_rate": 2.808086002009014e-07, "loss": 0.8284, "step": 6671 }, { "epoch": 0.93, "learning_rate": 2.797509211978122e-07, "loss": 0.7749, "step": 6672 }, { "epoch": 0.93, "learning_rate": 2.786952095964479e-07, "loss": 0.8455, "step": 6673 }, { "epoch": 0.93, "learning_rate": 2.7764146561048646e-07, "loss": 0.7727, "step": 6674 }, { "epoch": 0.93, "learning_rate": 2.765896894532083e-07, "loss": 0.783, "step": 6675 }, { "epoch": 0.93, "learning_rate": 2.7553988133749544e-07, "loss": 0.8411, "step": 6676 }, { "epoch": 0.93, "learning_rate": 2.744920414758323e-07, "loss": 0.7324, "step": 6677 }, { "epoch": 0.93, "learning_rate": 2.734461700803026e-07, "loss": 0.8301, "step": 6678 }, { "epoch": 0.93, "learning_rate": 2.724022673625959e-07, "loss": 0.8389, "step": 6679 }, { "epoch": 0.93, "learning_rate": 2.7136033353399647e-07, "loss": 0.76, "step": 6680 }, { "epoch": 0.93, "learning_rate": 2.703203688053979e-07, "loss": 0.803, "step": 6681 }, { "epoch": 0.93, "learning_rate": 2.692823733872907e-07, "loss": 0.8164, "step": 6682 }, { "epoch": 0.93, "learning_rate": 2.6824634748976675e-07, "loss": 0.8149, "step": 6683 }, { "epoch": 0.93, "learning_rate": 2.672122913225206e-07, "loss": 0.5682, "step": 6684 }, { "epoch": 0.93, "learning_rate": 2.66180205094847e-07, "loss": 0.8301, "step": 6685 }, { "epoch": 0.93, "learning_rate": 2.6515008901564445e-07, "loss": 0.8359, "step": 6686 }, { "epoch": 0.93, "learning_rate": 2.641219432934106e-07, "loss": 0.7209, "step": 6687 }, { "epoch": 0.93, "learning_rate": 2.6309576813624114e-07, "loss": 0.7932, "step": 6688 }, { "epoch": 0.93, "learning_rate": 2.620715637518412e-07, "loss": 0.5855, "step": 6689 }, { "epoch": 0.93, "learning_rate": 2.610493303475092e-07, "loss": 0.731, "step": 6690 }, { "epoch": 0.93, "learning_rate": 2.6002906813014983e-07, "loss": 0.7808, "step": 6691 }, { "epoch": 0.93, "learning_rate": 2.5901077730626446e-07, "loss": 0.6808, "step": 6692 }, { "epoch": 0.93, "learning_rate": 2.5799445808195824e-07, "loss": 0.7803, "step": 6693 }, { "epoch": 0.93, "learning_rate": 2.569801106629377e-07, "loss": 0.6158, "step": 6694 }, { "epoch": 0.93, "learning_rate": 2.559677352545065e-07, "loss": 0.7538, "step": 6695 }, { "epoch": 0.93, "learning_rate": 2.5495733206157613e-07, "loss": 0.887, "step": 6696 }, { "epoch": 0.93, "learning_rate": 2.539489012886509e-07, "loss": 0.8445, "step": 6697 }, { "epoch": 0.93, "learning_rate": 2.5294244313984086e-07, "loss": 0.8271, "step": 6698 }, { "epoch": 0.93, "learning_rate": 2.519379578188552e-07, "loss": 0.7833, "step": 6699 }, { "epoch": 0.93, "learning_rate": 2.5093544552900473e-07, "loss": 0.8333, "step": 6700 }, { "epoch": 0.93, "learning_rate": 2.499349064732004e-07, "loss": 0.8191, "step": 6701 }, { "epoch": 0.93, "learning_rate": 2.489363408539547e-07, "loss": 0.7786, "step": 6702 }, { "epoch": 0.93, "learning_rate": 2.479397488733759e-07, "loss": 0.8032, "step": 6703 }, { "epoch": 0.93, "learning_rate": 2.469451307331816e-07, "loss": 0.8845, "step": 6704 }, { "epoch": 0.93, "learning_rate": 2.4595248663468075e-07, "loss": 0.7981, "step": 6705 }, { "epoch": 0.93, "learning_rate": 2.4496181677878926e-07, "loss": 0.8137, "step": 6706 }, { "epoch": 0.93, "learning_rate": 2.439731213660212e-07, "loss": 0.8469, "step": 6707 }, { "epoch": 0.93, "learning_rate": 2.429864005964888e-07, "loss": 0.6119, "step": 6708 }, { "epoch": 0.93, "learning_rate": 2.4200165466990887e-07, "loss": 0.8057, "step": 6709 }, { "epoch": 0.93, "learning_rate": 2.4101888378559537e-07, "loss": 0.7925, "step": 6710 }, { "epoch": 0.93, "learning_rate": 2.4003808814246355e-07, "loss": 0.7957, "step": 6711 }, { "epoch": 0.93, "learning_rate": 2.390592679390291e-07, "loss": 0.8496, "step": 6712 }, { "epoch": 0.93, "learning_rate": 2.3808242337340693e-07, "loss": 0.8218, "step": 6713 }, { "epoch": 0.93, "learning_rate": 2.3710755464331324e-07, "loss": 0.6263, "step": 6714 }, { "epoch": 0.93, "learning_rate": 2.361346619460636e-07, "loss": 0.553, "step": 6715 }, { "epoch": 0.93, "learning_rate": 2.351637454785749e-07, "loss": 0.7822, "step": 6716 }, { "epoch": 0.93, "learning_rate": 2.3419480543736106e-07, "loss": 0.7556, "step": 6717 }, { "epoch": 0.93, "learning_rate": 2.3322784201853855e-07, "loss": 0.8406, "step": 6718 }, { "epoch": 0.93, "learning_rate": 2.3226285541782523e-07, "loss": 0.7999, "step": 6719 }, { "epoch": 0.93, "learning_rate": 2.3129984583053267e-07, "loss": 0.7883, "step": 6720 }, { "epoch": 0.93, "learning_rate": 2.3033881345157938e-07, "loss": 0.7749, "step": 6721 }, { "epoch": 0.93, "learning_rate": 2.2937975847547978e-07, "loss": 0.8447, "step": 6722 }, { "epoch": 0.93, "learning_rate": 2.2842268109634858e-07, "loss": 0.8398, "step": 6723 }, { "epoch": 0.93, "learning_rate": 2.2746758150790083e-07, "loss": 0.803, "step": 6724 }, { "epoch": 0.93, "learning_rate": 2.2651445990345078e-07, "loss": 0.7643, "step": 6725 }, { "epoch": 0.93, "learning_rate": 2.25563316475913e-07, "loss": 0.7727, "step": 6726 }, { "epoch": 0.93, "learning_rate": 2.246141514178013e-07, "loss": 0.8198, "step": 6727 }, { "epoch": 0.93, "learning_rate": 2.2366696492122752e-07, "loss": 0.7739, "step": 6728 }, { "epoch": 0.93, "learning_rate": 2.227217571779061e-07, "loss": 0.718, "step": 6729 }, { "epoch": 0.93, "learning_rate": 2.217785283791485e-07, "loss": 0.7638, "step": 6730 }, { "epoch": 0.93, "learning_rate": 2.2083727871586636e-07, "loss": 0.7771, "step": 6731 }, { "epoch": 0.94, "learning_rate": 2.1989800837857288e-07, "loss": 0.8455, "step": 6732 }, { "epoch": 0.94, "learning_rate": 2.1896071755737492e-07, "loss": 0.8291, "step": 6733 }, { "epoch": 0.94, "learning_rate": 2.1802540644198622e-07, "loss": 0.8452, "step": 6734 }, { "epoch": 0.94, "learning_rate": 2.1709207522171204e-07, "loss": 0.515, "step": 6735 }, { "epoch": 0.94, "learning_rate": 2.1616072408546573e-07, "loss": 0.7822, "step": 6736 }, { "epoch": 0.94, "learning_rate": 2.1523135322175094e-07, "loss": 0.8599, "step": 6737 }, { "epoch": 0.94, "learning_rate": 2.1430396281867604e-07, "loss": 0.7891, "step": 6738 }, { "epoch": 0.94, "learning_rate": 2.1337855306394761e-07, "loss": 0.8762, "step": 6739 }, { "epoch": 0.94, "learning_rate": 2.1245512414486802e-07, "loss": 0.7444, "step": 6740 }, { "epoch": 0.94, "learning_rate": 2.1153367624834665e-07, "loss": 0.8523, "step": 6741 }, { "epoch": 0.94, "learning_rate": 2.1061420956088208e-07, "loss": 0.863, "step": 6742 }, { "epoch": 0.94, "learning_rate": 2.096967242685777e-07, "loss": 0.7292, "step": 6743 }, { "epoch": 0.94, "learning_rate": 2.087812205571371e-07, "loss": 0.8191, "step": 6744 }, { "epoch": 0.94, "learning_rate": 2.0786769861185664e-07, "loss": 0.8101, "step": 6745 }, { "epoch": 0.94, "learning_rate": 2.069561586176394e-07, "loss": 0.8191, "step": 6746 }, { "epoch": 0.94, "learning_rate": 2.0604660075898008e-07, "loss": 0.7614, "step": 6747 }, { "epoch": 0.94, "learning_rate": 2.0513902521997587e-07, "loss": 0.5812, "step": 6748 }, { "epoch": 0.94, "learning_rate": 2.0423343218432422e-07, "loss": 0.8376, "step": 6749 }, { "epoch": 0.94, "learning_rate": 2.0332982183531636e-07, "loss": 0.8167, "step": 6750 }, { "epoch": 0.94, "learning_rate": 2.0242819435584816e-07, "loss": 0.8259, "step": 6751 }, { "epoch": 0.94, "learning_rate": 2.015285499284092e-07, "loss": 0.8672, "step": 6752 }, { "epoch": 0.94, "learning_rate": 2.006308887350905e-07, "loss": 0.8335, "step": 6753 }, { "epoch": 0.94, "learning_rate": 1.997352109575812e-07, "loss": 0.8071, "step": 6754 }, { "epoch": 0.94, "learning_rate": 1.9884151677716622e-07, "loss": 0.77, "step": 6755 }, { "epoch": 0.94, "learning_rate": 1.9794980637473538e-07, "loss": 0.813, "step": 6756 }, { "epoch": 0.94, "learning_rate": 1.9706007993076982e-07, "loss": 0.8108, "step": 6757 }, { "epoch": 0.94, "learning_rate": 1.9617233762535325e-07, "loss": 0.8201, "step": 6758 }, { "epoch": 0.94, "learning_rate": 1.9528657963816754e-07, "loss": 0.6197, "step": 6759 }, { "epoch": 0.94, "learning_rate": 1.944028061484904e-07, "loss": 0.7971, "step": 6760 }, { "epoch": 0.94, "learning_rate": 1.93521017335202e-07, "loss": 0.8271, "step": 6761 }, { "epoch": 0.94, "learning_rate": 1.9264121337677742e-07, "loss": 0.7971, "step": 6762 }, { "epoch": 0.94, "learning_rate": 1.917633944512909e-07, "loss": 0.8274, "step": 6763 }, { "epoch": 0.94, "learning_rate": 1.908875607364158e-07, "loss": 0.8162, "step": 6764 }, { "epoch": 0.94, "learning_rate": 1.9001371240942146e-07, "loss": 0.7207, "step": 6765 }, { "epoch": 0.94, "learning_rate": 1.8914184964717864e-07, "loss": 0.5861, "step": 6766 }, { "epoch": 0.94, "learning_rate": 1.8827197262615392e-07, "loss": 0.7756, "step": 6767 }, { "epoch": 0.94, "learning_rate": 1.8740408152241096e-07, "loss": 0.8318, "step": 6768 }, { "epoch": 0.94, "learning_rate": 1.8653817651161587e-07, "loss": 0.8291, "step": 6769 }, { "epoch": 0.94, "learning_rate": 1.8567425776902736e-07, "loss": 0.8135, "step": 6770 }, { "epoch": 0.94, "learning_rate": 1.8481232546950667e-07, "loss": 0.7925, "step": 6771 }, { "epoch": 0.94, "learning_rate": 1.839523797875098e-07, "loss": 0.8201, "step": 6772 }, { "epoch": 0.94, "learning_rate": 1.8309442089709085e-07, "loss": 0.8337, "step": 6773 }, { "epoch": 0.94, "learning_rate": 1.8223844897190424e-07, "loss": 0.7961, "step": 6774 }, { "epoch": 0.94, "learning_rate": 1.8138446418520028e-07, "loss": 0.7466, "step": 6775 }, { "epoch": 0.94, "learning_rate": 1.805324667098285e-07, "loss": 0.7935, "step": 6776 }, { "epoch": 0.94, "learning_rate": 1.7968245671823425e-07, "loss": 0.7224, "step": 6777 }, { "epoch": 0.94, "learning_rate": 1.7883443438246106e-07, "loss": 0.8108, "step": 6778 }, { "epoch": 0.94, "learning_rate": 1.7798839987415162e-07, "loss": 0.8621, "step": 6779 }, { "epoch": 0.94, "learning_rate": 1.771443533645445e-07, "loss": 0.8013, "step": 6780 }, { "epoch": 0.94, "learning_rate": 1.763022950244786e-07, "loss": 0.7607, "step": 6781 }, { "epoch": 0.94, "learning_rate": 1.7546222502438648e-07, "loss": 0.7472, "step": 6782 }, { "epoch": 0.94, "learning_rate": 1.7462414353429992e-07, "loss": 0.7871, "step": 6783 }, { "epoch": 0.94, "learning_rate": 1.7378805072385209e-07, "loss": 0.8325, "step": 6784 }, { "epoch": 0.94, "learning_rate": 1.729539467622654e-07, "loss": 0.7928, "step": 6785 }, { "epoch": 0.94, "learning_rate": 1.7212183181836928e-07, "loss": 0.7954, "step": 6786 }, { "epoch": 0.94, "learning_rate": 1.7129170606058121e-07, "loss": 0.7404, "step": 6787 }, { "epoch": 0.94, "learning_rate": 1.7046356965692456e-07, "loss": 0.7869, "step": 6788 }, { "epoch": 0.94, "learning_rate": 1.6963742277501415e-07, "loss": 0.8679, "step": 6789 }, { "epoch": 0.94, "learning_rate": 1.6881326558206402e-07, "loss": 0.7959, "step": 6790 }, { "epoch": 0.94, "learning_rate": 1.6799109824488736e-07, "loss": 0.7693, "step": 6791 }, { "epoch": 0.94, "learning_rate": 1.6717092092988885e-07, "loss": 0.8516, "step": 6792 }, { "epoch": 0.94, "learning_rate": 1.6635273380307905e-07, "loss": 0.8171, "step": 6793 }, { "epoch": 0.94, "learning_rate": 1.655365370300588e-07, "loss": 0.8096, "step": 6794 }, { "epoch": 0.94, "learning_rate": 1.6472233077602707e-07, "loss": 0.8313, "step": 6795 }, { "epoch": 0.94, "learning_rate": 1.6391011520578314e-07, "loss": 0.7515, "step": 6796 }, { "epoch": 0.94, "learning_rate": 1.6309989048372e-07, "loss": 0.7729, "step": 6797 }, { "epoch": 0.94, "learning_rate": 1.6229165677383086e-07, "loss": 0.7861, "step": 6798 }, { "epoch": 0.94, "learning_rate": 1.6148541423970266e-07, "loss": 0.7876, "step": 6799 }, { "epoch": 0.94, "learning_rate": 1.606811630445204e-07, "loss": 0.7598, "step": 6800 }, { "epoch": 0.94, "learning_rate": 1.5987890335106725e-07, "loss": 0.7604, "step": 6801 }, { "epoch": 0.94, "learning_rate": 1.590786353217233e-07, "loss": 0.7988, "step": 6802 }, { "epoch": 0.94, "learning_rate": 1.582803591184634e-07, "loss": 0.7915, "step": 6803 }, { "epoch": 0.95, "learning_rate": 1.5748407490286167e-07, "loss": 0.8123, "step": 6804 }, { "epoch": 0.95, "learning_rate": 1.5668978283608694e-07, "loss": 0.7495, "step": 6805 }, { "epoch": 0.95, "learning_rate": 1.5589748307890616e-07, "loss": 0.7715, "step": 6806 }, { "epoch": 0.95, "learning_rate": 1.5510717579168333e-07, "loss": 0.8254, "step": 6807 }, { "epoch": 0.95, "learning_rate": 1.543188611343771e-07, "loss": 0.7791, "step": 6808 }, { "epoch": 0.95, "learning_rate": 1.5353253926654655e-07, "loss": 0.8003, "step": 6809 }, { "epoch": 0.95, "learning_rate": 1.5274821034734212e-07, "loss": 0.8511, "step": 6810 }, { "epoch": 0.95, "learning_rate": 1.519658745355168e-07, "loss": 0.7812, "step": 6811 }, { "epoch": 0.95, "learning_rate": 1.511855319894151e-07, "loss": 0.7876, "step": 6812 }, { "epoch": 0.95, "learning_rate": 1.5040718286698063e-07, "loss": 0.7034, "step": 6813 }, { "epoch": 0.95, "learning_rate": 1.4963082732575517e-07, "loss": 0.7385, "step": 6814 }, { "epoch": 0.95, "learning_rate": 1.488564655228708e-07, "loss": 0.7412, "step": 6815 }, { "epoch": 0.95, "learning_rate": 1.4808409761506437e-07, "loss": 0.7367, "step": 6816 }, { "epoch": 0.95, "learning_rate": 1.4731372375866305e-07, "loss": 0.7567, "step": 6817 }, { "epoch": 0.95, "learning_rate": 1.465453441095932e-07, "loss": 0.7854, "step": 6818 }, { "epoch": 0.95, "learning_rate": 1.457789588233749e-07, "loss": 0.845, "step": 6819 }, { "epoch": 0.95, "learning_rate": 1.4501456805512848e-07, "loss": 0.8191, "step": 6820 }, { "epoch": 0.95, "learning_rate": 1.4425217195956686e-07, "loss": 0.7654, "step": 6821 }, { "epoch": 0.95, "learning_rate": 1.4349177069100218e-07, "loss": 0.8457, "step": 6822 }, { "epoch": 0.95, "learning_rate": 1.4273336440334018e-07, "loss": 0.8689, "step": 6823 }, { "epoch": 0.95, "learning_rate": 1.4197695325008586e-07, "loss": 0.8257, "step": 6824 }, { "epoch": 0.95, "learning_rate": 1.412225373843368e-07, "loss": 0.8101, "step": 6825 }, { "epoch": 0.95, "learning_rate": 1.4047011695878964e-07, "loss": 0.8645, "step": 6826 }, { "epoch": 0.95, "learning_rate": 1.3971969212573487e-07, "loss": 0.6364, "step": 6827 }, { "epoch": 0.95, "learning_rate": 1.389712630370621e-07, "loss": 0.8577, "step": 6828 }, { "epoch": 0.95, "learning_rate": 1.3822482984425457e-07, "loss": 0.8464, "step": 6829 }, { "epoch": 0.95, "learning_rate": 1.3748039269839032e-07, "loss": 0.8184, "step": 6830 }, { "epoch": 0.95, "learning_rate": 1.3673795175014881e-07, "loss": 0.7568, "step": 6831 }, { "epoch": 0.95, "learning_rate": 1.3599750714979765e-07, "loss": 0.7949, "step": 6832 }, { "epoch": 0.95, "learning_rate": 1.3525905904720804e-07, "loss": 0.5999, "step": 6833 }, { "epoch": 0.95, "learning_rate": 1.3452260759184267e-07, "loss": 0.7922, "step": 6834 }, { "epoch": 0.95, "learning_rate": 1.3378815293276004e-07, "loss": 0.8242, "step": 6835 }, { "epoch": 0.95, "learning_rate": 1.3305569521861682e-07, "loss": 0.7975, "step": 6836 }, { "epoch": 0.95, "learning_rate": 1.3232523459766334e-07, "loss": 0.7937, "step": 6837 }, { "epoch": 0.95, "learning_rate": 1.3159677121774684e-07, "loss": 0.7559, "step": 6838 }, { "epoch": 0.95, "learning_rate": 1.308703052263105e-07, "loss": 0.7703, "step": 6839 }, { "epoch": 0.95, "learning_rate": 1.3014583677039118e-07, "loss": 0.8376, "step": 6840 }, { "epoch": 0.95, "learning_rate": 1.2942336599662596e-07, "loss": 0.8092, "step": 6841 }, { "epoch": 0.95, "learning_rate": 1.2870289305124128e-07, "loss": 0.77, "step": 6842 }, { "epoch": 0.95, "learning_rate": 1.27984418080066e-07, "loss": 0.8167, "step": 6843 }, { "epoch": 0.95, "learning_rate": 1.2726794122851826e-07, "loss": 0.801, "step": 6844 }, { "epoch": 0.95, "learning_rate": 1.2655346264161538e-07, "loss": 0.7637, "step": 6845 }, { "epoch": 0.95, "learning_rate": 1.258409824639717e-07, "loss": 0.8882, "step": 6846 }, { "epoch": 0.95, "learning_rate": 1.2513050083979184e-07, "loss": 0.7832, "step": 6847 }, { "epoch": 0.95, "learning_rate": 1.2442201791288077e-07, "loss": 0.7705, "step": 6848 }, { "epoch": 0.95, "learning_rate": 1.2371553382663716e-07, "loss": 0.8562, "step": 6849 }, { "epoch": 0.95, "learning_rate": 1.2301104872405322e-07, "loss": 0.7766, "step": 6850 }, { "epoch": 0.95, "learning_rate": 1.2230856274772163e-07, "loss": 0.8184, "step": 6851 }, { "epoch": 0.95, "learning_rate": 1.2160807603982415e-07, "loss": 0.8014, "step": 6852 }, { "epoch": 0.95, "learning_rate": 1.2090958874214298e-07, "loss": 0.7456, "step": 6853 }, { "epoch": 0.95, "learning_rate": 1.2021310099605387e-07, "loss": 0.8567, "step": 6854 }, { "epoch": 0.95, "learning_rate": 1.1951861294252521e-07, "loss": 0.8037, "step": 6855 }, { "epoch": 0.95, "learning_rate": 1.1882612472212563e-07, "loss": 0.8057, "step": 6856 }, { "epoch": 0.95, "learning_rate": 1.1813563647501414e-07, "loss": 0.8315, "step": 6857 }, { "epoch": 0.95, "learning_rate": 1.1744714834094895e-07, "loss": 0.8098, "step": 6858 }, { "epoch": 0.95, "learning_rate": 1.167606604592808e-07, "loss": 0.804, "step": 6859 }, { "epoch": 0.95, "learning_rate": 1.1607617296895745e-07, "loss": 0.7786, "step": 6860 }, { "epoch": 0.95, "learning_rate": 1.153936860085203e-07, "loss": 0.8101, "step": 6861 }, { "epoch": 0.95, "learning_rate": 1.147131997161044e-07, "loss": 0.7645, "step": 6862 }, { "epoch": 0.95, "learning_rate": 1.1403471422944623e-07, "loss": 0.8235, "step": 6863 }, { "epoch": 0.95, "learning_rate": 1.133582296858693e-07, "loss": 0.594, "step": 6864 }, { "epoch": 0.95, "learning_rate": 1.1268374622229516e-07, "loss": 0.7617, "step": 6865 }, { "epoch": 0.95, "learning_rate": 1.1201126397524464e-07, "loss": 0.8462, "step": 6866 }, { "epoch": 0.95, "learning_rate": 1.1134078308082552e-07, "loss": 0.822, "step": 6867 }, { "epoch": 0.95, "learning_rate": 1.1067230367474813e-07, "loss": 0.8232, "step": 6868 }, { "epoch": 0.95, "learning_rate": 1.1000582589231312e-07, "loss": 0.7673, "step": 6869 }, { "epoch": 0.95, "learning_rate": 1.0934134986841593e-07, "loss": 0.8506, "step": 6870 }, { "epoch": 0.95, "learning_rate": 1.0867887573755009e-07, "loss": 0.7954, "step": 6871 }, { "epoch": 0.95, "learning_rate": 1.0801840363379944e-07, "loss": 0.8242, "step": 6872 }, { "epoch": 0.95, "learning_rate": 1.0735993369084818e-07, "loss": 0.8079, "step": 6873 }, { "epoch": 0.95, "learning_rate": 1.067034660419708e-07, "loss": 0.8005, "step": 6874 }, { "epoch": 0.95, "learning_rate": 1.0604900082003766e-07, "loss": 0.7292, "step": 6875 }, { "epoch": 0.96, "learning_rate": 1.0539653815751393e-07, "loss": 0.7739, "step": 6876 }, { "epoch": 0.96, "learning_rate": 1.0474607818645954e-07, "loss": 0.7937, "step": 6877 }, { "epoch": 0.96, "learning_rate": 1.0409762103853027e-07, "loss": 0.8367, "step": 6878 }, { "epoch": 0.96, "learning_rate": 1.0345116684497558e-07, "loss": 0.7563, "step": 6879 }, { "epoch": 0.96, "learning_rate": 1.0280671573663636e-07, "loss": 0.7732, "step": 6880 }, { "epoch": 0.96, "learning_rate": 1.0216426784395494e-07, "loss": 0.8325, "step": 6881 }, { "epoch": 0.96, "learning_rate": 1.0152382329696175e-07, "loss": 0.8286, "step": 6882 }, { "epoch": 0.96, "learning_rate": 1.0088538222528532e-07, "loss": 0.741, "step": 6883 }, { "epoch": 0.96, "learning_rate": 1.0024894475814783e-07, "loss": 0.7197, "step": 6884 }, { "epoch": 0.96, "learning_rate": 9.961451102436515e-08, "loss": 0.5497, "step": 6885 }, { "epoch": 0.96, "learning_rate": 9.898208115234787e-08, "loss": 0.7798, "step": 6886 }, { "epoch": 0.96, "learning_rate": 9.835165527010138e-08, "loss": 0.8252, "step": 6887 }, { "epoch": 0.96, "learning_rate": 9.772323350522694e-08, "loss": 0.7285, "step": 6888 }, { "epoch": 0.96, "learning_rate": 9.709681598491839e-08, "loss": 0.765, "step": 6889 }, { "epoch": 0.96, "learning_rate": 9.647240283596094e-08, "loss": 0.7791, "step": 6890 }, { "epoch": 0.96, "learning_rate": 9.584999418474128e-08, "loss": 0.8606, "step": 6891 }, { "epoch": 0.96, "learning_rate": 9.52295901572342e-08, "loss": 0.8411, "step": 6892 }, { "epoch": 0.96, "learning_rate": 9.461119087901261e-08, "loss": 0.8694, "step": 6893 }, { "epoch": 0.96, "learning_rate": 9.399479647523968e-08, "loss": 0.8035, "step": 6894 }, { "epoch": 0.96, "learning_rate": 9.338040707067675e-08, "loss": 0.7825, "step": 6895 }, { "epoch": 0.96, "learning_rate": 9.276802278967767e-08, "loss": 0.8413, "step": 6896 }, { "epoch": 0.96, "learning_rate": 9.215764375618885e-08, "loss": 0.855, "step": 6897 }, { "epoch": 0.96, "learning_rate": 9.15492700937548e-08, "loss": 0.7891, "step": 6898 }, { "epoch": 0.96, "learning_rate": 9.094290192551147e-08, "loss": 0.5752, "step": 6899 }, { "epoch": 0.96, "learning_rate": 9.033853937418735e-08, "loss": 0.7524, "step": 6900 }, { "epoch": 0.96, "learning_rate": 8.973618256210903e-08, "loss": 0.853, "step": 6901 }, { "epoch": 0.96, "learning_rate": 8.913583161119344e-08, "loss": 0.8206, "step": 6902 }, { "epoch": 0.96, "learning_rate": 8.853748664295337e-08, "loss": 0.8021, "step": 6903 }, { "epoch": 0.96, "learning_rate": 8.794114777849527e-08, "loss": 0.8091, "step": 6904 }, { "epoch": 0.96, "learning_rate": 8.73468151385215e-08, "loss": 0.8221, "step": 6905 }, { "epoch": 0.96, "learning_rate": 8.67544888433236e-08, "loss": 0.822, "step": 6906 }, { "epoch": 0.96, "learning_rate": 8.616416901279013e-08, "loss": 0.7654, "step": 6907 }, { "epoch": 0.96, "learning_rate": 8.557585576640548e-08, "loss": 0.8728, "step": 6908 }, { "epoch": 0.96, "learning_rate": 8.498954922324332e-08, "loss": 0.8105, "step": 6909 }, { "epoch": 0.96, "learning_rate": 8.440524950197537e-08, "loss": 0.8083, "step": 6910 }, { "epoch": 0.96, "learning_rate": 8.382295672086372e-08, "loss": 0.76, "step": 6911 }, { "epoch": 0.96, "learning_rate": 8.324267099776628e-08, "loss": 0.7798, "step": 6912 }, { "epoch": 0.96, "learning_rate": 8.266439245013469e-08, "loss": 0.7806, "step": 6913 }, { "epoch": 0.96, "learning_rate": 8.20881211950142e-08, "loss": 0.8185, "step": 6914 }, { "epoch": 0.96, "learning_rate": 8.15138573490426e-08, "loss": 0.8054, "step": 6915 }, { "epoch": 0.96, "learning_rate": 8.09416010284525e-08, "loss": 0.5521, "step": 6916 }, { "epoch": 0.96, "learning_rate": 8.037135234907012e-08, "loss": 0.7729, "step": 6917 }, { "epoch": 0.96, "learning_rate": 7.980311142631536e-08, "loss": 0.7915, "step": 6918 }, { "epoch": 0.96, "learning_rate": 7.923687837520066e-08, "loss": 0.8352, "step": 6919 }, { "epoch": 0.96, "learning_rate": 7.867265331033436e-08, "loss": 0.7529, "step": 6920 }, { "epoch": 0.96, "learning_rate": 7.81104363459162e-08, "loss": 0.8203, "step": 6921 }, { "epoch": 0.96, "learning_rate": 7.75502275957396e-08, "loss": 0.792, "step": 6922 }, { "epoch": 0.96, "learning_rate": 7.699202717319276e-08, "loss": 0.7988, "step": 6923 }, { "epoch": 0.96, "learning_rate": 7.643583519125752e-08, "loss": 0.7543, "step": 6924 }, { "epoch": 0.96, "learning_rate": 7.588165176250717e-08, "loss": 0.8367, "step": 6925 }, { "epoch": 0.96, "learning_rate": 7.532947699911197e-08, "loss": 0.8848, "step": 6926 }, { "epoch": 0.96, "learning_rate": 7.47793110128292e-08, "loss": 0.7968, "step": 6927 }, { "epoch": 0.96, "learning_rate": 7.423115391501867e-08, "loss": 0.7866, "step": 6928 }, { "epoch": 0.96, "learning_rate": 7.368500581662607e-08, "loss": 0.8195, "step": 6929 }, { "epoch": 0.96, "learning_rate": 7.314086682819189e-08, "loss": 0.8096, "step": 6930 }, { "epoch": 0.96, "learning_rate": 7.259873705985466e-08, "loss": 0.8206, "step": 6931 }, { "epoch": 0.96, "learning_rate": 7.205861662133884e-08, "loss": 0.5599, "step": 6932 }, { "epoch": 0.96, "learning_rate": 7.152050562196921e-08, "loss": 0.7693, "step": 6933 }, { "epoch": 0.96, "learning_rate": 7.098440417065977e-08, "loss": 0.802, "step": 6934 }, { "epoch": 0.96, "learning_rate": 7.045031237591815e-08, "loss": 0.8433, "step": 6935 }, { "epoch": 0.96, "learning_rate": 6.991823034584677e-08, "loss": 0.8213, "step": 6936 }, { "epoch": 0.96, "learning_rate": 6.938815818813838e-08, "loss": 0.5187, "step": 6937 }, { "epoch": 0.96, "learning_rate": 6.886009601008381e-08, "loss": 0.8223, "step": 6938 }, { "epoch": 0.96, "learning_rate": 6.833404391856203e-08, "loss": 0.8823, "step": 6939 }, { "epoch": 0.96, "learning_rate": 6.781000202004784e-08, "loss": 0.8022, "step": 6940 }, { "epoch": 0.96, "learning_rate": 6.728797042060753e-08, "loss": 0.5157, "step": 6941 }, { "epoch": 0.96, "learning_rate": 6.676794922590324e-08, "loss": 0.8014, "step": 6942 }, { "epoch": 0.96, "learning_rate": 6.624993854118744e-08, "loss": 0.7717, "step": 6943 }, { "epoch": 0.96, "learning_rate": 6.573393847130849e-08, "loss": 0.821, "step": 6944 }, { "epoch": 0.96, "learning_rate": 6.521994912070284e-08, "loss": 0.7769, "step": 6945 }, { "epoch": 0.96, "learning_rate": 6.470797059340506e-08, "loss": 0.8403, "step": 6946 }, { "epoch": 0.96, "learning_rate": 6.419800299304225e-08, "loss": 0.8281, "step": 6947 }, { "epoch": 0.97, "learning_rate": 6.369004642282961e-08, "loss": 0.8428, "step": 6948 }, { "epoch": 0.97, "learning_rate": 6.318410098558158e-08, "loss": 0.8555, "step": 6949 }, { "epoch": 0.97, "learning_rate": 6.268016678370181e-08, "loss": 0.8245, "step": 6950 }, { "epoch": 0.97, "learning_rate": 6.217824391918759e-08, "loss": 0.5856, "step": 6951 }, { "epoch": 0.97, "learning_rate": 6.167833249362987e-08, "loss": 0.8125, "step": 6952 }, { "epoch": 0.97, "learning_rate": 6.118043260821104e-08, "loss": 0.7755, "step": 6953 }, { "epoch": 0.97, "learning_rate": 6.06845443637083e-08, "loss": 0.8105, "step": 6954 }, { "epoch": 0.97, "learning_rate": 6.019066786049022e-08, "loss": 0.8159, "step": 6955 }, { "epoch": 0.97, "learning_rate": 5.969880319851906e-08, "loss": 0.7455, "step": 6956 }, { "epoch": 0.97, "learning_rate": 5.9208950477347424e-08, "loss": 0.7423, "step": 6957 }, { "epoch": 0.97, "learning_rate": 5.872110979612489e-08, "loss": 0.8215, "step": 6958 }, { "epoch": 0.97, "learning_rate": 5.8235281253590235e-08, "loss": 0.8616, "step": 6959 }, { "epoch": 0.97, "learning_rate": 5.7751464948077044e-08, "loss": 0.825, "step": 6960 }, { "epoch": 0.97, "learning_rate": 5.726966097751141e-08, "loss": 0.7799, "step": 6961 }, { "epoch": 0.97, "learning_rate": 5.6789869439409785e-08, "loss": 0.8557, "step": 6962 }, { "epoch": 0.97, "learning_rate": 5.631209043088448e-08, "loss": 0.7822, "step": 6963 }, { "epoch": 0.97, "learning_rate": 5.5836324048640366e-08, "loss": 0.8325, "step": 6964 }, { "epoch": 0.97, "learning_rate": 5.536257038897041e-08, "loss": 0.7964, "step": 6965 }, { "epoch": 0.97, "learning_rate": 5.48908295477657e-08, "loss": 0.8191, "step": 6966 }, { "epoch": 0.97, "learning_rate": 5.442110162050762e-08, "loss": 0.7896, "step": 6967 }, { "epoch": 0.97, "learning_rate": 5.395338670227013e-08, "loss": 0.792, "step": 6968 }, { "epoch": 0.97, "learning_rate": 5.348768488771971e-08, "loss": 0.8091, "step": 6969 }, { "epoch": 0.97, "learning_rate": 5.302399627111432e-08, "loss": 0.7771, "step": 6970 }, { "epoch": 0.97, "learning_rate": 5.256232094630776e-08, "loss": 0.5583, "step": 6971 }, { "epoch": 0.97, "learning_rate": 5.210265900674305e-08, "loss": 0.7981, "step": 6972 }, { "epoch": 0.97, "learning_rate": 5.16450105454569e-08, "loss": 0.8706, "step": 6973 }, { "epoch": 0.97, "learning_rate": 5.118937565507853e-08, "loss": 0.8567, "step": 6974 }, { "epoch": 0.97, "learning_rate": 5.0735754427830855e-08, "loss": 0.7695, "step": 6975 }, { "epoch": 0.97, "learning_rate": 5.028414695552486e-08, "loss": 0.7747, "step": 6976 }, { "epoch": 0.97, "learning_rate": 4.9834553329569656e-08, "loss": 0.5984, "step": 6977 }, { "epoch": 0.97, "learning_rate": 4.9386973640962456e-08, "loss": 0.8145, "step": 6978 }, { "epoch": 0.97, "learning_rate": 4.894140798029634e-08, "loss": 0.8218, "step": 6979 }, { "epoch": 0.97, "learning_rate": 4.8497856437753624e-08, "loss": 0.7991, "step": 6980 }, { "epoch": 0.97, "learning_rate": 4.805631910311026e-08, "loss": 0.8369, "step": 6981 }, { "epoch": 0.97, "learning_rate": 4.7616796065733664e-08, "loss": 0.8206, "step": 6982 }, { "epoch": 0.97, "learning_rate": 4.7179287414586e-08, "loss": 0.772, "step": 6983 }, { "epoch": 0.97, "learning_rate": 4.674379323821865e-08, "loss": 0.8577, "step": 6984 }, { "epoch": 0.97, "learning_rate": 4.631031362477778e-08, "loss": 0.7769, "step": 6985 }, { "epoch": 0.97, "learning_rate": 4.587884866199988e-08, "loss": 0.7349, "step": 6986 }, { "epoch": 0.97, "learning_rate": 4.5449398437215074e-08, "loss": 0.5805, "step": 6987 }, { "epoch": 0.97, "learning_rate": 4.5021963037344964e-08, "loss": 0.7717, "step": 6988 }, { "epoch": 0.97, "learning_rate": 4.4596542548903666e-08, "loss": 0.7849, "step": 6989 }, { "epoch": 0.97, "learning_rate": 4.417313705799675e-08, "loss": 0.832, "step": 6990 }, { "epoch": 0.97, "learning_rate": 4.3751746650322336e-08, "loss": 0.8378, "step": 6991 }, { "epoch": 0.97, "learning_rate": 4.333237141117219e-08, "loss": 0.783, "step": 6992 }, { "epoch": 0.97, "learning_rate": 4.291501142542842e-08, "loss": 0.7708, "step": 6993 }, { "epoch": 0.97, "learning_rate": 4.249966677756345e-08, "loss": 0.7931, "step": 6994 }, { "epoch": 0.97, "learning_rate": 4.208633755164782e-08, "loss": 0.8347, "step": 6995 }, { "epoch": 0.97, "learning_rate": 4.1675023831336816e-08, "loss": 0.8828, "step": 6996 }, { "epoch": 0.97, "learning_rate": 4.126572569988385e-08, "loss": 0.8285, "step": 6997 }, { "epoch": 0.97, "learning_rate": 4.085844324013044e-08, "loss": 0.7686, "step": 6998 }, { "epoch": 0.97, "learning_rate": 4.045317653451175e-08, "loss": 0.7731, "step": 6999 }, { "epoch": 0.97, "learning_rate": 4.00499256650555e-08, "loss": 0.7925, "step": 7000 }, { "epoch": 0.97, "learning_rate": 3.964869071337973e-08, "loss": 0.8171, "step": 7001 }, { "epoch": 0.97, "learning_rate": 3.9249471760696154e-08, "loss": 0.7952, "step": 7002 }, { "epoch": 0.97, "learning_rate": 3.885226888780791e-08, "loss": 0.8406, "step": 7003 }, { "epoch": 0.97, "learning_rate": 3.845708217510735e-08, "loss": 0.877, "step": 7004 }, { "epoch": 0.97, "learning_rate": 3.806391170258494e-08, "loss": 0.8669, "step": 7005 }, { "epoch": 0.97, "learning_rate": 3.7672757549815916e-08, "loss": 0.8002, "step": 7006 }, { "epoch": 0.97, "learning_rate": 3.7283619795972503e-08, "loss": 0.8162, "step": 7007 }, { "epoch": 0.97, "learning_rate": 3.6896498519817246e-08, "loss": 0.7556, "step": 7008 }, { "epoch": 0.97, "learning_rate": 3.6511393799704146e-08, "loss": 0.7555, "step": 7009 }, { "epoch": 0.97, "learning_rate": 3.612830571357862e-08, "loss": 0.8499, "step": 7010 }, { "epoch": 0.97, "learning_rate": 3.574723433897975e-08, "loss": 0.7629, "step": 7011 }, { "epoch": 0.97, "learning_rate": 3.536817975303697e-08, "loss": 0.7839, "step": 7012 }, { "epoch": 0.97, "learning_rate": 3.499114203247111e-08, "loss": 0.7889, "step": 7013 }, { "epoch": 0.97, "learning_rate": 3.461612125359559e-08, "loss": 0.5867, "step": 7014 }, { "epoch": 0.97, "learning_rate": 3.424311749231746e-08, "loss": 0.8767, "step": 7015 }, { "epoch": 0.97, "learning_rate": 3.387213082413077e-08, "loss": 0.7988, "step": 7016 }, { "epoch": 0.97, "learning_rate": 3.3503161324125456e-08, "loss": 0.7708, "step": 7017 }, { "epoch": 0.97, "learning_rate": 3.313620906698289e-08, "loss": 0.8066, "step": 7018 }, { "epoch": 0.97, "learning_rate": 3.2771274126972566e-08, "loss": 0.7642, "step": 7019 }, { "epoch": 0.98, "learning_rate": 3.240835657796093e-08, "loss": 0.8276, "step": 7020 }, { "epoch": 0.98, "learning_rate": 3.2047456493401465e-08, "loss": 0.8882, "step": 7021 }, { "epoch": 0.98, "learning_rate": 3.1688573946341287e-08, "loss": 0.5652, "step": 7022 }, { "epoch": 0.98, "learning_rate": 3.133170900942117e-08, "loss": 0.8218, "step": 7023 }, { "epoch": 0.98, "learning_rate": 3.097686175486781e-08, "loss": 0.8076, "step": 7024 }, { "epoch": 0.98, "learning_rate": 3.062403225450705e-08, "loss": 0.7959, "step": 7025 }, { "epoch": 0.98, "learning_rate": 3.0273220579749576e-08, "loss": 0.7236, "step": 7026 }, { "epoch": 0.98, "learning_rate": 2.9924426801601906e-08, "loss": 0.7852, "step": 7027 }, { "epoch": 0.98, "learning_rate": 2.957765099065979e-08, "loss": 0.7805, "step": 7028 }, { "epoch": 0.98, "learning_rate": 2.9232893217112646e-08, "loss": 0.7751, "step": 7029 }, { "epoch": 0.98, "learning_rate": 2.8890153550739097e-08, "loss": 0.8011, "step": 7030 }, { "epoch": 0.98, "learning_rate": 2.854943206091143e-08, "loss": 0.772, "step": 7031 }, { "epoch": 0.98, "learning_rate": 2.821072881659226e-08, "loss": 0.5251, "step": 7032 }, { "epoch": 0.98, "learning_rate": 2.7874043886335632e-08, "loss": 0.875, "step": 7033 }, { "epoch": 0.98, "learning_rate": 2.7539377338287043e-08, "loss": 0.8213, "step": 7034 }, { "epoch": 0.98, "learning_rate": 2.7206729240185635e-08, "loss": 0.8083, "step": 7035 }, { "epoch": 0.98, "learning_rate": 2.6876099659357558e-08, "loss": 0.8136, "step": 7036 }, { "epoch": 0.98, "learning_rate": 2.654748866272483e-08, "loss": 0.7499, "step": 7037 }, { "epoch": 0.98, "learning_rate": 2.6220896316798694e-08, "loss": 0.7651, "step": 7038 }, { "epoch": 0.98, "learning_rate": 2.589632268768072e-08, "loss": 0.8005, "step": 7039 }, { "epoch": 0.98, "learning_rate": 2.5573767841068353e-08, "loss": 0.8281, "step": 7040 }, { "epoch": 0.98, "learning_rate": 2.525323184224493e-08, "loss": 0.767, "step": 7041 }, { "epoch": 0.98, "learning_rate": 2.4934714756089663e-08, "loss": 0.8386, "step": 7042 }, { "epoch": 0.98, "learning_rate": 2.461821664706987e-08, "loss": 0.8567, "step": 7043 }, { "epoch": 0.98, "learning_rate": 2.4303737579245423e-08, "loss": 0.8245, "step": 7044 }, { "epoch": 0.98, "learning_rate": 2.399127761626874e-08, "loss": 0.8562, "step": 7045 }, { "epoch": 0.98, "learning_rate": 2.3680836821381447e-08, "loss": 0.8396, "step": 7046 }, { "epoch": 0.98, "learning_rate": 2.3372415257417735e-08, "loss": 0.8452, "step": 7047 }, { "epoch": 0.98, "learning_rate": 2.306601298680322e-08, "loss": 0.8229, "step": 7048 }, { "epoch": 0.98, "learning_rate": 2.2761630071553853e-08, "loss": 0.7756, "step": 7049 }, { "epoch": 0.98, "learning_rate": 2.2459266573278127e-08, "loss": 0.782, "step": 7050 }, { "epoch": 0.98, "learning_rate": 2.2158922553174866e-08, "loss": 0.5716, "step": 7051 }, { "epoch": 0.98, "learning_rate": 2.1860598072034333e-08, "loss": 0.843, "step": 7052 }, { "epoch": 0.98, "learning_rate": 2.1564293190238228e-08, "loss": 0.5558, "step": 7053 }, { "epoch": 0.98, "learning_rate": 2.1270007967758578e-08, "loss": 0.7981, "step": 7054 }, { "epoch": 0.98, "learning_rate": 2.0977742464161066e-08, "loss": 0.8359, "step": 7055 }, { "epoch": 0.98, "learning_rate": 2.068749673859949e-08, "loss": 0.8435, "step": 7056 }, { "epoch": 0.98, "learning_rate": 2.0399270849821297e-08, "loss": 0.7341, "step": 7057 }, { "epoch": 0.98, "learning_rate": 2.0113064856163155e-08, "loss": 0.7448, "step": 7058 }, { "epoch": 0.98, "learning_rate": 1.9828878815554287e-08, "loss": 0.7346, "step": 7059 }, { "epoch": 0.98, "learning_rate": 1.9546712785515344e-08, "loss": 0.8118, "step": 7060 }, { "epoch": 0.98, "learning_rate": 1.9266566823156197e-08, "loss": 0.7502, "step": 7061 }, { "epoch": 0.98, "learning_rate": 1.898844098517927e-08, "loss": 0.8428, "step": 7062 }, { "epoch": 0.98, "learning_rate": 1.8712335327878417e-08, "loss": 0.8154, "step": 7063 }, { "epoch": 0.98, "learning_rate": 1.843824990713783e-08, "loss": 0.7598, "step": 7064 }, { "epoch": 0.98, "learning_rate": 1.8166184778434238e-08, "loss": 0.7793, "step": 7065 }, { "epoch": 0.98, "learning_rate": 1.7896139996831374e-08, "loss": 0.842, "step": 7066 }, { "epoch": 0.98, "learning_rate": 1.762811561698996e-08, "loss": 0.7435, "step": 7067 }, { "epoch": 0.98, "learning_rate": 1.7362111693157712e-08, "loss": 0.7959, "step": 7068 }, { "epoch": 0.98, "learning_rate": 1.7098128279172676e-08, "loss": 0.8381, "step": 7069 }, { "epoch": 0.98, "learning_rate": 1.6836165428468776e-08, "loss": 0.7838, "step": 7070 }, { "epoch": 0.98, "learning_rate": 1.657622319406582e-08, "loss": 0.7888, "step": 7071 }, { "epoch": 0.98, "learning_rate": 1.6318301628578393e-08, "loss": 0.7974, "step": 7072 }, { "epoch": 0.98, "learning_rate": 1.6062400784208064e-08, "loss": 0.8074, "step": 7073 }, { "epoch": 0.98, "learning_rate": 1.5808520712752297e-08, "loss": 0.7572, "step": 7074 }, { "epoch": 0.98, "learning_rate": 1.5556661465594426e-08, "loss": 0.7549, "step": 7075 }, { "epoch": 0.98, "learning_rate": 1.5306823093713673e-08, "loss": 0.8, "step": 7076 }, { "epoch": 0.98, "learning_rate": 1.505900564767737e-08, "loss": 0.7938, "step": 7077 }, { "epoch": 0.98, "learning_rate": 1.4813209177644283e-08, "loss": 0.7896, "step": 7078 }, { "epoch": 0.98, "learning_rate": 1.4569433733363503e-08, "loss": 0.8401, "step": 7079 }, { "epoch": 0.98, "learning_rate": 1.4327679364175562e-08, "loss": 0.813, "step": 7080 }, { "epoch": 0.98, "learning_rate": 1.408794611901354e-08, "loss": 0.7756, "step": 7081 }, { "epoch": 0.98, "learning_rate": 1.3850234046399735e-08, "loss": 0.7991, "step": 7082 }, { "epoch": 0.98, "learning_rate": 1.3614543194446772e-08, "loss": 0.8525, "step": 7083 }, { "epoch": 0.98, "learning_rate": 1.3380873610859823e-08, "loss": 0.583, "step": 7084 }, { "epoch": 0.98, "learning_rate": 1.3149225342933281e-08, "loss": 0.8071, "step": 7085 }, { "epoch": 0.98, "learning_rate": 1.2919598437554081e-08, "loss": 0.7894, "step": 7086 }, { "epoch": 0.98, "learning_rate": 1.2691992941198384e-08, "loss": 0.8169, "step": 7087 }, { "epoch": 0.98, "learning_rate": 1.2466408899936e-08, "loss": 0.7385, "step": 7088 }, { "epoch": 0.98, "learning_rate": 1.2242846359423743e-08, "loss": 0.832, "step": 7089 }, { "epoch": 0.98, "learning_rate": 1.2021305364910974e-08, "loss": 0.8145, "step": 7090 }, { "epoch": 0.98, "learning_rate": 1.1801785961240709e-08, "loss": 0.8311, "step": 7091 }, { "epoch": 0.99, "learning_rate": 1.1584288192841853e-08, "loss": 0.78, "step": 7092 }, { "epoch": 0.99, "learning_rate": 1.136881210373697e-08, "loss": 0.843, "step": 7093 }, { "epoch": 0.99, "learning_rate": 1.1155357737538953e-08, "loss": 0.8398, "step": 7094 }, { "epoch": 0.99, "learning_rate": 1.0943925137451017e-08, "loss": 0.7925, "step": 7095 }, { "epoch": 0.99, "learning_rate": 1.0734514346268932e-08, "loss": 0.842, "step": 7096 }, { "epoch": 0.99, "learning_rate": 1.052712540637768e-08, "loss": 0.8384, "step": 7097 }, { "epoch": 0.99, "learning_rate": 1.0321758359752576e-08, "loss": 0.823, "step": 7098 }, { "epoch": 0.99, "learning_rate": 1.0118413247960368e-08, "loss": 0.8357, "step": 7099 }, { "epoch": 0.99, "learning_rate": 9.917090112160355e-09, "loss": 0.74, "step": 7100 }, { "epoch": 0.99, "learning_rate": 9.71778899309772e-09, "loss": 0.8845, "step": 7101 }, { "epoch": 0.99, "learning_rate": 9.520509931113531e-09, "loss": 0.7961, "step": 7102 }, { "epoch": 0.99, "learning_rate": 9.325252966136955e-09, "loss": 0.7579, "step": 7103 }, { "epoch": 0.99, "learning_rate": 9.132018137689713e-09, "loss": 0.5956, "step": 7104 }, { "epoch": 0.99, "learning_rate": 8.940805484880521e-09, "loss": 0.7983, "step": 7105 }, { "epoch": 0.99, "learning_rate": 8.751615046413975e-09, "loss": 0.8086, "step": 7106 }, { "epoch": 0.99, "learning_rate": 8.564446860580556e-09, "loss": 0.8008, "step": 7107 }, { "epoch": 0.99, "learning_rate": 8.379300965264403e-09, "loss": 0.7859, "step": 7108 }, { "epoch": 0.99, "learning_rate": 8.196177397939986e-09, "loss": 0.8071, "step": 7109 }, { "epoch": 0.99, "learning_rate": 8.0150761956721e-09, "loss": 0.8396, "step": 7110 }, { "epoch": 0.99, "learning_rate": 7.835997395113648e-09, "loss": 0.8054, "step": 7111 }, { "epoch": 0.99, "learning_rate": 7.658941032513411e-09, "loss": 0.7888, "step": 7112 }, { "epoch": 0.99, "learning_rate": 7.48390714370717e-09, "loss": 0.7542, "step": 7113 }, { "epoch": 0.99, "learning_rate": 7.310895764122139e-09, "loss": 0.7981, "step": 7114 }, { "epoch": 0.99, "learning_rate": 7.139906928775864e-09, "loss": 0.8035, "step": 7115 }, { "epoch": 0.99, "learning_rate": 6.970940672276216e-09, "loss": 0.823, "step": 7116 }, { "epoch": 0.99, "learning_rate": 6.803997028824727e-09, "loss": 0.7949, "step": 7117 }, { "epoch": 0.99, "learning_rate": 6.6390760322088134e-09, "loss": 0.8342, "step": 7118 }, { "epoch": 0.99, "learning_rate": 6.476177715810661e-09, "loss": 0.8131, "step": 7119 }, { "epoch": 0.99, "learning_rate": 6.315302112600563e-09, "loss": 0.7971, "step": 7120 }, { "epoch": 0.99, "learning_rate": 6.156449255139141e-09, "loss": 0.825, "step": 7121 }, { "epoch": 0.99, "learning_rate": 5.999619175579563e-09, "loss": 0.6003, "step": 7122 }, { "epoch": 0.99, "learning_rate": 5.844811905665326e-09, "loss": 0.7524, "step": 7123 }, { "epoch": 0.99, "learning_rate": 5.692027476728035e-09, "loss": 0.782, "step": 7124 }, { "epoch": 0.99, "learning_rate": 5.54126591969295e-09, "loss": 0.8013, "step": 7125 }, { "epoch": 0.99, "learning_rate": 5.392527265074554e-09, "loss": 0.8777, "step": 7126 }, { "epoch": 0.99, "learning_rate": 5.2458115429776524e-09, "loss": 0.809, "step": 7127 }, { "epoch": 0.99, "learning_rate": 5.101118783097381e-09, "loss": 0.7434, "step": 7128 }, { "epoch": 0.99, "learning_rate": 4.958449014720312e-09, "loss": 0.7839, "step": 7129 }, { "epoch": 0.99, "learning_rate": 4.817802266723348e-09, "loss": 0.8235, "step": 7130 }, { "epoch": 0.99, "learning_rate": 4.679178567572607e-09, "loss": 0.7797, "step": 7131 }, { "epoch": 0.99, "learning_rate": 4.542577945327864e-09, "loss": 0.7957, "step": 7132 }, { "epoch": 0.99, "learning_rate": 4.408000427635895e-09, "loss": 0.7942, "step": 7133 }, { "epoch": 0.99, "learning_rate": 4.27544604173602e-09, "loss": 0.7805, "step": 7134 }, { "epoch": 0.99, "learning_rate": 4.14491481445789e-09, "loss": 0.8005, "step": 7135 }, { "epoch": 0.99, "learning_rate": 4.016406772220372e-09, "loss": 0.8135, "step": 7136 }, { "epoch": 0.99, "learning_rate": 3.8899219410337695e-09, "loss": 0.8145, "step": 7137 }, { "epoch": 0.99, "learning_rate": 3.765460346500938e-09, "loss": 0.8335, "step": 7138 }, { "epoch": 0.99, "learning_rate": 3.6430220138106153e-09, "loss": 0.7584, "step": 7139 }, { "epoch": 0.99, "learning_rate": 3.5226069677463113e-09, "loss": 0.537, "step": 7140 }, { "epoch": 0.99, "learning_rate": 3.4042152326796418e-09, "loss": 0.7759, "step": 7141 }, { "epoch": 0.99, "learning_rate": 3.28784683257255e-09, "loss": 0.5649, "step": 7142 }, { "epoch": 0.99, "learning_rate": 3.1735017909806377e-09, "loss": 0.7253, "step": 7143 }, { "epoch": 0.99, "learning_rate": 3.0611801310453937e-09, "loss": 0.7993, "step": 7144 }, { "epoch": 0.99, "learning_rate": 2.9508818755019653e-09, "loss": 0.845, "step": 7145 }, { "epoch": 0.99, "learning_rate": 2.842607046674717e-09, "loss": 0.7888, "step": 7146 }, { "epoch": 0.99, "learning_rate": 2.736355666479451e-09, "loss": 0.7937, "step": 7147 }, { "epoch": 0.99, "learning_rate": 2.632127756421188e-09, "loss": 0.8457, "step": 7148 }, { "epoch": 0.99, "learning_rate": 2.5299233375952746e-09, "loss": 0.822, "step": 7149 }, { "epoch": 0.99, "learning_rate": 2.4297424306884978e-09, "loss": 0.8401, "step": 7150 }, { "epoch": 0.99, "learning_rate": 2.3315850559779696e-09, "loss": 0.8411, "step": 7151 }, { "epoch": 0.99, "learning_rate": 2.2354512333311317e-09, "loss": 0.8149, "step": 7152 }, { "epoch": 0.99, "learning_rate": 2.141340982205753e-09, "loss": 0.8051, "step": 7153 }, { "epoch": 0.99, "learning_rate": 2.049254321648819e-09, "loss": 0.7759, "step": 7154 }, { "epoch": 0.99, "learning_rate": 1.959191270299865e-09, "loss": 0.8193, "step": 7155 }, { "epoch": 0.99, "learning_rate": 1.8711518463887522e-09, "loss": 0.7561, "step": 7156 }, { "epoch": 0.99, "learning_rate": 1.7851360677334506e-09, "loss": 0.7869, "step": 7157 }, { "epoch": 0.99, "learning_rate": 1.701143951743367e-09, "loss": 0.5479, "step": 7158 }, { "epoch": 0.99, "learning_rate": 1.619175515420457e-09, "loss": 0.7676, "step": 7159 }, { "epoch": 0.99, "learning_rate": 1.5392307753536728e-09, "loss": 0.8167, "step": 7160 }, { "epoch": 0.99, "learning_rate": 1.4613097477256255e-09, "loss": 0.8475, "step": 7161 }, { "epoch": 0.99, "learning_rate": 1.3854124483059228e-09, "loss": 0.8567, "step": 7162 }, { "epoch": 0.99, "learning_rate": 1.311538892457831e-09, "loss": 0.8337, "step": 7163 }, { "epoch": 1.0, "learning_rate": 1.2396890951327235e-09, "loss": 0.8335, "step": 7164 }, { "epoch": 1.0, "learning_rate": 1.1698630708734115e-09, "loss": 0.7842, "step": 7165 }, { "epoch": 1.0, "learning_rate": 1.1020608338130346e-09, "loss": 0.7783, "step": 7166 }, { "epoch": 1.0, "learning_rate": 1.0362823976750592e-09, "loss": 0.777, "step": 7167 }, { "epoch": 1.0, "learning_rate": 9.725277757721697e-10, "loss": 0.5941, "step": 7168 }, { "epoch": 1.0, "learning_rate": 9.107969810095984e-10, "loss": 0.8164, "step": 7169 }, { "epoch": 1.0, "learning_rate": 8.510900258817955e-10, "loss": 0.5382, "step": 7170 }, { "epoch": 1.0, "learning_rate": 7.934069224724284e-10, "loss": 0.7769, "step": 7171 }, { "epoch": 1.0, "learning_rate": 7.377476824577124e-10, "loss": 0.8433, "step": 7172 }, { "epoch": 1.0, "learning_rate": 6.841123171030805e-10, "loss": 0.8123, "step": 7173 }, { "epoch": 1.0, "learning_rate": 6.325008372642937e-10, "loss": 0.7739, "step": 7174 }, { "epoch": 1.0, "learning_rate": 5.829132533874404e-10, "loss": 0.5891, "step": 7175 }, { "epoch": 1.0, "learning_rate": 5.353495755100469e-10, "loss": 0.8335, "step": 7176 }, { "epoch": 1.0, "learning_rate": 4.898098132577467e-10, "loss": 0.808, "step": 7177 }, { "epoch": 1.0, "learning_rate": 4.462939758487217e-10, "loss": 0.7642, "step": 7178 }, { "epoch": 1.0, "learning_rate": 4.0480207209037113e-10, "loss": 0.7971, "step": 7179 }, { "epoch": 1.0, "learning_rate": 3.653341103815322e-10, "loss": 0.8313, "step": 7180 }, { "epoch": 1.0, "learning_rate": 3.2789009871025955e-10, "loss": 0.8118, "step": 7181 }, { "epoch": 1.0, "learning_rate": 2.924700446549356e-10, "loss": 0.8237, "step": 7182 }, { "epoch": 1.0, "learning_rate": 2.590739553842703e-10, "loss": 0.8604, "step": 7183 }, { "epoch": 1.0, "learning_rate": 2.277018376584117e-10, "loss": 0.8098, "step": 7184 }, { "epoch": 1.0, "learning_rate": 1.9835369782783553e-10, "loss": 0.5798, "step": 7185 }, { "epoch": 1.0, "learning_rate": 1.7102954183112475e-10, "loss": 0.7759, "step": 7186 }, { "epoch": 1.0, "learning_rate": 1.4572937519941045e-10, "loss": 0.823, "step": 7187 }, { "epoch": 1.0, "learning_rate": 1.2245320305415143e-10, "loss": 0.8389, "step": 7188 }, { "epoch": 1.0, "learning_rate": 1.0120103010491378e-10, "loss": 0.7864, "step": 7189 }, { "epoch": 1.0, "learning_rate": 8.197286065492194e-11, "loss": 0.8862, "step": 7190 }, { "epoch": 1.0, "learning_rate": 6.476869859550761e-11, "loss": 0.7869, "step": 7191 }, { "epoch": 1.0, "learning_rate": 4.958854740833019e-11, "loss": 0.7844, "step": 7192 }, { "epoch": 1.0, "learning_rate": 3.64324101653768e-11, "loss": 0.834, "step": 7193 }, { "epoch": 1.0, "learning_rate": 2.5300289531182688e-11, "loss": 0.8691, "step": 7194 }, { "epoch": 1.0, "learning_rate": 1.6192187758390376e-11, "loss": 0.8962, "step": 7195 }, { "epoch": 1.0, "learning_rate": 9.108106688859863e-12, "loss": 0.8594, "step": 7196 }, { "epoch": 1.0, "learning_rate": 4.048047759219742e-12, "loss": 0.8352, "step": 7197 }, { "epoch": 1.0, "learning_rate": 1.0120119908751946e-12, "loss": 0.6143, "step": 7198 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 0.6482, "step": 7199 }, { "epoch": 1.0, "step": 7199, "total_flos": 2.055508174842521e+19, "train_loss": 0.8389650141634797, "train_runtime": 142923.3146, "train_samples_per_second": 6.447, "train_steps_per_second": 0.05 } ], "max_steps": 7199, "num_train_epochs": 1, "total_flos": 2.055508174842521e+19, "trial_name": null, "trial_params": null }